diff --git a/.env.example b/.env.example
index 865d3de1..0b3be8d3 100644
--- a/.env.example
+++ b/.env.example
@@ -118,6 +118,20 @@ BOOTSTRAP_ADMIN_PASSWORD=your-secure-password
 # TURNSTILE_SITE_KEY=your-site-key
 # TURNSTILE_SECRET_KEY=your-secret-key
 
+# =============================================================================
+# LLM / AI providers
+# =============================================================================
+# LLM credentials are managed per-DJ via the gateway connector system
+# (admin: /admin/ai, DJ: /settings/ai) — there is NO env-var credential path.
+# The recommendation engine routes every call through the gateway, which
+# resolves the actor DJ's connector (or the org default).
+#
+# Historical note: the one-shot Alembic data migration (046_admin_ai_oauth)
+# reads ANTHROPIC_API_KEY *once* on first upgrade, converting it into a
+# system-default "anthropic_apikey" connector. Once that migration has run on a
+# deploy, the env var is no longer consumed at runtime and can be dropped. The
+# legacy env-var fallback in the recommendation engine was removed in #343.
+
 # =============================================================================
 # Frontend (Next.js)
 # =============================================================================
diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml
index bcbc48f8..fa20bef7 100644
--- a/.github/workflows/ci.yml
+++ b/.github/workflows/ci.yml
@@ -65,7 +65,17 @@ jobs:
         #   PYSEC-2025-183 (pyjwt 2.10.1+ weak encryption, DISPUTED) - no fix released, the
         #                  pyjwt maintainers contest the advisory. We already pin pyjwt to the
         #                  latest available (2.12.1). Revisit when an upstream fix lands.
-        run: pip-audit --ignore-vuln CVE-2024-23342 --ignore-vuln CVE-2026-3219 --ignore-vuln CVE-2026-6357 --ignore-vuln PYSEC-2025-183
+        #   MAL-2026-4750  (fastapi 0.136.3 "malicious code", WITHDRAWN by OSV 2026-05-26) -
+        #                  False positive. 0.136.3 is an official tiangolo release; the flagged
+        #                  dependency 'fastar' is a legitimate Rust-tar-bindings package
+        #                  (published Oct 2025, predates the release) and is pulled ONLY via
+        #                  fastapi's [standard] extra, which we do NOT install (we use plain
+        #                  fastapi + uvicorn[standard]) - so it never enters our dependency tree.
+        #                  We deliberately stay on 0.136.3 for its underscore-header rejection
+        #                  (PR #15589) and SSE field validation (PR #15588). OSV withdrew the
+        #                  advisory; pip-audit's feed still serves it. REMOVE this ignore once
+        #                  the withdrawn entry is purged from the feed.
+        run: pip-audit --ignore-vuln CVE-2024-23342 --ignore-vuln CVE-2026-3219 --ignore-vuln CVE-2026-6357 --ignore-vuln PYSEC-2025-183 --ignore-vuln MAL-2026-4750
 
       - name: Run tests with coverage
         env:
diff --git a/CLAUDE.md b/CLAUDE.md
index e5895382..2758f1c2 100644
--- a/CLAUDE.md
+++ b/CLAUDE.md
@@ -66,7 +66,7 @@ NEXT_PUBLIC_API_URL="http://LAN_IP:8000" npm run dev
 - Encryption: `TOKEN_ENCRYPTION_KEY` (Fernet, 44 chars base64) — required in production for OAuth token encryption
 - Beatport: `BEATPORT_CLIENT_ID`, `BEATPORT_CLIENT_SECRET`, `BEATPORT_REDIRECT_URI`, `BEATPORT_AUTH_BASE_URL`
 - Soundcharts: `SOUNDCHARTS_APP_ID`, `SOUNDCHARTS_API_KEY` (song discovery for recommendations)
-- Anthropic (LLM recommendations): `ANTHROPIC_API_KEY`, `ANTHROPIC_MODEL` (default: `claude-haiku-4-5-20251001`), `ANTHROPIC_MAX_TOKENS`, `ANTHROPIC_TIMEOUT_SECONDS`
+- Anthropic (LLM recommendations): credentials live in the LLM Gateway connector system — there is **no env-var credential path**. The one-shot Alembic migration `046_admin_ai_oauth` reads `ANTHROPIC_API_KEY` *once* on first upgrade to seed a connector; the legacy env-var fallback in the recommendation engine was removed in #343. `ANTHROPIC_MODEL` (default: `claude-haiku-4-5-20251001`) is retained only as the default model-name label on recommendation responses and for the admin AI-settings/model-listing endpoints. The `ANTHROPIC_MAX_TOKENS` / `ANTHROPIC_TIMEOUT_SECONDS` settings were removed.
 
 ## Running CI Checks Locally
 
@@ -312,13 +312,32 @@ REJECTED → NEW (re-open)
 - `server/app/services/track_normalizer.py` — track normalization & remix detection
 - `server/app/services/version_filter.py` — filters unwanted versions (karaoke, demo) with fuzzy matching
 
+### LLM Gateway (provider-agnostic dispatch)
+- `server/app/services/llm/` — connector-based dispatch usable by any agentic feature:
+  - `gateway.py` — `Gateway.dispatch(db, actor, request, *, purpose)` resolves a connector (per-DJ MRU → org default → raise `NoLlmConfigured`) and routes through the matching adapter. Logs every call to `llm_call_log` (counts only — never prompt/completion content) and writes a `llm_audit_event` row for credential lifecycle events.
+  - `base.py` — canonical `ChatRequest` / `ChatResponse` / `ToolSpec` / `LlmAdapter` ABC
+  - `registry.py` — connector_type → adapter class lookup; auto-registers all adapters on import
+  - `tool_translation.py` — JSON-Schema ToolSpec ↔ per-provider tool/function shape + response parsers
+  - `url_validator.py` — validates custom OpenAI-compatible base URLs (HTTPS any host; HTTP loopback + RFC1918 only)
+  - `connector_storage.py` — CRUD + validation + audit/call logging helpers
+  - `exceptions.py` — `AuthInvalid` / `RateLimited` / `QuotaExceeded` / `ProviderUnavailable` / `ToolTranslationError` / `NoLlmConfigured`
+  - `adapters/openai_apikey.py` — OpenAI Platform API-key adapter (httpx-based)
+  - `adapters/openai_compatible.py` — Custom OpenAI-compatible endpoint (Hermes Agent, Ollama, vLLM, LMStudio)
+  - `adapters/anthropic_apikey.py` — Anthropic API-key adapter (uses the `anthropic` SDK)
+- Models: `LlmConnector` (encrypted credentials via `EncryptedText`), `LlmCallLog`, `LlmAuditEvent`
+- Admin endpoints (`/api/admin/llm/*`): connector policy, force-revoke, usage rollup
+- DJ endpoints (`/api/llm/connectors`): list/create/rotate/test/delete (rate-limited, scoped to current user)
+- Admin UI: `/admin/ai` (policy + per-DJ table + usage)
+- DJ UI: `/settings/ai` (connect/test/delete; includes Hermes onboarding for ChatGPT subscription path)
+- The recommendation engine routes through the gateway (`actor = event.created_by`, `purpose = "recommendation"`); `call_llm` now **requires** a `db` session — the legacy direct-Anthropic env-var fallback was removed in #343 (the connector system is the sole credential source).
+
 ### Recommendation Engine
 - `server/app/services/recommendation/` — multi-stage pipeline:
   - `service.py` — orchestrator: profile analysis → search → scoring → deduplication
   - `enrichment.py` — fills missing BPM/key/genre from Beatport/MusicBrainz/Tidal (for recommendations; request-level enrichment is in `sync/orchestrator.py`)
   - `scorer.py` — multi-dimensional scoring: BPM compatibility, harmonic mixing, genre affinity, artist diversity penalties
   - `camelot.py` — harmonic mixing wheel (Camelot key compatibility, half-time/double-time BPM)
-  - `llm_client.py` — Claude Haiku integration (6/min rate limit, forced tool_use schema for structured JSON)
+  - `llm_client.py` — gateway-backed query generation (forced `tool_use` schema for structured JSON; requires `db` — the legacy direct-Anthropic env-var fallback was removed in #343)
   - `llm_hooks.py` — structured response models for LLM queries
   - `template.py` — playlist-based template recommendations (DJ picks a Tidal/Beatport playlist as "vibe" source)
   - `mb_verify.py` — MusicBrainz artist verification to detect AI-generated filler tracks (cached in DB)
diff --git a/dashboard/app/(dj)/account/__tests__/page.test.tsx b/dashboard/app/(dj)/account/__tests__/page.test.tsx
index 0832b937..7c79abe2 100644
--- a/dashboard/app/(dj)/account/__tests__/page.test.tsx
+++ b/dashboard/app/(dj)/account/__tests__/page.test.tsx
@@ -27,6 +27,13 @@ const { mockGetMe, mockChangePassword, mockRequestEmailChange, mockUpdateMyPrefe
         changePassword: (...args: unknown[]) => changePassword(...args),
         requestEmailChange: (...args: unknown[]) => requestEmailChange(...args),
         updateMyPreferences: (...args: unknown[]) => updateMyPreferences(...args),
+        // The AI providers section (relocated from /settings/ai, #357) mounts
+        // inside the account page. Stub its API surface so the section can render
+        // without network access. getLlmPolicy rejects → fail-closed (no extra UI).
+        // These live on the shared mockApi object so vi.spyOn(mockApi, ...) in
+        // individual tests still rebinds the same reference the page calls.
+        listLlmConnectors: () => Promise.resolve([]),
+        getLlmPolicy: () => Promise.reject(new Error('forbidden')),
       },
     };
   });
@@ -58,6 +65,13 @@ describe('AccountPage', () => {
     });
   });
 
+  it('renders the relocated AI / Model providers section', async () => {
+    render(<AccountPage />);
+    await waitFor(() => {
+      expect(screen.getByText('AI / Model providers')).toBeInTheDocument();
+    });
+  });
+
   it('submits password change with correct payload', async () => {
     mockChangePassword.mockResolvedValue({ status: 'ok', message: 'Updated' });
     render(<AccountPage />);
diff --git a/dashboard/app/(dj)/account/page.tsx b/dashboard/app/(dj)/account/page.tsx
index 4191d22c..0c497b5f 100644
--- a/dashboard/app/(dj)/account/page.tsx
+++ b/dashboard/app/(dj)/account/page.tsx
@@ -6,6 +6,7 @@ import { useRouter } from 'next/navigation';
 
 import { useAuth } from '@/lib/auth';
 import { api } from '@/lib/api';
+import AiProvidersSection from '@/components/AiProvidersSection';
 
 export default function AccountPage() {
   const router = useRouter();
@@ -115,7 +116,7 @@ export default function AccountPage() {
   if (isLoading || !isAuthenticated) return null;
 
   return (
-    <main style={{ maxWidth: '480px', margin: '0 auto', padding: '2rem 1rem' }}>
+    <main style={{ maxWidth: '720px', margin: '0 auto', padding: '2rem 1rem' }}>
       <div style={{ display: 'flex', alignItems: 'center', gap: '1rem', marginBottom: '2rem' }}>
         <Link href="/dashboard" style={{ color: 'var(--text-secondary)', textDecoration: 'none', fontSize: '0.875rem' }}>
           ← Dashboard
@@ -223,6 +224,10 @@ export default function AccountPage() {
         )}
       </div>
 
+      <div style={{ background: 'var(--card)', borderRadius: '0.75rem', padding: '1.5rem', marginTop: '1.5rem' }}>
+        <AiProvidersSection />
+      </div>
+
       <div style={{ background: 'var(--card)', borderRadius: '0.75rem', padding: '1.5rem', marginTop: '1.5rem' }}>
         <h2 style={{ marginTop: 0, marginBottom: '1.25rem', fontSize: '1.1rem' }}>Guest Experience</h2>
         <label style={{ display: 'flex', alignItems: 'center', gap: '0.75rem' }}>
diff --git a/dashboard/app/(dj)/events/[code]/components/RecommendationsCard.tsx b/dashboard/app/(dj)/events/[code]/components/RecommendationsCard.tsx
index 7ff7d154..4d55ef69 100644
--- a/dashboard/app/(dj)/events/[code]/components/RecommendationsCard.tsx
+++ b/dashboard/app/(dj)/events/[code]/components/RecommendationsCard.tsx
@@ -234,7 +234,9 @@ export function RecommendationsCard({
     return false;
   })();
 
-  // Derive short display name from model ID (e.g., "claude-haiku-4-5-20251001" → "Haiku 4.5")
+  // Derive short display name from model ID (e.g., "claude-haiku-4-5-20251001" → "Haiku 4.5").
+  // Non-Anthropic models (gpt-5.x, gemini, grok, bedrock, …) fall back to the raw model id
+  // so the badge reflects whichever provider connector actually produced the suggestions.
   const modelDisplayName = (() => {
     if (!llmModel) return 'AI';
     const m = llmModel.toLowerCase();
@@ -250,7 +252,7 @@ export function RecommendationsCard({
       const ver = m.match(/opus-(\d+)-(\d+)/);
       return ver ? `Opus ${ver[1]}.${ver[2]}` : 'Opus';
     }
-    return 'AI';
+    return llmModel;
   })();
 
   const modeButtonStyle = (active: boolean) => ({
diff --git a/dashboard/app/admin/ai/__tests__/page.test.tsx b/dashboard/app/admin/ai/__tests__/page.test.tsx
index 83778b81..51e83de9 100644
--- a/dashboard/app/admin/ai/__tests__/page.test.tsx
+++ b/dashboard/app/admin/ai/__tests__/page.test.tsx
@@ -131,4 +131,526 @@ describe('AdminAISettingsPage', () => {
       expect(screen.getByText('Failed to load AI settings')).toBeInTheDocument();
     });
   });
+
+  it('renders connector policy + per-DJ connector cards when gateway data loads', async () => {
+    vi.spyOn(api, 'getAISettings').mockResolvedValue({
+      llm_enabled: true,
+      llm_model: 'claude-haiku-4-5-20251001',
+      llm_rate_limit_per_minute: 3,
+      api_key_configured: true,
+      api_key_masked: '...abcd',
+    });
+    vi.spyOn(api, 'getAIModels').mockResolvedValue({
+      models: [{ id: 'claude-haiku-4-5-20251001', name: 'Claude Haiku 4.5' }],
+    });
+    vi.spyOn(api, 'getAdminLlmPolicy').mockResolvedValue({
+      llm_apikey_connectors_enabled: true,
+      llm_compatible_connector_enabled: true,
+      llm_default_connector_id: null,
+      llm_call_log_retention_days: 30,
+    });
+    vi.spyOn(api, 'listAllLlmConnectors').mockResolvedValue([
+      {
+        id: 1,
+        user_id: 42,
+        dj_username: 'someDJ',
+        connector_type: 'openai_apikey',
+        display_name: 'My OpenAI',
+        status: 'active',
+        base_url_plain: null,
+        model_hint: 'gpt-5-mini',
+        created_at: '2026-05-01T00:00:00Z',
+        updated_at: '2026-05-01T00:00:00Z',
+        last_used_at: null,
+        last_error: null,
+        is_default: false,
+        last_health_check_at: null,
+        last_health_check_status: null,
+        monthly_token_cap: null,
+        current_month_tokens: 0,
+      },
+    ]);
+    vi.spyOn(api, 'getAdminLlmUsage').mockResolvedValue({
+      days: 30,
+      rows: [],
+    });
+
+    render(<AdminAISettingsPage />);
+
+    await waitFor(() =>
+      expect(screen.getByText('Connector policy')).toBeInTheDocument(),
+    );
+    expect(screen.getByText('Per-DJ connectors')).toBeInTheDocument();
+    expect(screen.getByText('someDJ')).toBeInTheDocument();
+    expect(screen.getByText(/Usage — last 30 days/)).toBeInTheDocument();
+  });
+
+  it('renders the audit trail card with seeded events', async () => {
+    vi.spyOn(api, 'getAISettings').mockResolvedValue({
+      llm_enabled: true,
+      llm_model: 'claude-haiku-4-5-20251001',
+      llm_rate_limit_per_minute: 3,
+      api_key_configured: true,
+      api_key_masked: '...abcd',
+    });
+    vi.spyOn(api, 'getAIModels').mockResolvedValue({ models: [] });
+    vi.spyOn(api, 'getAdminLlmPolicy').mockResolvedValue({
+      llm_apikey_connectors_enabled: true,
+      llm_compatible_connector_enabled: true,
+      llm_default_connector_id: null,
+      llm_call_log_retention_days: 30,
+    });
+    vi.spyOn(api, 'listAllLlmConnectors').mockResolvedValue([]);
+    vi.spyOn(api, 'getAdminLlmUsage').mockResolvedValue({ days: 30, rows: [] });
+    vi.spyOn(api, 'getAdminLlmAudit').mockResolvedValue({
+      rows: [
+        {
+          id: 1,
+          created_at: '2026-05-20T12:00:00Z',
+          event_type: 'connector_created',
+          actor_user_id: 42,
+          actor_username: 'someDJ',
+          target_connector_id: 7,
+          target_connector_display_name: 'My OpenAI',
+          notes: null,
+        },
+      ],
+      total: 1,
+      limit: 50,
+      offset: 0,
+    });
+
+    render(<AdminAISettingsPage />);
+
+    await waitFor(() =>
+      expect(screen.getByText('Audit trail')).toBeInTheDocument(),
+    );
+    expect(screen.getByText('connector_created')).toBeInTheDocument();
+    expect(screen.getByText('My OpenAI')).toBeInTheDocument();
+    // someDJ appears in the audit row (no connectors table rows to collide)
+    expect(screen.getByText('someDJ')).toBeInTheDocument();
+    // Filter + export controls
+    expect(screen.getByLabelText('Event type')).toBeInTheDocument();
+    expect(screen.getByText('Export CSV')).toBeInTheDocument();
+  });
+
+  it('refetches audit events when the event-type filter changes', async () => {
+    vi.spyOn(api, 'getAISettings').mockResolvedValue({
+      llm_enabled: true,
+      llm_model: 'claude-haiku-4-5-20251001',
+      llm_rate_limit_per_minute: 3,
+      api_key_configured: true,
+      api_key_masked: '...abcd',
+    });
+    vi.spyOn(api, 'getAIModels').mockResolvedValue({ models: [] });
+    vi.spyOn(api, 'getAdminLlmPolicy').mockResolvedValue({
+      llm_apikey_connectors_enabled: true,
+      llm_compatible_connector_enabled: true,
+      llm_default_connector_id: null,
+      llm_call_log_retention_days: 30,
+    });
+    vi.spyOn(api, 'listAllLlmConnectors').mockResolvedValue([]);
+    vi.spyOn(api, 'getAdminLlmUsage').mockResolvedValue({ days: 30, rows: [] });
+    const auditSpy = vi.spyOn(api, 'getAdminLlmAudit').mockResolvedValue({
+      rows: [],
+      total: 0,
+      limit: 50,
+      offset: 0,
+    });
+    const exportSpy = vi
+      .spyOn(api, 'downloadAdminLlmAuditCsv')
+      .mockResolvedValue(new Blob(['ok'], { type: 'text/csv' }));
+    // jsdom doesn't implement these — handleExportCsv triggers a browser download.
+    const createObjectURL = vi.fn(() => 'blob:mock');
+    const revokeObjectURL = vi.fn();
+    vi.stubGlobal('URL', { ...URL, createObjectURL, revokeObjectURL });
+
+    try {
+      render(<AdminAISettingsPage />);
+
+      await waitFor(() => expect(screen.getByText('Audit trail')).toBeInTheDocument());
+      auditSpy.mockClear();
+
+      fireEvent.change(screen.getByLabelText('Event type'), {
+        target: { value: 'connector_credentials_rotated' },
+      });
+
+      await waitFor(() =>
+        expect(auditSpy).toHaveBeenCalledWith(
+          expect.objectContaining({ event_type: 'connector_credentials_rotated' }),
+        ),
+      );
+
+      // CSV export must honor the active event-type filter.
+      fireEvent.click(screen.getByText('Export CSV'));
+      await waitFor(() =>
+        expect(exportSpy).toHaveBeenCalledWith(
+          expect.objectContaining({ event_type: 'connector_credentials_rotated' }),
+        ),
+      );
+    } finally {
+      // Guarantee the URL stub is restored even if an assertion fails early,
+      // so it can't leak into later tests.
+      vi.unstubAllGlobals();
+    }
+  });
+
+  it('force-revokes a connector via the admin table', async () => {
+    vi.spyOn(api, 'getAISettings').mockResolvedValue({
+      llm_enabled: true,
+      llm_model: 'claude-haiku-4-5-20251001',
+      llm_rate_limit_per_minute: 3,
+      api_key_configured: true,
+      api_key_masked: '...abcd',
+    });
+    vi.spyOn(api, 'getAIModels').mockResolvedValue({ models: [] });
+    vi.spyOn(api, 'getAdminLlmPolicy').mockResolvedValue({
+      llm_apikey_connectors_enabled: true,
+      llm_compatible_connector_enabled: true,
+      llm_default_connector_id: null,
+      llm_call_log_retention_days: 30,
+    });
+    vi.spyOn(api, 'listAllLlmConnectors').mockResolvedValue([
+      {
+        id: 9,
+        user_id: 42,
+        dj_username: 'badDJ',
+        connector_type: 'openai_apikey',
+        display_name: 'Compromised',
+        status: 'active',
+        base_url_plain: null,
+        model_hint: null,
+        created_at: '2026-05-01T00:00:00Z',
+        updated_at: '2026-05-01T00:00:00Z',
+        last_used_at: null,
+        last_error: null,
+        is_default: false,
+        last_health_check_at: null,
+        last_health_check_status: null,
+        monthly_token_cap: null,
+        current_month_tokens: 0,
+      },
+    ]);
+    vi.spyOn(api, 'getAdminLlmUsage').mockResolvedValue({ days: 30, rows: [] });
+    const revokeSpy = vi.spyOn(api, 'revokeAdminLlmConnector').mockResolvedValue({
+      id: 9,
+      user_id: 42,
+      dj_username: 'badDJ',
+      connector_type: 'openai_apikey',
+      display_name: 'Compromised',
+      status: 'disabled',
+      base_url_plain: null,
+      model_hint: null,
+      created_at: '2026-05-01T00:00:00Z',
+      updated_at: '2026-05-01T00:00:00Z',
+      last_used_at: null,
+      last_error: null,
+      is_default: false,
+      last_health_check_at: null,
+      last_health_check_status: null,
+      monthly_token_cap: null,
+      current_month_tokens: 0,
+    });
+    vi.spyOn(window, 'confirm').mockReturnValue(true);
+
+    render(<AdminAISettingsPage />);
+
+    await waitFor(() => expect(screen.getByText('Compromised')).toBeInTheDocument());
+    fireEvent.click(screen.getByText('Force-revoke'));
+    await waitFor(() => expect(revokeSpy).toHaveBeenCalledWith(9));
+  });
+
+  it('persists call-log retention on blur via the policy patch (issue #342)', async () => {
+    vi.spyOn(api, 'getAISettings').mockResolvedValue({
+      llm_enabled: true,
+      llm_model: 'claude-haiku-4-5-20251001',
+      llm_rate_limit_per_minute: 3,
+      api_key_configured: true,
+      api_key_masked: '...abcd',
+    });
+    vi.spyOn(api, 'getAIModels').mockResolvedValue({ models: [] });
+    vi.spyOn(api, 'getAdminLlmPolicy').mockResolvedValue({
+      llm_apikey_connectors_enabled: true,
+      llm_compatible_connector_enabled: true,
+      llm_default_connector_id: null,
+      llm_call_log_retention_days: 30,
+    });
+    vi.spyOn(api, 'listAllLlmConnectors').mockResolvedValue([]);
+    vi.spyOn(api, 'getAdminLlmUsage').mockResolvedValue({ days: 30, rows: [] });
+    const patchSpy = vi.spyOn(api, 'updateAdminLlmPolicy').mockResolvedValue({
+      llm_apikey_connectors_enabled: true,
+      llm_compatible_connector_enabled: true,
+      llm_default_connector_id: null,
+      llm_call_log_retention_days: 90,
+    });
+
+    render(<AdminAISettingsPage />);
+
+    const input = (await screen.findByLabelText(
+      /Call log retention/i,
+    )) as HTMLInputElement;
+    expect(input.value).toBe('30');
+
+    fireEvent.change(input, { target: { value: '90' } });
+    fireEvent.blur(input);
+
+    await waitFor(() =>
+      expect(patchSpy).toHaveBeenCalledWith(
+        expect.objectContaining({ llm_call_log_retention_days: 90 }),
+      ),
+    );
+  });
+
+  it('clamps an out-of-range retention value before patching (issue #342)', async () => {
+    vi.spyOn(api, 'getAISettings').mockResolvedValue({
+      llm_enabled: true,
+      llm_model: 'claude-haiku-4-5-20251001',
+      llm_rate_limit_per_minute: 3,
+      api_key_configured: true,
+      api_key_masked: '...abcd',
+    });
+    vi.spyOn(api, 'getAIModels').mockResolvedValue({ models: [] });
+    vi.spyOn(api, 'getAdminLlmPolicy').mockResolvedValue({
+      llm_apikey_connectors_enabled: true,
+      llm_compatible_connector_enabled: true,
+      llm_default_connector_id: null,
+      llm_call_log_retention_days: 30,
+    });
+    vi.spyOn(api, 'listAllLlmConnectors').mockResolvedValue([]);
+    vi.spyOn(api, 'getAdminLlmUsage').mockResolvedValue({ days: 30, rows: [] });
+    const patchSpy = vi.spyOn(api, 'updateAdminLlmPolicy').mockResolvedValue({
+      llm_apikey_connectors_enabled: true,
+      llm_compatible_connector_enabled: true,
+      llm_default_connector_id: null,
+      llm_call_log_retention_days: 365,
+    });
+
+    render(<AdminAISettingsPage />);
+
+    const input = (await screen.findByLabelText(
+      /Call log retention/i,
+    )) as HTMLInputElement;
+    fireEvent.change(input, { target: { value: '9999' } });
+    fireEvent.blur(input);
+
+    await waitFor(() =>
+      expect(patchSpy).toHaveBeenCalledWith(
+        expect.objectContaining({ llm_call_log_retention_days: 365 }),
+      ),
+    );
+  });
+
+  // Use 5 (not 0) for the below-min value: the onChange handler treats a falsy
+  // parsed value as "no change" (`parseInt(...) || policy.value`), so 0 would be
+  // coerced back to the current policy before blur ever sees it. 5 is a genuine
+  // below-min entry that the blur clamp must lift to 7.
+  it('clamps a below-min retention value before patching (issue #342)', async () => {
+    vi.spyOn(api, 'getAISettings').mockResolvedValue({
+      llm_enabled: true,
+      llm_model: 'claude-haiku-4-5-20251001',
+      llm_rate_limit_per_minute: 3,
+      api_key_configured: true,
+      api_key_masked: '...abcd',
+    });
+    vi.spyOn(api, 'getAIModels').mockResolvedValue({ models: [] });
+    vi.spyOn(api, 'getAdminLlmPolicy').mockResolvedValue({
+      llm_apikey_connectors_enabled: true,
+      llm_compatible_connector_enabled: true,
+      llm_default_connector_id: null,
+      llm_call_log_retention_days: 30,
+    });
+    vi.spyOn(api, 'listAllLlmConnectors').mockResolvedValue([]);
+    vi.spyOn(api, 'getAdminLlmUsage').mockResolvedValue({ days: 30, rows: [] });
+    const patchSpy = vi.spyOn(api, 'updateAdminLlmPolicy').mockResolvedValue({
+      llm_apikey_connectors_enabled: true,
+      llm_compatible_connector_enabled: true,
+      llm_default_connector_id: null,
+      llm_call_log_retention_days: 7,
+    });
+
+    render(<AdminAISettingsPage />);
+
+    const input = (await screen.findByLabelText(
+      /Call log retention/i,
+    )) as HTMLInputElement;
+    fireEvent.change(input, { target: { value: '5' } });
+    fireEvent.blur(input);
+
+    await waitFor(() =>
+      expect(patchSpy).toHaveBeenCalledWith(
+        expect.objectContaining({ llm_call_log_retention_days: 7 }),
+      ),
+    );
+  });
+
+  // -------- issue #346: surface health-check columns in connectors table --------
+  it('renders last-health-check column with a status badge per connector', async () => {
+    vi.spyOn(api, 'getAISettings').mockResolvedValue({
+      llm_enabled: true,
+      llm_model: 'claude-haiku-4-5-20251001',
+      llm_rate_limit_per_minute: 3,
+      api_key_configured: true,
+      api_key_masked: '...abcd',
+    });
+    vi.spyOn(api, 'getAIModels').mockResolvedValue({ models: [] });
+    vi.spyOn(api, 'getAdminLlmPolicy').mockResolvedValue({
+      llm_apikey_connectors_enabled: true,
+      llm_compatible_connector_enabled: true,
+      llm_default_connector_id: null,
+      llm_call_log_retention_days: 30,
+    });
+    vi.spyOn(api, 'listAllLlmConnectors').mockResolvedValue([
+      {
+        id: 1,
+        user_id: 1,
+        dj_username: 'alpha',
+        connector_type: 'openai_apikey',
+        display_name: 'Alpha key',
+        status: 'active',
+        base_url_plain: null,
+        model_hint: null,
+        created_at: '2026-05-01T00:00:00Z',
+        updated_at: '2026-05-01T00:00:00Z',
+        last_used_at: null,
+        last_error: null,
+        is_default: false,
+        last_health_check_at: '2026-05-28T10:00:00Z',
+        last_health_check_status: 'ok',
+        monthly_token_cap: null,
+        current_month_tokens: 0,
+      },
+      {
+        id: 2,
+        user_id: 2,
+        dj_username: 'bravo',
+        connector_type: 'anthropic_apikey',
+        display_name: 'Bravo key',
+        status: 'auth_invalid',
+        base_url_plain: null,
+        model_hint: null,
+        created_at: '2026-05-01T00:00:00Z',
+        updated_at: '2026-05-01T00:00:00Z',
+        last_used_at: null,
+        last_error: 'auth_invalid',
+        is_default: false,
+        last_health_check_at: '2026-05-28T09:00:00Z',
+        last_health_check_status: 'auth_invalid',
+        monthly_token_cap: null,
+        current_month_tokens: 0,
+      },
+      {
+        id: 3,
+        user_id: 3,
+        dj_username: 'charlie',
+        connector_type: 'openai_apikey',
+        display_name: 'Charlie key',
+        status: 'active',
+        base_url_plain: null,
+        model_hint: null,
+        created_at: '2026-05-01T00:00:00Z',
+        updated_at: '2026-05-01T00:00:00Z',
+        last_used_at: null,
+        last_error: null,
+        is_default: false,
+        last_health_check_at: null,
+        last_health_check_status: null,
+        monthly_token_cap: null,
+        current_month_tokens: 0,
+      },
+    ]);
+    vi.spyOn(api, 'getAdminLlmUsage').mockResolvedValue({ days: 30, rows: [] });
+
+    render(<AdminAISettingsPage />);
+
+    await waitFor(() => expect(screen.getByText('Alpha key')).toBeInTheDocument());
+    // Column header rendered with sortable affordance
+    expect(screen.getByText('Last health check')).toBeInTheDocument();
+    // Each badge visible
+    expect(screen.getByText('OK')).toBeInTheDocument();
+    expect(screen.getByText('Auth invalid')).toBeInTheDocument();
+    expect(screen.getByText('Never checked')).toBeInTheDocument();
+  });
+
+  it('toggles sort direction when clicking the last-health-check header', async () => {
+    vi.spyOn(api, 'getAISettings').mockResolvedValue({
+      llm_enabled: true,
+      llm_model: 'claude-haiku-4-5-20251001',
+      llm_rate_limit_per_minute: 3,
+      api_key_configured: true,
+      api_key_masked: '...abcd',
+    });
+    vi.spyOn(api, 'getAIModels').mockResolvedValue({ models: [] });
+    vi.spyOn(api, 'getAdminLlmPolicy').mockResolvedValue({
+      llm_apikey_connectors_enabled: true,
+      llm_compatible_connector_enabled: true,
+      llm_default_connector_id: null,
+      llm_call_log_retention_days: 30,
+    });
+    vi.spyOn(api, 'listAllLlmConnectors').mockResolvedValue([
+      {
+        id: 1,
+        user_id: 1,
+        dj_username: 'older',
+        connector_type: 'openai_apikey',
+        display_name: 'Older check',
+        status: 'active',
+        base_url_plain: null,
+        model_hint: null,
+        created_at: '2026-05-01T00:00:00Z',
+        updated_at: '2026-05-01T00:00:00Z',
+        last_used_at: null,
+        last_error: null,
+        is_default: false,
+        last_health_check_at: '2026-05-01T00:00:00Z',
+        last_health_check_status: 'ok',
+        monthly_token_cap: null,
+        current_month_tokens: 0,
+      },
+      {
+        id: 2,
+        user_id: 2,
+        dj_username: 'newer',
+        connector_type: 'openai_apikey',
+        display_name: 'Newer check',
+        status: 'active',
+        base_url_plain: null,
+        model_hint: null,
+        created_at: '2026-05-01T00:00:00Z',
+        updated_at: '2026-05-01T00:00:00Z',
+        last_used_at: null,
+        last_error: null,
+        is_default: false,
+        last_health_check_at: '2026-05-28T00:00:00Z',
+        last_health_check_status: 'ok',
+        monthly_token_cap: null,
+        current_month_tokens: 0,
+      },
+    ]);
+    vi.spyOn(api, 'getAdminLlmUsage').mockResolvedValue({ days: 30, rows: [] });
+
+    render(<AdminAISettingsPage />);
+
+    await waitFor(() => expect(screen.getByText('Newer check')).toBeInTheDocument());
+
+    const findRow = (text: string) => {
+      const td = screen.getByText(text);
+      const tr = td.closest('tr');
+      if (!tr) throw new Error(`row for ${text} not found`);
+      return tr;
+    };
+
+    // Default sort = last_health_check_at DESC → newer first.
+    const tbody = findRow('Newer check').parentElement!;
+    const beforeRows = Array.from(tbody.querySelectorAll('tr'));
+    const beforeOrder = beforeRows.map((r) => r.querySelector('td')!.textContent);
+    expect(beforeOrder).toEqual(['newer', 'older']);
+
+    // Click the Last health check header → should flip to ASC (older first).
+    fireEvent.click(screen.getByText('Last health check'));
+    await waitFor(() => {
+      const rows = Array.from(tbody.querySelectorAll('tr'));
+      const order = rows.map((r) => r.querySelector('td')!.textContent);
+      expect(order).toEqual(['older', 'newer']);
+    });
+  });
 });
diff --git a/dashboard/app/admin/ai/page.tsx b/dashboard/app/admin/ai/page.tsx
index 77ae31a7..af1a4c80 100644
--- a/dashboard/app/admin/ai/page.tsx
+++ b/dashboard/app/admin/ai/page.tsx
@@ -1,8 +1,16 @@
 'use client';
 
-import { useState } from 'react';
+import { useCallback, useEffect, useState } from 'react';
 import { api } from '@/lib/api';
-import type { AISettings, AIModelInfo } from '@/lib/api-types';
+import type { AdminLlmAuditFilters } from '@/lib/api';
+import type {
+  AISettings,
+  AIModelInfo,
+  LlmAdminAudit,
+  LlmAdminConnector,
+  LlmAdminPolicy,
+  LlmAdminUsage,
+} from '@/lib/api-types';
 import { useAdminPage } from '@/lib/useAdminPage';
 import { HelpSpot } from '@/components/help/HelpSpot';
 import { HelpButton } from '@/components/help/HelpButton';
@@ -10,12 +18,261 @@ import { OnboardingOverlay } from '@/components/help/OnboardingOverlay';
 
 const PAGE_ID = 'admin-ai';
 
+const TYPE_LABELS: Record<string, string> = {
+  openai_apikey: 'OpenAI',
+  anthropic_apikey: 'Anthropic',
+  openrouter_apikey: 'OpenRouter',
+  xai_apikey: 'xAI',
+  gemini_apikey: 'Gemini',
+  openai_compatible: 'OpenAI-compatible',
+  bedrock: 'AWS Bedrock',
+  azure_openai: 'Azure OpenAI',
+};
+
+// Audit event types — mirrors AUDIT_* constants in models/llm_connector.py.
+const AUDIT_EVENT_TYPES: Array<{ value: string; label: string }> = [
+  { value: 'connector_created', label: 'Connector created' },
+  { value: 'connector_credentials_rotated', label: 'Credentials rotated' },
+  { value: 'connector_deleted', label: 'Connector deleted' },
+  { value: 'connector_revoked_by_admin', label: 'Revoked by admin' },
+  { value: 'auth_invalid_observed', label: 'Auth invalid observed' },
+  { value: 'policy_changed', label: 'Policy changed' },
+  { value: 'connector_health_check', label: 'Health check' },
+  // Gateway auto-fallback events are written as `fallback_triggered:<trigger>`
+  // (see services/llm/gateway.py). The audit filter is an exact event_type match,
+  // so each trigger variant needs its own option to be filterable.
+  { value: 'fallback_triggered:rate_limited', label: 'Fallback — rate limited' },
+  { value: 'fallback_triggered:auth_invalid', label: 'Fallback — auth invalid' },
+  { value: 'fallback_triggered:provider_unavailable', label: 'Fallback — provider unavailable' },
+  { value: 'fallback_triggered:quota_exceeded', label: 'Fallback — quota exceeded' },
+];
+
+const AUDIT_PAGE_SIZE = 50;
+
+// Map health-check status to a colour family. Active=green, transient/quota
+// issues=amber, auth/error=red. ``null`` (never checked) is treated as
+// "neutral" so the table doesn't scream red on first load.
+const HEALTH_BADGE_STYLES: Record<
+  string,
+  { background: string; color: string; label: string }
+> = {
+  ok: { background: 'var(--color-success-subtle)', color: 'var(--color-success)', label: 'OK' },
+  auth_invalid: {
+    background: 'var(--color-danger-subtle)',
+    color: 'var(--color-danger)',
+    label: 'Auth invalid',
+  },
+  error: {
+    background: 'var(--color-danger-subtle)',
+    color: 'var(--color-danger)',
+    label: 'Error',
+  },
+  rate_limited: {
+    background: 'var(--color-warning-subtle, #2a2418)',
+    color: 'var(--color-warning, #c08418)',
+    label: 'Rate limited',
+  },
+  quota_exceeded: {
+    background: 'var(--color-warning-subtle, #2a2418)',
+    color: 'var(--color-warning, #c08418)',
+    label: 'Quota exceeded',
+  },
+  provider_unavailable: {
+    background: 'var(--color-warning-subtle, #2a2418)',
+    color: 'var(--color-warning, #c08418)',
+    label: 'Provider down',
+  },
+};
+
+type ConnectorSortKey = 'dj_username' | 'last_used_at' | 'last_health_check_at';
+
+function sortConnectors(
+  rows: LlmAdminConnector[],
+  sort: { key: ConnectorSortKey; direction: 'asc' | 'desc' },
+): LlmAdminConnector[] {
+  const factor = sort.direction === 'asc' ? 1 : -1;
+  // Treat ``null`` timestamps as "always last" regardless of direction so an
+  // admin sorting by recency doesn't get a wall of "never checked" rows at
+  // the top — they live below the real signal.
+  const tsValue = (v: string | null | undefined): number => {
+    if (!v) return sort.direction === 'asc' ? Number.POSITIVE_INFINITY : Number.NEGATIVE_INFINITY;
+    return new Date(v).getTime();
+  };
+  const copy = [...rows];
+  copy.sort((a, b) => {
+    if (sort.key === 'dj_username') {
+      const cmp = a.dj_username.localeCompare(b.dj_username);
+      if (cmp !== 0) return cmp * factor;
+    } else {
+      const cmp = tsValue(a[sort.key]) - tsValue(b[sort.key]);
+      if (cmp !== 0) return cmp * factor;
+    }
+    // Stable tiebreak on id so re-renders don't reshuffle equal-keyed rows.
+    return a.id - b.id;
+  });
+  return copy;
+}
+
+// Format a nullable ISO timestamp for table cells; em-dash when absent.
+function formatTimestamp(ts: string | null | undefined): string {
+  return ts ? new Date(ts).toLocaleString() : '—';
+}
+
+// Percent of the monthly cap consumed (issue #339). Returns null when there is
+// no cap (unlimited) so the UI renders no bar. Clamps to 0–100 so an over-cap
+// connector (possible when a cap is lowered mid-month) shows a full bar.
+function capPercent(used: number, cap: number | null | undefined): number | null {
+  if (cap == null) return null;
+  if (cap === 0) return 100;
+  return Math.min(100, Math.max(0, Math.round((used / cap) * 100)));
+}
+
+// Bar colour escalates with consumption: green < 80% < amber < 100% red.
+function capBarColor(percent: number): string {
+  if (percent >= 100) return 'var(--color-danger)';
+  if (percent >= 80) return 'var(--color-warning, #c08418)';
+  return 'var(--color-success)';
+}
+
+function PlainHeader({ label }: { label: string }) {
+  return (
+    <th
+      style={{ textAlign: 'left', padding: '0.5rem', borderBottom: '1px solid var(--border-color)' }}
+    >
+      {label}
+    </th>
+  );
+}
+
+function SortableHeader({
+  label,
+  sortKey,
+  activeKey,
+  direction,
+  onSort,
+}: {
+  label: string;
+  sortKey: ConnectorSortKey;
+  activeKey: ConnectorSortKey;
+  direction: 'asc' | 'desc';
+  onSort: (key: ConnectorSortKey, direction: 'asc' | 'desc') => void;
+}) {
+  const isActive = activeKey === sortKey;
+  const arrow = isActive ? (direction === 'asc' ? '▲' : '▼') : '';
+  return (
+    <th
+      onClick={() => {
+        if (isActive) {
+          onSort(sortKey, direction === 'asc' ? 'desc' : 'asc');
+        } else {
+          // First click on a new column goes to descending — newest-first is
+          // the more useful default for both ``last_used_at`` and
+          // ``last_health_check_at``.
+          onSort(sortKey, 'desc');
+        }
+      }}
+      style={{
+        textAlign: 'left',
+        padding: '0.5rem',
+        borderBottom: '1px solid var(--border-color)',
+        cursor: 'pointer',
+        userSelect: 'none',
+      }}
+      aria-sort={isActive ? (direction === 'asc' ? 'ascending' : 'descending') : 'none'}
+    >
+      {label}
+      {arrow ? <span style={{ marginLeft: '0.25rem', fontSize: '0.75rem' }}>{arrow}</span> : null}
+    </th>
+  );
+}
+
+function HealthBadge({ status }: { status: string | null }) {
+  if (!status) {
+    return (
+      <span style={{ color: 'var(--text-secondary)', fontSize: '0.75rem' }}>Never checked</span>
+    );
+  }
+  const style = HEALTH_BADGE_STYLES[status] ?? {
+    background: 'var(--color-warning-subtle, #2a2418)',
+    color: 'var(--text-secondary)',
+    label: status,
+  };
+  return (
+    <span
+      style={{
+        display: 'inline-block',
+        padding: '0.15rem 0.6rem',
+        borderRadius: '9999px',
+        fontSize: '0.75rem',
+        fontWeight: 600,
+        background: style.background,
+        color: style.color,
+        whiteSpace: 'nowrap',
+      }}
+    >
+      {style.label}
+    </span>
+  );
+}
+
+const AUDIT_DAY_OPTIONS: Array<{ value: number; label: string }> = [
+  { value: 7, label: 'Last 7 days' },
+  { value: 30, label: 'Last 30 days' },
+  { value: 90, label: 'Last 90 days' },
+  { value: 365, label: 'Last year' },
+  { value: 3650, label: 'All time' },
+];
+
 export default function AdminAISettingsPage() {
   const [models, setModels] = useState<AIModelInfo[]>([]);
   const [saving, setSaving] = useState(false);
   const [error, setError] = useState('');
   const [success, setSuccess] = useState('');
 
+  // LLM gateway state
+  const [policy, setPolicy] = useState<LlmAdminPolicy | null>(null);
+  const [connectors, setConnectors] = useState<LlmAdminConnector[]>([]);
+  const [usage, setUsage] = useState<LlmAdminUsage | null>(null);
+  const [policyMessage, setPolicyMessage] = useState('');
+
+  // Connectors-table sort state (issue #346)
+  // Default-sort by health-check-recency so an admin scanning the table sees
+  // the most-recently-verified rows up top — easiest first-pass triage.
+  const [connectorSort, setConnectorSort] = useState<{
+    key: ConnectorSortKey;
+    direction: 'asc' | 'desc';
+  }>({ key: 'last_health_check_at', direction: 'desc' });
+
+  // Audit trail state (issue #341)
+  const [audit, setAudit] = useState<LlmAdminAudit | null>(null);
+  const [auditLoading, setAuditLoading] = useState(false);
+  const [auditError, setAuditError] = useState('');
+  const [auditEventType, setAuditEventType] = useState('');
+  const [auditActorId, setAuditActorId] = useState('');
+  const [auditConnectorId, setAuditConnectorId] = useState('');
+  const [auditDays, setAuditDays] = useState(30);
+  const [auditPage, setAuditPage] = useState(0);
+  const [exporting, setExporting] = useState(false);
+
+  const buildAuditFilters = useCallback(
+    (overrides: Partial<AdminLlmAuditFilters> = {}): AdminLlmAuditFilters => {
+      const filters: AdminLlmAuditFilters = {
+        days: auditDays,
+        limit: AUDIT_PAGE_SIZE,
+        offset: auditPage * AUDIT_PAGE_SIZE,
+      };
+      if (auditEventType) filters.event_type = auditEventType;
+      const actorId = parseInt(auditActorId, 10);
+      if (auditActorId && !Number.isNaN(actorId)) filters.actor_user_id = actorId;
+      const connectorId = parseInt(auditConnectorId, 10);
+      if (auditConnectorId && !Number.isNaN(connectorId)) {
+        filters.target_connector_id = connectorId;
+      }
+      return { ...filters, ...overrides };
+    },
+    [auditDays, auditPage, auditEventType, auditActorId, auditConnectorId],
+  );
+
   const { data: settings, loading, error: loadError, setData: setSettings } = useAdminPage<AISettings>({
     pageId: PAGE_ID,
     loader: async () => {
@@ -29,6 +286,83 @@ export default function AdminAISettingsPage() {
     onError: () => 'Failed to load AI settings',
   });
 
+  useEffect(() => {
+    let active = true;
+    // Load each gateway section independently — a transient failure in one
+    // request shouldn't hide the others (e.g. usage 500 should not blank the
+    // policy + connectors panes).
+    Promise.allSettled([
+      api.getAdminLlmPolicy(),
+      api.listAllLlmConnectors(),
+      api.getAdminLlmUsage(30),
+    ]).then(([p, c, u]) => {
+      if (!active) return;
+      if (p.status === 'fulfilled') setPolicy(p.value);
+      if (c.status === 'fulfilled') setConnectors(c.value);
+      if (u.status === 'fulfilled') setUsage(u.value);
+      if (
+        p.status === 'rejected' ||
+        c.status === 'rejected' ||
+        u.status === 'rejected'
+      ) {
+        setPolicyMessage('Some LLM gateway data failed to load');
+      }
+    });
+    return () => {
+      active = false;
+    };
+  }, []);
+
+  // Load audit events whenever filters or the page change.
+  useEffect(() => {
+    let active = true;
+    setAuditLoading(true);
+    setAuditError('');
+    api
+      .getAdminLlmAudit(buildAuditFilters())
+      .then((data) => {
+        if (active) setAudit(data);
+      })
+      .catch((err) => {
+        if (active) {
+          setAuditError(err instanceof Error ? err.message : 'Failed to load audit events');
+        }
+      })
+      .finally(() => {
+        if (active) setAuditLoading(false);
+      });
+    return () => {
+      active = false;
+    };
+  }, [buildAuditFilters]);
+
+  // Any audit-filter change resets pagination to the first page before applying
+  // the new value, so the offset never points past a now-shorter result set.
+  const onAuditFilterChange = (apply: () => void) => {
+    setAuditPage(0);
+    apply();
+  };
+
+  const handleExportCsv = async () => {
+    setExporting(true);
+    setAuditError('');
+    try {
+      const blob = await api.downloadAdminLlmAuditCsv(buildAuditFilters());
+      const url = URL.createObjectURL(blob);
+      const link = document.createElement('a');
+      link.href = url;
+      link.download = 'llm-audit-events.csv';
+      document.body.appendChild(link);
+      link.click();
+      link.remove();
+      URL.revokeObjectURL(url);
+    } catch (err) {
+      setAuditError(err instanceof Error ? err.message : 'Export failed');
+    } finally {
+      setExporting(false);
+    }
+  };
+
   const handleSave = async () => {
     if (!settings) return;
     setSaving(true);
@@ -50,6 +384,67 @@ export default function AdminAISettingsPage() {
     }
   };
 
+  const handlePolicyPatch = async (next: Partial<LlmAdminPolicy>) => {
+    if (!policy) return;
+    setPolicyMessage('');
+    const optimistic = { ...policy, ...next };
+    const prev = policy;
+    setPolicy(optimistic);
+    try {
+      const updated = await api.updateAdminLlmPolicy({
+        llm_apikey_connectors_enabled: optimistic.llm_apikey_connectors_enabled,
+        llm_compatible_connector_enabled: optimistic.llm_compatible_connector_enabled,
+        llm_default_connector_id: optimistic.llm_default_connector_id,
+        clear_default: optimistic.llm_default_connector_id === null,
+        llm_call_log_retention_days: optimistic.llm_call_log_retention_days,
+      });
+      setPolicy(updated);
+      setPolicyMessage('Policy saved');
+      setTimeout(() => setPolicyMessage(''), 2000);
+    } catch (err) {
+      setPolicy(prev);
+      setPolicyMessage(err instanceof Error ? err.message : 'Save failed');
+    }
+  };
+
+  const handleCapBlur = async (connector: LlmAdminConnector, raw: string) => {
+    const trimmed = raw.trim();
+    // Empty input clears the cap (unlimited).
+    let next: number | null;
+    if (trimmed === '') {
+      next = null;
+    } else {
+      const parsed = parseInt(trimmed, 10);
+      if (Number.isNaN(parsed) || parsed < 0) {
+        setError('Monthly cap must be a non-negative whole number.');
+        return;
+      }
+      next = parsed;
+    }
+    // No-op when unchanged.
+    if (next === (connector.monthly_token_cap ?? null)) return;
+    try {
+      const updated = await api.setAdminLlmConnectorCap(connector.id, next);
+      setConnectors((prev) => prev.map((c) => (c.id === connector.id ? updated : c)));
+      setError('');
+    } catch (err) {
+      setError(err instanceof Error ? err.message : 'Failed to update cap');
+    }
+  };
+
+  const handleRevoke = async (id: number) => {
+    if (!window.confirm('Force-revoke this connector? The DJ will need to re-add it.')) return;
+    try {
+      const updated = await api.revokeAdminLlmConnector(id);
+      setConnectors((prev) => prev.map((c) => (c.id === id ? updated : c)));
+      // Reload policy in case the default changed
+      const newPolicy = await api.getAdminLlmPolicy();
+      setPolicy(newPolicy);
+    } catch (err) {
+      setError(err instanceof Error ? err.message : 'Revoke failed');
+    }
+  };
+
   if (loading) {
     return (
       <div className="container">
@@ -189,6 +584,399 @@ export default function AdminAISettingsPage() {
           {saving ? 'Saving...' : 'Save Settings'}
         </button>
       </div>
+
+      {/* ====== LLM Gateway connector policy ====== */}
+      {policy && (
+        <div className="card" style={{ marginTop: '2rem' }}>
+          <h2 style={{ marginTop: 0 }}>Connector policy</h2>
+          {policyMessage && (
+            <div style={{ marginBottom: '1rem', color: 'var(--text-secondary)' }}>{policyMessage}</div>
+          )}
+          <label style={{ display: 'flex', alignItems: 'center', gap: '0.75rem', cursor: 'pointer' }}>
+            <input
+              type="checkbox"
+              checked={policy.llm_apikey_connectors_enabled}
+              onChange={(e) => handlePolicyPatch({ llm_apikey_connectors_enabled: e.target.checked })}
+            />
+            Allow API-key connectors (e.g. OpenAI, Anthropic, OpenRouter, xAI, Gemini, Bedrock)
+          </label>
+          <label style={{ display: 'flex', alignItems: 'center', gap: '0.75rem', cursor: 'pointer', marginTop: '0.75rem' }}>
+            <input
+              type="checkbox"
+              checked={policy.llm_compatible_connector_enabled}
+              onChange={(e) => handlePolicyPatch({ llm_compatible_connector_enabled: e.target.checked })}
+            />
+            Allow custom OpenAI-compatible endpoints
+          </label>
+
+          <div className="form-group" style={{ marginTop: '1.5rem' }}>
+            <label htmlFor="default-connector">Org default connector</label>
+            <div style={{ color: 'var(--text-secondary)', fontSize: '0.875rem', marginBottom: '0.5rem' }}>
+              Used when a system call has no DJ actor (background jobs).
+            </div>
+            <select
+              id="default-connector"
+              className="input"
+              value={policy.llm_default_connector_id ?? ''}
+              onChange={(e) => {
+                const v = e.target.value;
+                if (!v) {
+                  handlePolicyPatch({ llm_default_connector_id: null });
+                } else {
+                  handlePolicyPatch({ llm_default_connector_id: parseInt(v) });
+                }
+              }}
+              style={{ maxWidth: '480px' }}
+            >
+              <option value="">— None —</option>
+              {connectors
+                .filter((c) => c.status === 'active')
+                .map((c) => (
+                  <option key={c.id} value={c.id}>
+                    {c.dj_username} — {c.display_name} ({TYPE_LABELS[c.connector_type] ?? c.connector_type})
+                  </option>
+                ))}
+            </select>
+          </div>
+
+          <div className="form-group" style={{ marginTop: '1.5rem' }}>
+            <label htmlFor="call-log-retention">Call log retention (days)</label>
+            <div style={{ color: 'var(--text-secondary)', fontSize: '0.875rem', marginBottom: '0.5rem' }}>
+              How long per-call telemetry (counts only, never prompt content) is kept before
+              the daily cleanup deletes it. Range: 7–365 days. Changes take effect within 24 hours.
+            </div>
+            <input
+              id="call-log-retention"
+              type="number"
+              className="input"
+              style={{ maxWidth: '200px' }}
+              min={7}
+              max={365}
+              value={policy.llm_call_log_retention_days}
+              onChange={(e) =>
+                setPolicy({
+                  ...policy,
+                  llm_call_log_retention_days: parseInt(e.target.value, 10) || policy.llm_call_log_retention_days,
+                })
+              }
+              onBlur={(e) => {
+                const raw = parseInt(e.target.value, 10);
+                const clamped = Number.isNaN(raw)
+                  ? policy.llm_call_log_retention_days
+                  : Math.min(365, Math.max(7, raw));
+                handlePolicyPatch({ llm_call_log_retention_days: clamped });
+              }}
+            />
+          </div>
+
+          <p style={{ color: 'var(--text-secondary)', fontSize: '0.875rem', marginTop: '1rem' }}>
+            WrzDJ stores provider credentials encrypted at rest. Calls consume the DJ&apos;s
+            quota or billing directly. Credentials are never shared between DJs.
+          </p>
+        </div>
+      )}
+
+      {/* ====== Per-DJ connectors table ====== */}
+      <div className="card" style={{ marginTop: '2rem' }}>
+        <h2 style={{ marginTop: 0 }}>Per-DJ connectors</h2>
+        <p style={{ color: 'var(--text-secondary)', fontSize: '0.875rem', marginTop: 0 }}>
+          Background monitor verifies each connector every {' '}
+          <code>LLM_HEALTH_CHECK_INTERVAL_HOURS</code> hours (default 6). DJ-triggered
+          tests update the same columns.
+        </p>
+        {connectors.length === 0 ? (
+          <p style={{ color: 'var(--text-secondary)' }}>No DJs have connected an LLM yet.</p>
+        ) : (
+          <div style={{ overflowX: 'auto' }}>
+            <table style={{ width: '100%', borderCollapse: 'collapse' }}>
+              <thead>
+                <tr>
+                  <SortableHeader
+                    label="DJ"
+                    sortKey="dj_username"
+                    activeKey={connectorSort.key}
+                    direction={connectorSort.direction}
+                    onSort={(k, d) => setConnectorSort({ key: k, direction: d })}
+                  />
+                  <PlainHeader label="Type" />
+                  <PlainHeader label="Name" />
+                  <PlainHeader label="Status" />
+                  <SortableHeader
+                    label="Last used"
+                    sortKey="last_used_at"
+                    activeKey={connectorSort.key}
+                    direction={connectorSort.direction}
+                    onSort={(k, d) => setConnectorSort({ key: k, direction: d })}
+                  />
+                  <SortableHeader
+                    label="Last health check"
+                    sortKey="last_health_check_at"
+                    activeKey={connectorSort.key}
+                    direction={connectorSort.direction}
+                    onSort={(k, d) => setConnectorSort({ key: k, direction: d })}
+                  />
+                  <PlainHeader label="Result" />
+                  <PlainHeader label="Monthly cap" />
+                  <PlainHeader label="Actions" />
+                </tr>
+              </thead>
+              <tbody>
+                {sortConnectors(connectors, connectorSort).map((c) => (
+                  <tr key={c.id}>
+                    <td style={{ padding: '0.5rem' }}>{c.dj_username}</td>
+                    <td style={{ padding: '0.5rem' }}>
+                      {TYPE_LABELS[c.connector_type] ?? c.connector_type}
+                    </td>
+                    <td style={{ padding: '0.5rem' }}>{c.display_name}</td>
+                    <td style={{ padding: '0.5rem' }}>{c.status}</td>
+                    <td style={{ padding: '0.5rem', color: 'var(--text-secondary)' }}>
+                      {formatTimestamp(c.last_used_at)}
+                    </td>
+                    <td style={{ padding: '0.5rem', color: 'var(--text-secondary)' }}>
+                      {formatTimestamp(c.last_health_check_at)}
+                    </td>
+                    <td style={{ padding: '0.5rem' }}>
+                      <HealthBadge status={c.last_health_check_status ?? null} />
+                    </td>
+                    <td style={{ padding: '0.5rem', minWidth: '180px' }}>
+                      <input
+                        type="number"
+                        className="input"
+                        style={{ width: '110px' }}
+                        min={0}
+                        placeholder="∞"
+                        defaultValue={c.monthly_token_cap ?? ''}
+                        onBlur={(e) => handleCapBlur(c, e.target.value)}
+                        aria-label={`Monthly token cap for ${c.dj_username} ${c.display_name}`}
+                      />
+                      <div
+                        style={{
+                          marginTop: '0.35rem',
+                          fontSize: '0.75rem',
+                          color: 'var(--text-secondary)',
+                        }}
+                      >
+                        {c.monthly_token_cap == null
+                          ? `${c.current_month_tokens.toLocaleString()} this month · unlimited`
+                          : `${c.current_month_tokens.toLocaleString()} / ${c.monthly_token_cap.toLocaleString()}`}
+                      </div>
+                      {c.monthly_token_cap != null && (
+                        <div
+                          aria-hidden
+                          style={{
+                            marginTop: '0.25rem',
+                            height: '6px',
+                            borderRadius: '9999px',
+                            background: 'var(--border-color)',
+                            overflow: 'hidden',
+                          }}
+                        >
+                          <div
+                            style={{
+                              width: `${capPercent(c.current_month_tokens, c.monthly_token_cap) ?? 0}%`,
+                              height: '100%',
+                              background: capBarColor(
+                                capPercent(c.current_month_tokens, c.monthly_token_cap) ?? 0,
+                              ),
+                            }}
+                          />
+                        </div>
+                      )}
+                    </td>
+                    <td style={{ padding: '0.5rem' }}>
+                      {c.status !== 'disabled' && (
+                        <button className="btn btn-danger" onClick={() => handleRevoke(c.id)}>
+                          Force-revoke
+                        </button>
+                      )}
+                    </td>
+                  </tr>
+                ))}
+              </tbody>
+            </table>
+          </div>
+        )}
+      </div>
+
+      {/* ====== Usage ====== */}
+      {usage && (
+        <div className="card" style={{ marginTop: '2rem' }}>
+          <h2 style={{ marginTop: 0 }}>Usage — last {usage.days} days</h2>
+          {usage.rows.length === 0 ? (
+            <p style={{ color: 'var(--text-secondary)' }}>No calls yet.</p>
+          ) : (
+            <div style={{ overflowX: 'auto' }}>
+              <table style={{ width: '100%', borderCollapse: 'collapse' }}>
+                <thead>
+                  <tr>
+                    {['DJ', 'Connector', 'Calls', 'Tokens in', 'Tokens out', 'Error rate'].map((h) => (
+                      <PlainHeader key={h} label={h} />
+                    ))}
+                  </tr>
+                </thead>
+                <tbody>
+                  {usage.rows.map((r) => (
+                    <tr key={r.connector_id}>
+                      <td style={{ padding: '0.5rem' }}>{r.dj_username}</td>
+                      <td style={{ padding: '0.5rem' }}>
+                        {r.display_name} <span style={{ color: 'var(--text-secondary)' }}>· {TYPE_LABELS[r.connector_type] ?? r.connector_type}</span>
+                      </td>
+                      <td style={{ padding: '0.5rem' }}>{r.total_calls}</td>
+                      <td style={{ padding: '0.5rem' }}>{r.total_tokens_in}</td>
+                      <td style={{ padding: '0.5rem' }}>{r.total_tokens_out}</td>
+                      <td style={{ padding: '0.5rem' }}>{(r.error_rate * 100).toFixed(1)}%</td>
+                    </tr>
+                  ))}
+                </tbody>
+              </table>
+            </div>
+          )}
+        </div>
+      )}
+
+      {/* ====== Audit trail (issue #341) ====== */}
+      <div className="card" style={{ marginTop: '2rem' }}>
+        <div style={{ display: 'flex', justifyContent: 'space-between', alignItems: 'center', gap: '1rem', flexWrap: 'wrap' }}>
+          <h2 style={{ marginTop: 0, marginBottom: 0 }}>Audit trail</h2>
+          <button
+            className="btn"
+            onClick={handleExportCsv}
+            disabled={exporting}
+          >
+            {exporting ? 'Exporting…' : 'Export CSV'}
+          </button>
+        </div>
+        <p style={{ color: 'var(--text-secondary)', fontSize: '0.875rem', marginTop: '0.5rem' }}>
+          Credential lifecycle events for every connector. Export honors the active filters.
+        </p>
+
+        {/* Filters */}
+        <div style={{ display: 'flex', gap: '1rem', flexWrap: 'wrap', marginTop: '1rem' }}>
+          <div className="form-group" style={{ margin: 0 }}>
+            <label htmlFor="audit-event-type">Event type</label>
+            <select
+              id="audit-event-type"
+              className="input"
+              value={auditEventType}
+              onChange={(e) => onAuditFilterChange(() => setAuditEventType(e.target.value))}
+            >
+              <option value="">All event types</option>
+              {AUDIT_EVENT_TYPES.map((t) => (
+                <option key={t.value} value={t.value}>{t.label}</option>
+              ))}
+            </select>
+          </div>
+
+          <div className="form-group" style={{ margin: 0 }}>
+            <label htmlFor="audit-actor">Actor user ID</label>
+            <input
+              id="audit-actor"
+              type="number"
+              min={1}
+              className="input"
+              style={{ maxWidth: '160px' }}
+              placeholder="Any"
+              value={auditActorId}
+              onChange={(e) => onAuditFilterChange(() => setAuditActorId(e.target.value))}
+            />
+          </div>
+
+          <div className="form-group" style={{ margin: 0 }}>
+            <label htmlFor="audit-connector">Connector</label>
+            <select
+              id="audit-connector"
+              className="input"
+              value={auditConnectorId}
+              onChange={(e) => onAuditFilterChange(() => setAuditConnectorId(e.target.value))}
+            >
+              <option value="">All connectors</option>
+              {connectors.map((c) => (
+                <option key={c.id} value={c.id}>
+                  {c.dj_username} — {c.display_name}
+                </option>
+              ))}
+            </select>
+          </div>
+
+          <div className="form-group" style={{ margin: 0 }}>
+            <label htmlFor="audit-days">Date range</label>
+            <select
+              id="audit-days"
+              className="input"
+              value={auditDays}
+              onChange={(e) => onAuditFilterChange(() => setAuditDays(parseInt(e.target.value, 10)))}
+            >
+              {AUDIT_DAY_OPTIONS.map((d) => (
+                <option key={d.value} value={d.value}>{d.label}</option>
+              ))}
+            </select>
+          </div>
+        </div>
+
+        {auditError && (
+          <div style={{ color: 'var(--color-danger)', marginTop: '1rem' }}>{auditError}</div>
+        )}
+
+        {auditLoading && !audit ? (
+          <p style={{ color: 'var(--text-secondary)', marginTop: '1rem' }}>Loading audit events…</p>
+        ) : audit && audit.rows.length === 0 ? (
+          <p style={{ color: 'var(--text-secondary)', marginTop: '1rem' }}>No audit events match these filters.</p>
+        ) : audit ? (
+          <>
+            <div style={{ overflowX: 'auto', marginTop: '1rem' }}>
+              <table style={{ width: '100%', borderCollapse: 'collapse' }}>
+                <thead>
+                  <tr>
+                    {['Timestamp', 'Actor', 'Event type', 'Connector', 'Notes'].map((h) => (
+                      <PlainHeader key={h} label={h} />
+                    ))}
+                  </tr>
+                </thead>
+                <tbody>
+                  {audit.rows.map((row) => (
+                    <tr key={row.id}>
+                      <td style={{ padding: '0.5rem', color: 'var(--text-secondary)' }}>
+                        {formatTimestamp(row.created_at)}
+                      </td>
+                      <td style={{ padding: '0.5rem' }}>{row.actor_username}</td>
+                      <td style={{ padding: '0.5rem' }}>{row.event_type}</td>
+                      <td style={{ padding: '0.5rem' }}>
+                        {row.target_connector_display_name ?? '—'}
+                      </td>
+                      <td style={{ padding: '0.5rem', color: 'var(--text-secondary)' }}>
+                        {row.notes ?? '—'}
+                      </td>
+                    </tr>
+                  ))}
+                </tbody>
+              </table>
+            </div>
+
+            {/* Pagination */}
+            <div style={{ display: 'flex', alignItems: 'center', gap: '1rem', marginTop: '1rem' }}>
+              <button
+                className="btn"
+                disabled={auditPage === 0 || auditLoading}
+                onClick={() => setAuditPage((p) => Math.max(0, p - 1))}
+              >
+                Previous
+              </button>
+              <span style={{ color: 'var(--text-secondary)', fontSize: '0.875rem' }}>
+                {audit.total === 0
+                  ? '0 events'
+                  : `${audit.offset + 1}–${Math.min(audit.offset + audit.rows.length, audit.total)} of ${audit.total}`}
+              </span>
+              <button
+                className="btn"
+                disabled={auditLoading || audit.offset + AUDIT_PAGE_SIZE >= audit.total}
+                onClick={() => setAuditPage((p) => p + 1)}
+              >
+                Next
+              </button>
+            </div>
+          </>
+        ) : null}
+      </div>
     </div>
   );
 }
diff --git a/dashboard/components/AiProvidersSection.tsx b/dashboard/components/AiProvidersSection.tsx
new file mode 100644
index 00000000..956e41d8
--- /dev/null
+++ b/dashboard/components/AiProvidersSection.tsx
@@ -0,0 +1,803 @@
+'use client';
+
+import { useEffect, useMemo, useState } from 'react';
+
+import { api } from '@/lib/api';
+import type {
+  AIModelInfo,
+  LlmConnector,
+  LlmConnectorCreate,
+  LlmConnectorType,
+  LlmDjPolicy,
+  LlmFeatureKey,
+  LlmFeaturePreferences,
+} from '@/lib/api-types';
+
+const CONNECTOR_TYPE_LABELS: Record<LlmConnectorType, string> = {
+  openai_apikey: 'OpenAI API key',
+  anthropic_apikey: 'Anthropic API key',
+  openrouter_apikey: 'OpenRouter API key',
+  xai_apikey: 'xAI Grok API key',
+  gemini_apikey: 'Google Gemini API key',
+  openai_compatible: 'Custom OpenAI-compatible endpoint',
+  bedrock: 'AWS Bedrock',
+  azure_openai: 'Azure OpenAI',
+};
+
+const STATUS_LABELS: Record<string, { text: string; color: string }> = {
+  active: { text: 'Active', color: 'var(--color-success)' },
+  auth_invalid: { text: 'Auth invalid', color: 'var(--color-danger)' },
+  disabled: { text: 'Disabled', color: 'var(--text-secondary)' },
+};
+
+// Human-readable labels for the pinnable agentic features (issue #337). Falls
+// back to the raw feature key for any feature the backend adds before the UI
+// learns its label.
+const FEATURE_LABELS: Record<string, string> = {
+  recommendation: 'Recommendations',
+  set_builder: 'Set builder',
+};
+
+// Provider-specific input placeholders. Missing entries fall back to the
+// per-field default below (openai_apikey for the key, openai_compatible for
+// the model hint), preserving the previous nested-ternary behavior.
+const API_KEY_PLACEHOLDERS: Partial<Record<LlmConnectorType, string>> = {
+  anthropic_apikey: 'sk-ant-…',
+  openrouter_apikey: 'sk-or-…',
+  xai_apikey: 'xai-…',
+  gemini_apikey: 'AIza…',
+};
+const API_KEY_PLACEHOLDER_DEFAULT = 'sk-proj-… / sk-…';
+
+const MODEL_HINT_PLACEHOLDERS: Partial<Record<LlmConnectorType, string>> = {
+  anthropic_apikey: 'claude-haiku-4-5-20251001',
+  openai_apikey: 'gpt-5-mini',
+  openrouter_apikey: 'e.g. openai/gpt-4o-mini',
+  xai_apikey: 'grok-3-mini',
+  gemini_apikey: 'gemini-2.5-flash',
+};
+const MODEL_HINT_PLACEHOLDER_DEFAULT = 'e.g. llama3';
+
+interface FormState {
+  open: boolean;
+  connector_type: LlmConnectorType;
+  display_name: string;
+  api_key: string;
+  base_url: string;
+  bearer: string;
+  model_hint: string;
+  aws_access_key_id: string;
+  aws_secret_access_key: string;
+  aws_region: string;
+  aws_model_id: string;
+  azure_resource_name: string;
+  azure_deployment_name: string;
+  azure_api_version: string;
+}
+
+const EMPTY_FORM: FormState = {
+  open: false,
+  connector_type: 'openai_apikey',
+  display_name: '',
+  api_key: '',
+  base_url: '',
+  bearer: '',
+  model_hint: '',
+  aws_access_key_id: '',
+  aws_secret_access_key: '',
+  aws_region: '',
+  aws_model_id: '',
+  azure_resource_name: '',
+  azure_deployment_name: '',
+  azure_api_version: '',
+};
+
+/**
+ * DJ-facing AI connector management UI (connect / test / delete, model hint,
+ * Hermes onboarding). Relocated from the standalone `/settings/ai` route into
+ * the `/account` page (issue #357). The component assumes the parent already
+ * enforces authentication — it does no auth gating of its own.
+ *
+ * Fail-closed behavior is preserved: when the DJ-scoped policy endpoint can't
+ * be read, NO provider types are offered rather than leaking every type.
+ */
+export default function AiProvidersSection() {
+  const [policy, setPolicy] = useState<LlmDjPolicy | null>(null);
+  const [connectors, setConnectors] = useState<LlmConnector[]>([]);
+  const [loading, setLoading] = useState(true);
+  const [error, setError] = useState('');
+  const [form, setForm] = useState<FormState>(EMPTY_FORM);
+  const [submitting, setSubmitting] = useState(false);
+  const [submitMessage, setSubmitMessage] = useState('');
+  const [submitError, setSubmitError] = useState('');
+  const [testStateById, setTestStateById] = useState<Record<number, string>>({});
+  // Live streamed text per connector for the "Stream test" button, plus the id
+  // currently streaming (drives the disabled state + label).
+  const [streamTextById, setStreamTextById] = useState<Record<number, string>>({});
+  const [streamingId, setStreamingId] = useState<number | null>(null);
+  const [openrouterModels, setOpenrouterModels] = useState<AIModelInfo[]>([]);
+  const [openrouterModelsLoaded, setOpenrouterModelsLoaded] = useState(false);
+  const [featurePrefs, setFeaturePrefs] = useState<LlmFeaturePreferences | null>(null);
+
+  useEffect(() => {
+    let active = true;
+    setLoading(true);
+    setError('');
+    Promise.all([api.listLlmConnectors(), fetchPolicySoft(), fetchFeaturePrefsSoft()])
+      .then(([rows, p, prefs]) => {
+        if (!active) return;
+        setConnectors(rows);
+        setPolicy(p);
+        setFeaturePrefs(prefs);
+      })
+      .catch((err) => {
+        if (!active) return;
+        setError(err instanceof Error ? err.message : 'Failed to load');
+      })
+      .finally(() => {
+        if (active) setLoading(false);
+      });
+    return () => {
+      active = false;
+    };
+  }, []);
+
+  // Lazily fetch the OpenRouter model catalogue the first time a DJ opens the
+  // form on the OpenRouter type. Best-effort: an empty list (or a failed fetch)
+  // simply falls back to the free-text model input. Fetched once per mount.
+  const wantsOpenrouterModels = form.open && form.connector_type === 'openrouter_apikey';
+  useEffect(() => {
+    if (!wantsOpenrouterModels || openrouterModelsLoaded) return;
+    setOpenrouterModelsLoaded(true);
+    api
+      .listOpenRouterModels()
+      .then((res) => setOpenrouterModels(res.models))
+      .catch(() => {
+        // Swallow — the dropdown gracefully degrades to free-text entry.
+      });
+  }, [wantsOpenrouterModels, openrouterModelsLoaded]);
+
+  const allowedTypes = useMemo<LlmConnectorType[]>(() => {
+    // Fail closed: when the policy can't be read, offer no providers rather than
+    // surfacing every type and letting the DJ pick one the admin disabled (the
+    // create call would 403). The server is the source of truth for the set.
+    if (!policy) return [];
+    return policy.allowed_connector_types as LlmConnectorType[];
+  }, [policy]);
+
+  // onChange factory for the plain string form fields — every text input/select
+  // updates exactly one FormState key with the raw value. connector_type stays
+  // inline because it needs a cast to LlmConnectorType.
+  const handleField =
+    (key: Exclude<keyof FormState, 'open' | 'connector_type'>) =>
+    (e: React.ChangeEvent<HTMLInputElement | HTMLSelectElement>) =>
+      setForm((f) => ({ ...f, [key]: e.target.value }));
+
+  const handleOpenForm = () => {
+    if (allowedTypes.length === 0) {
+      setSubmitError('Connector creation is currently disabled by admin policy.');
+      setSubmitMessage('');
+      return;
+    }
+    setForm({ ...EMPTY_FORM, open: true, connector_type: allowedTypes[0] });
+    setSubmitMessage('');
+    setSubmitError('');
+  };
+
+  const handleCancel = () => {
+    setForm(EMPTY_FORM);
+    setSubmitError('');
+  };
+
+  const handleCreate = async (e: React.FormEvent) => {
+    e.preventDefault();
+    setSubmitting(true);
+    setSubmitMessage('');
+    setSubmitError('');
+    const isCompatible = form.connector_type === 'openai_compatible';
+    const isBedrock = form.connector_type === 'bedrock';
+    const isAzure = form.connector_type === 'azure_openai';
+    // API-key providers: everything that isn't openai_compatible or bedrock.
+    // Azure also carries an api_key (plus its azure_* fields).
+    const isApiKey = !isCompatible && !isBedrock;
+    const payload: LlmConnectorCreate = {
+      connector_type: form.connector_type,
+      display_name: form.display_name,
+      // Bedrock has no model_hint field (it uses aws_model_id); never post a
+      // stale hint left over from a prior connector-type selection.
+      model_hint: isBedrock ? null : form.model_hint || null,
+      api_key: isApiKey ? form.api_key : null,
+      base_url: isCompatible ? form.base_url : null,
+      bearer: isCompatible ? form.bearer || null : null,
+      aws_access_key_id: isBedrock ? form.aws_access_key_id : null,
+      aws_secret_access_key: isBedrock ? form.aws_secret_access_key : null,
+      aws_region: isBedrock ? form.aws_region : null,
+      aws_model_id: isBedrock ? form.aws_model_id : null,
+      azure_resource_name: isAzure ? form.azure_resource_name : null,
+      azure_deployment_name: isAzure ? form.azure_deployment_name : null,
+      azure_api_version: isAzure ? form.azure_api_version : null,
+    };
+    try {
+      const created = await api.createLlmConnector(payload);
+      setConnectors((prev) => [created, ...prev]);
+      setForm(EMPTY_FORM);
+      setSubmitMessage(`Created "${created.display_name}". Run "Test" to verify it works.`);
+    } catch (err) {
+      setSubmitError(
+        err instanceof Error ? err.message : 'Create failed (check your inputs)',
+      );
+    } finally {
+      setSubmitting(false);
+    }
+  };
+
+  const handleTest = async (id: number) => {
+    setTestStateById((s) => ({ ...s, [id]: 'Testing…' }));
+    try {
+      const result = await api.testLlmConnector(id);
+      setTestStateById((s) => ({
+        ...s,
+        [id]: result.ok ? 'OK' : `Failed: ${result.error_code ?? 'unknown'}`,
+      }));
+      // Refresh the row so updated status renders
+      const fresh = await api.listLlmConnectors();
+      setConnectors(fresh);
+    } catch (err) {
+      setTestStateById((s) => ({
+        ...s,
+        [id]: err instanceof Error ? err.message : 'Test failed',
+      }));
+    }
+  };
+
+  const handleStreamTest = async (id: number) => {
+    setStreamTextById((s) => ({ ...s, [id]: '' }));
+    setStreamingId(id);
+    try {
+      await api.streamConnectorTest(id, (chunk) => {
+        if (chunk.text_delta) {
+          setStreamTextById((s) => ({ ...s, [id]: (s[id] ?? '') + chunk.text_delta }));
+        }
+      });
+    } catch (err) {
+      setStreamTextById((s) => ({
+        ...s,
+        [id]: err instanceof Error ? `(stream test failed: ${err.message})` : '(stream test failed)',
+      }));
+    } finally {
+      setStreamingId(null);
+    }
+  };
+
+  const handleDelete = async (id: number) => {
+    if (!window.confirm('Delete this connector? This cannot be undone.')) return;
+    try {
+      await api.deleteLlmConnector(id);
+      setConnectors((prev) => prev.filter((c) => c.id !== id));
+    } catch (err) {
+      setError(err instanceof Error ? err.message : 'Delete failed');
+    }
+  };
+
+  // Set / unset the per-DJ explicit default (issue #336). Optimistic update on
+  // the full list keeps the radio state consistent (exactly one row is default
+  // at any time) without waiting for a refetch.
+  const handleSetDefault = async (id: number) => {
+    try {
+      const updated = await api.setLlmConnectorDefault(id);
+      setConnectors((prev) =>
+        prev.map((c) =>
+          c.id === updated.id
+            ? updated
+            : c.user_id === updated.user_id
+            ? { ...c, is_default: false }
+            : c,
+        ),
+      );
+    } catch (err) {
+      setError(err instanceof Error ? err.message : 'Failed to set default');
+    }
+  };
+
+  const handleUnsetDefault = async (id: number) => {
+    try {
+      const updated = await api.unsetLlmConnectorDefault(id);
+      setConnectors((prev) => prev.map((c) => (c.id === updated.id ? updated : c)));
+    } catch (err) {
+      setError(err instanceof Error ? err.message : 'Failed to clear default');
+    }
+  };
+
+  // Per-feature pin (issue #337). An empty select value clears the pin (use the
+  // account default); any connector id sets/replaces it. The endpoint returns
+  // the full updated list, so we store it verbatim.
+  const handleFeaturePrefChange = async (feature: LlmFeatureKey, value: string) => {
+    try {
+      const updated =
+        value === ''
+          ? await api.clearLlmFeaturePreference(feature)
+          : await api.setLlmFeaturePreference({ feature, connector_id: Number(value) });
+      setFeaturePrefs(updated);
+      setError('');
+    } catch (err) {
+      setError(err instanceof Error ? err.message : 'Failed to update feature default');
+    }
+  };
+
+  return (
+    <div>
+      <h2 style={{ marginTop: 0, marginBottom: '1.25rem', fontSize: '1.1rem' }}>
+        AI / Model providers
+      </h2>
+
+      <p style={{ color: 'var(--text-secondary)' }}>
+        Connect your own LLM provider so AI-assisted features (recommendations, etc.) bill to
+        your account. Credentials are encrypted at rest. Calls consume your account&apos;s API or
+        subscription quota directly.
+      </p>
+
+      {loading && <div className="loading">Loading…</div>}
+      {error && <div style={{ color: 'var(--color-danger)', marginTop: '1rem' }}>{error}</div>}
+      {submitMessage && (
+        <div style={{ color: 'var(--color-success)', marginTop: '1rem' }}>{submitMessage}</div>
+      )}
+      {submitError && (
+        <div style={{ color: 'var(--color-danger)', marginTop: '1rem' }}>{submitError}</div>
+      )}
+
+      <section style={{ marginTop: '2rem' }}>
+        <h3 style={{ marginTop: 0 }}>Connected providers</h3>
+        {connectors.length === 0 && !loading && (
+          <p style={{ color: 'var(--text-secondary)' }}>No connectors yet.</p>
+        )}
+        {connectors.map((c) => {
+          const status = STATUS_LABELS[c.status] ?? { text: c.status, color: 'var(--text-secondary)' };
+          // Pin / unpin is only meaningful for active connectors — the gateway
+          // skips inactive defaults, so don't let the DJ pin a row that
+          // resolution would silently bypass.
+          const canPin = c.status === 'active';
+          const radioId = `connector-default-${c.id}`;
+          return (
+            <div key={c.id} className="card" style={{ marginTop: '1rem' }}>
+              <div style={{ display: 'flex', justifyContent: 'space-between', gap: '1rem', flexWrap: 'wrap' }}>
+                <div>
+                  <div style={{ display: 'flex', alignItems: 'center', gap: '0.5rem', flexWrap: 'wrap' }}>
+                    <div style={{ fontWeight: 600 }}>{c.display_name}</div>
+                    {c.is_default && (
+                      <span
+                        style={{
+                          fontSize: '0.7rem',
+                          padding: '0.125rem 0.5rem',
+                          borderRadius: '0.5rem',
+                          background: 'var(--color-success)',
+                          color: '#0a0a0a',
+                          fontWeight: 700,
+                          textTransform: 'uppercase',
+                          letterSpacing: '0.05em',
+                        }}
+                      >
+                        Default
+                      </span>
+                    )}
+                  </div>
+                  <div style={{ color: 'var(--text-secondary)', fontSize: '0.875rem' }}>
+                    {CONNECTOR_TYPE_LABELS[c.connector_type as LlmConnectorType] ?? c.connector_type}
+                    {c.model_hint ? ` · ${c.model_hint}` : ''}
+                    {c.base_url_plain ? ` · ${c.base_url_plain}` : ''}
+                  </div>
+                  <div style={{ marginTop: '0.5rem', fontSize: '0.875rem', color: status.color, fontWeight: 600 }}>
+                    {status.text}
+                    {testStateById[c.id] ? ` · ${testStateById[c.id]}` : ''}
+                  </div>
+                  {/* Radio for "Set as default" — exactly one connector per DJ may be pinned. */}
+                  <label
+                    htmlFor={radioId}
+                    style={{
+                      display: 'flex',
+                      alignItems: 'center',
+                      gap: '0.4rem',
+                      marginTop: '0.5rem',
+                      fontSize: '0.85rem',
+                      color: canPin ? 'var(--text)' : 'var(--text-secondary)',
+                      cursor: canPin ? 'pointer' : 'not-allowed',
+                    }}
+                  >
+                    <input
+                      id={radioId}
+                      type="radio"
+                      name="llm-connector-default"
+                      checked={c.is_default}
+                      disabled={!canPin && !c.is_default}
+                      onChange={() => {
+                        if (canPin) {
+                          handleSetDefault(c.id);
+                        }
+                      }}
+                    />
+                    {c.is_default ? (
+                      <>
+                        Pinned as default ·{' '}
+                        <button
+                          type="button"
+                          className="btn-link"
+                          onClick={(e) => {
+                            e.preventDefault();
+                            handleUnsetDefault(c.id);
+                          }}
+                          style={{
+                            background: 'none',
+                            border: 'none',
+                            padding: 0,
+                            color: 'var(--text-secondary)',
+                            textDecoration: 'underline',
+                            cursor: 'pointer',
+                            font: 'inherit',
+                          }}
+                        >
+                          Unpin
+                        </button>
+                      </>
+                    ) : (
+                      <span>Set as default</span>
+                    )}
+                  </label>
+                </div>
+                <div style={{ display: 'flex', gap: '0.5rem', flexWrap: 'wrap' }}>
+                  <button className="btn btn-secondary" onClick={() => handleTest(c.id)}>
+                    Test
+                  </button>
+                  <button
+                    className="btn btn-secondary"
+                    onClick={() => handleStreamTest(c.id)}
+                    disabled={streamingId !== null}
+                  >
+                    {streamingId === c.id ? 'Streaming…' : 'Stream test'}
+                  </button>
+                  <button className="btn btn-danger" onClick={() => handleDelete(c.id)}>
+                    Delete
+                  </button>
+                </div>
+                {streamTextById[c.id] !== undefined && streamTextById[c.id] !== '' && (
+                  <div
+                    style={{
+                      marginTop: '0.5rem',
+                      fontSize: '0.875rem',
+                      color: 'var(--text-secondary)',
+                      fontStyle: 'italic',
+                    }}
+                  >
+                    {streamTextById[c.id]}
+                  </div>
+                )}
+              </div>
+            </div>
+          );
+        })}
+      </section>
+
+      {featurePrefs && featurePrefs.known_features.length > 0 && (
+        <section style={{ marginTop: '2rem' }}>
+          <h3 style={{ marginTop: 0 }}>Per-feature defaults</h3>
+          <p style={{ color: 'var(--text-secondary)' }}>
+            Pin a specific provider to each AI feature. Unpinned features use your account
+            default (or most-recently-used) connector. Inactive connectors are skipped
+            automatically.
+          </p>
+          {featurePrefs.known_features.map((feature) => {
+            const current =
+              featurePrefs.preferences.find((p) => p.feature === feature)?.connector_id ?? '';
+            const selectId = `feature-pref-${feature}`;
+            const activeConnectors = connectors.filter((c) => c.status === 'active');
+            return (
+              <div className="form-group" key={feature}>
+                <label htmlFor={selectId}>{FEATURE_LABELS[feature] ?? feature}</label>
+                <select
+                  id={selectId}
+                  className="input"
+                  value={current === '' ? '' : String(current)}
+                  onChange={(e) =>
+                    handleFeaturePrefChange(feature as LlmFeatureKey, e.target.value)
+                  }
+                >
+                  <option value="">Use account default</option>
+                  {activeConnectors.map((c) => (
+                    <option key={c.id} value={String(c.id)}>
+                      {c.display_name}
+                    </option>
+                  ))}
+                </select>
+              </div>
+            );
+          })}
+        </section>
+      )}
+
+      <section style={{ marginTop: '2rem' }}>
+        {allowedTypes.length === 0 && !form.open && !loading && (
+          <p style={{ color: 'var(--text-secondary)' }}>
+            Connector creation is currently disabled by admin policy.
+          </p>
+        )}
+        {allowedTypes.length > 0 && !form.open && (
+          <button className="btn btn-primary" onClick={handleOpenForm}>
+            + Add provider
+          </button>
+        )}
+        {form.open && (
+          <form className="card" onSubmit={handleCreate} style={{ marginTop: '1rem' }}>
+            <h3 style={{ marginTop: 0 }}>Add provider</h3>
+
+            <div className="form-group">
+              <label htmlFor="connector_type">Provider</label>
+              <select
+                id="connector_type"
+                className="input"
+                value={form.connector_type}
+                onChange={(e) =>
+                  setForm({ ...form, connector_type: e.target.value as LlmConnectorType })
+                }
+              >
+                {allowedTypes.map((t) => (
+                  <option key={t} value={t}>
+                    {CONNECTOR_TYPE_LABELS[t]}
+                  </option>
+                ))}
+              </select>
+            </div>
+
+            <div className="form-group">
+              <label htmlFor="display_name">Display name</label>
+              <input
+                id="display_name"
+                className="input"
+                value={form.display_name}
+                onChange={handleField('display_name')}
+                placeholder="e.g. My OpenAI"
+                maxLength={80}
+                required
+              />
+            </div>
+
+            {form.connector_type === 'bedrock' ? (
+              <>
+                <div className="form-group">
+                  <label htmlFor="aws_access_key_id">AWS access key ID</label>
+                  <input
+                    id="aws_access_key_id"
+                    className="input"
+                    value={form.aws_access_key_id}
+                    onChange={handleField('aws_access_key_id')}
+                    placeholder="AKIA…"
+                    autoComplete="off"
+                    required
+                  />
+                </div>
+                <div className="form-group">
+                  <label htmlFor="aws_secret_access_key">AWS secret access key</label>
+                  <input
+                    id="aws_secret_access_key"
+                    className="input"
+                    type="password"
+                    value={form.aws_secret_access_key}
+                    onChange={handleField('aws_secret_access_key')}
+                    autoComplete="off"
+                    required
+                  />
+                </div>
+                <div className="form-group">
+                  <label htmlFor="aws_region">AWS region</label>
+                  <input
+                    id="aws_region"
+                    className="input"
+                    value={form.aws_region}
+                    onChange={handleField('aws_region')}
+                    placeholder="us-east-1"
+                    required
+                  />
+                </div>
+                <div className="form-group">
+                  <label htmlFor="aws_model_id">Bedrock model ID</label>
+                  <input
+                    id="aws_model_id"
+                    className="input"
+                    value={form.aws_model_id}
+                    onChange={handleField('aws_model_id')}
+                    placeholder="anthropic.claude-3-5-sonnet-20241022-v2:0"
+                    required
+                  />
+                  <p style={{ color: 'var(--text-secondary)', fontSize: '0.875rem', margin: '0.5rem 0 0' }}>
+                    Calls are signed with AWS SigV4 and billed to your AWS account.
+                    Claude (<code>anthropic.*</code>) and Llama (<code>meta.*</code>)
+                    model families are supported.
+                  </p>
+                </div>
+              </>
+            ) : form.connector_type === 'azure_openai' ? (
+              <>
+                <div className="form-group">
+                  <label htmlFor="api_key">API key</label>
+                  <input
+                    id="api_key"
+                    className="input"
+                    type="password"
+                    value={form.api_key}
+                    onChange={handleField('api_key')}
+                    placeholder="Azure OpenAI key"
+                    required
+                  />
+                </div>
+                <div className="form-group">
+                  <label htmlFor="azure_resource_name">Resource name</label>
+                  <input
+                    id="azure_resource_name"
+                    className="input"
+                    value={form.azure_resource_name}
+                    onChange={handleField('azure_resource_name')}
+                    placeholder="e.g. my-company"
+                    required
+                  />
+                  <p style={{ color: 'var(--text-secondary)', fontSize: '0.875rem', margin: '0.5rem 0 0' }}>
+                    The resource subdomain in{' '}
+                    <code>https://&lt;resource&gt;.openai.azure.com</code>.
+                  </p>
+                </div>
+                <div className="form-group">
+                  <label htmlFor="azure_deployment_name">Deployment name</label>
+                  <input
+                    id="azure_deployment_name"
+                    className="input"
+                    value={form.azure_deployment_name}
+                    onChange={handleField('azure_deployment_name')}
+                    placeholder="e.g. gpt-4o-prod"
+                    required
+                  />
+                </div>
+                <div className="form-group">
+                  <label htmlFor="azure_api_version">API version</label>
+                  <input
+                    id="azure_api_version"
+                    className="input"
+                    value={form.azure_api_version}
+                    onChange={handleField('azure_api_version')}
+                    placeholder="e.g. 2024-06-01"
+                    required
+                  />
+                </div>
+              </>
+            ) : form.connector_type !== 'openai_compatible' ? (
+              <div className="form-group">
+                <label htmlFor="api_key">API key</label>
+                <input
+                  id="api_key"
+                  className="input"
+                  type="password"
+                  value={form.api_key}
+                  onChange={handleField('api_key')}
+                  placeholder={
+                    API_KEY_PLACEHOLDERS[form.connector_type] ?? API_KEY_PLACEHOLDER_DEFAULT
+                  }
+                  required
+                />
+              </div>
+            ) : (
+              <>
+                <div className="form-group">
+                  <label htmlFor="base_url">Base URL</label>
+                  <input
+                    id="base_url"
+                    className="input"
+                    value={form.base_url}
+                    onChange={handleField('base_url')}
+                    placeholder="http://127.0.0.1:11434/v1"
+                    required
+                  />
+                  <p style={{ color: 'var(--text-secondary)', fontSize: '0.875rem', margin: '0.5rem 0 0' }}>
+                    HTTPS is required for public hosts. HTTP is only allowed for loopback (
+                    <code>127.0.0.1</code>, <code>localhost</code>) and private (RFC1918) IPs.
+                  </p>
+                </div>
+                <div className="form-group">
+                  <label htmlFor="bearer">Bearer token (optional)</label>
+                  <input
+                    id="bearer"
+                    className="input"
+                    type="password"
+                    value={form.bearer}
+                    onChange={handleField('bearer')}
+                  />
+                </div>
+                <details style={{ marginTop: '1rem' }}>
+                  <summary style={{ cursor: 'pointer', fontWeight: 600 }}>
+                    Want to use your ChatGPT Plus / Pro subscription?
+                  </summary>
+                  <p style={{ marginTop: '0.5rem' }}>
+                    Install{' '}
+                    <a
+                      href="https://github.com/NousResearch/hermes-agent"
+                      target="_blank"
+                      rel="noreferrer"
+                    >
+                      Hermes Agent
+                    </a>
+                    , run <code>hermes proxy</code>, and paste the URL it prints below. Your
+                    ChatGPT account never leaves your machine — WrzDJ only talks to your local
+                    Hermes proxy.
+                  </p>
+                </details>
+              </>
+            )}
+
+            {form.connector_type !== 'bedrock' && (
+              <div className="form-group">
+                <label htmlFor="model_hint">Model (optional)</label>
+                {form.connector_type === 'openrouter_apikey' && openrouterModels.length > 0 ? (
+                  <>
+                    <select
+                      id="model_hint"
+                      className="input"
+                      value={form.model_hint}
+                      onChange={handleField('model_hint')}
+                    >
+                      <option value="">Default (openai/gpt-4o-mini)</option>
+                      {openrouterModels.map((m) => (
+                        <option key={m.id} value={m.id}>
+                          {m.name} ({m.id})
+                        </option>
+                      ))}
+                    </select>
+                    <p style={{ color: 'var(--text-secondary)', fontSize: '0.875rem', margin: '0.5rem 0 0' }}>
+                      Each model routes through OpenRouter and bills your account at that model&apos;s
+                      OpenRouter rate (see openrouter.ai/models for per-token pricing).
+                    </p>
+                  </>
+                ) : (
+                  <input
+                    id="model_hint"
+                    className="input"
+                    value={form.model_hint}
+                    onChange={handleField('model_hint')}
+                    placeholder={
+                      MODEL_HINT_PLACEHOLDERS[form.connector_type] ?? MODEL_HINT_PLACEHOLDER_DEFAULT
+                    }
+                  />
+                )}
+              </div>
+            )}
+
+            <div style={{ display: 'flex', gap: '0.5rem', marginTop: '1rem' }}>
+              <button type="submit" className="btn btn-primary" disabled={submitting}>
+                {submitting ? 'Saving…' : 'Save'}
+              </button>
+              <button type="button" className="btn btn-secondary" onClick={handleCancel}>
+                Cancel
+              </button>
+            </div>
+          </form>
+        )}
+      </section>
+    </div>
+  );
+}
+
+async function fetchPolicySoft(): Promise<LlmDjPolicy | null> {
+  // Read the DJ-scoped policy endpoint. On any failure we return null and the
+  // UI fails *closed* (no providers offered) — see `allowedTypes`. This avoids
+  // showing a DJ a provider the admin disabled, only to have the create call
+  // reject it with a 403.
+  try {
+    return await api.getLlmPolicy();
+  } catch {
+    return null;
+  }
+}
+
+async function fetchFeaturePrefsSoft(): Promise<LlmFeaturePreferences | null> {
+  // Read the DJ's per-feature pins. On any failure we return null and the
+  // "Per-feature defaults" section is simply hidden — it's an enhancement, not
+  // load-bearing, so a transient error must not break the whole page.
+  try {
+    return await api.listLlmFeaturePreferences();
+  } catch {
+    return null;
+  }
+}
diff --git a/dashboard/components/__tests__/AiProvidersSection.featurePrefs.test.tsx b/dashboard/components/__tests__/AiProvidersSection.featurePrefs.test.tsx
new file mode 100644
index 00000000..cbabb2d3
--- /dev/null
+++ b/dashboard/components/__tests__/AiProvidersSection.featurePrefs.test.tsx
@@ -0,0 +1,124 @@
+import { describe, it, expect, vi, beforeEach } from 'vitest';
+import { render, screen, waitFor, fireEvent } from '@testing-library/react';
+
+import AiProvidersSection from '../AiProvidersSection';
+import { api } from '@/lib/api';
+import type { LlmConnector } from '@/lib/api-types';
+
+const NOW = new Date().toISOString();
+
+function makeConnector(overrides: Partial<LlmConnector> = {}): LlmConnector {
+  return {
+    id: 1,
+    user_id: 42,
+    connector_type: 'openai_apikey',
+    display_name: 'My OpenAI',
+    status: 'active',
+    base_url_plain: null,
+    model_hint: null,
+    created_at: NOW,
+    updated_at: NOW,
+    last_used_at: null,
+    last_error: null,
+    is_default: false,
+    last_health_check_at: null,
+    last_health_check_status: null,
+    monthly_token_cap: null,
+    ...overrides,
+  };
+}
+
+describe('AiProvidersSection per-feature defaults', () => {
+  beforeEach(() => {
+    vi.restoreAllMocks();
+    vi.spyOn(api, 'listLlmConnectors').mockResolvedValue([makeConnector()]);
+    vi.spyOn(api, 'getLlmPolicy').mockResolvedValue({
+      llm_apikey_connectors_enabled: true,
+      llm_compatible_connector_enabled: true,
+      allowed_connector_types: ['openai_apikey'],
+    });
+    vi.spyOn(api, 'listLlmFeaturePreferences').mockResolvedValue({
+      preferences: [],
+      known_features: ['recommendation', 'set_builder'],
+    });
+  });
+
+  it('renders a picker per known feature and sets a pin', async () => {
+    const setSpy = vi.spyOn(api, 'setLlmFeaturePreference').mockResolvedValue({
+      preferences: [{ feature: 'recommendation', connector_id: 1 }],
+      known_features: ['recommendation', 'set_builder'],
+    });
+
+    render(<AiProvidersSection />);
+
+    await waitFor(() =>
+      expect(screen.getByText('Per-feature defaults')).toBeInTheDocument(),
+    );
+
+    // One picker per known feature.
+    expect(screen.getByLabelText('Recommendations')).toBeInTheDocument();
+    expect(screen.getByLabelText('Set builder')).toBeInTheDocument();
+
+    const select = screen.getByLabelText('Recommendations') as HTMLSelectElement;
+    fireEvent.change(select, { target: { value: '1' } });
+
+    await waitFor(() =>
+      expect(setSpy).toHaveBeenCalledWith({
+        feature: 'recommendation',
+        connector_id: 1,
+      }),
+    );
+  });
+
+  it('clears a pin when "Use account default" is selected', async () => {
+    vi.spyOn(api, 'listLlmFeaturePreferences').mockResolvedValue({
+      preferences: [{ feature: 'recommendation', connector_id: 1 }],
+      known_features: ['recommendation', 'set_builder'],
+    });
+    const clearSpy = vi.spyOn(api, 'clearLlmFeaturePreference').mockResolvedValue({
+      preferences: [],
+      known_features: ['recommendation', 'set_builder'],
+    });
+
+    render(<AiProvidersSection />);
+    await waitFor(() =>
+      expect(screen.getByText('Per-feature defaults')).toBeInTheDocument(),
+    );
+
+    const select = screen.getByLabelText('Recommendations') as HTMLSelectElement;
+    // The current pin should be reflected as the selected value.
+    expect(select.value).toBe('1');
+
+    fireEvent.change(select, { target: { value: '' } });
+
+    await waitFor(() => expect(clearSpy).toHaveBeenCalledWith('recommendation'));
+  });
+
+  it('hides the section when the preferences fetch fails (fail soft)', async () => {
+    vi.spyOn(api, 'listLlmFeaturePreferences').mockRejectedValue(new Error('boom'));
+
+    render(<AiProvidersSection />);
+
+    // The connectors list still renders…
+    await waitFor(() => expect(screen.getByText('My OpenAI')).toBeInTheDocument());
+    // …but the per-feature section is absent.
+    expect(screen.queryByText('Per-feature defaults')).not.toBeInTheDocument();
+  });
+
+  it('only offers active connectors in the picker', async () => {
+    vi.spyOn(api, 'listLlmConnectors').mockResolvedValue([
+      makeConnector({ id: 1, display_name: 'Active one', status: 'active' }),
+      makeConnector({ id: 2, display_name: 'Broken one', status: 'auth_invalid' }),
+    ]);
+
+    render(<AiProvidersSection />);
+    await waitFor(() =>
+      expect(screen.getByText('Per-feature defaults')).toBeInTheDocument(),
+    );
+
+    const select = screen.getByLabelText('Recommendations') as HTMLSelectElement;
+    const optionLabels = Array.from(select.options).map((o) => o.textContent);
+    expect(optionLabels).toContain('Active one');
+    expect(optionLabels).not.toContain('Broken one');
+  });
+});
diff --git a/dashboard/components/__tests__/AiProvidersSection.test.tsx b/dashboard/components/__tests__/AiProvidersSection.test.tsx
new file mode 100644
index 00000000..749bd886
--- /dev/null
+++ b/dashboard/components/__tests__/AiProvidersSection.test.tsx
@@ -0,0 +1,471 @@
+import { describe, it, expect, vi, beforeEach } from 'vitest';
+import { render, screen, waitFor, fireEvent } from '@testing-library/react';
+
+import AiProvidersSection from '../AiProvidersSection';
+import { api } from '@/lib/api';
+import type { LlmConnector, LlmConnectorType, LlmDjPolicy } from '@/lib/api-types';
+
+const ALL_APIKEY_TYPES: LlmConnectorType[] = [
+  'openai_apikey',
+  'anthropic_apikey',
+  'openrouter_apikey',
+  'xai_apikey',
+  'bedrock',
+  'azure_openai',
+  'gemini_apikey',
+];
+
+// Build a DJ policy payload. `allowed_connector_types` is what the server
+// computes from the two toggles; the section renders exactly this set.
+function makePolicy(
+  apikeyEnabled: boolean,
+  compatibleEnabled: boolean,
+): LlmDjPolicy {
+  const allowed: LlmConnectorType[] = [];
+  if (apikeyEnabled) allowed.push(...ALL_APIKEY_TYPES);
+  if (compatibleEnabled) allowed.push('openai_compatible');
+  return {
+    llm_apikey_connectors_enabled: apikeyEnabled,
+    llm_compatible_connector_enabled: compatibleEnabled,
+    allowed_connector_types: allowed,
+  };
+}
+
+const NOW = new Date().toISOString();
+
+function makeConnector(overrides: Partial<LlmConnector> = {}): LlmConnector {
+  return {
+    id: 1,
+    user_id: 42,
+    connector_type: 'openai_apikey',
+    display_name: 'My OpenAI',
+    status: 'active',
+    base_url_plain: null,
+    model_hint: 'gpt-5-mini',
+    created_at: NOW,
+    updated_at: NOW,
+    last_used_at: null,
+    last_error: null,
+    is_default: false,
+    last_health_check_at: null,
+    last_health_check_status: null,
+    monthly_token_cap: null,
+    ...overrides,
+  };
+}
+
+describe('AiProvidersSection', () => {
+  beforeEach(() => {
+    vi.restoreAllMocks();
+  });
+
+  it('renders the section heading', async () => {
+    vi.spyOn(api, 'listLlmConnectors').mockResolvedValue([]);
+    vi.spyOn(api, 'getLlmPolicy').mockRejectedValue(new Error('forbidden'));
+
+    render(<AiProvidersSection />);
+
+    expect(screen.getByText('AI / Model providers')).toBeInTheDocument();
+  });
+
+  it('lists existing connectors', async () => {
+    vi.spyOn(api, 'listLlmConnectors').mockResolvedValue([
+      makeConnector({ display_name: 'My OpenAI' }),
+      makeConnector({
+        id: 2,
+        connector_type: 'anthropic_apikey',
+        display_name: 'My Claude',
+        model_hint: 'claude-haiku',
+      }),
+    ]);
+    vi.spyOn(api, 'getLlmPolicy').mockRejectedValue(new Error('forbidden'));
+
+    render(<AiProvidersSection />);
+
+    await waitFor(() => expect(screen.getByText('My OpenAI')).toBeInTheDocument());
+    expect(screen.getByText('My Claude')).toBeInTheDocument();
+  });
+
+  it('respects admin policy when filtering allowed connector types', async () => {
+    vi.spyOn(api, 'listLlmConnectors').mockResolvedValue([]);
+    vi.spyOn(api, 'getLlmPolicy').mockResolvedValue(makePolicy(false, true));
+
+    render(<AiProvidersSection />);
+
+    await waitFor(() => expect(screen.getByText('+ Add provider')).toBeInTheDocument());
+    fireEvent.click(screen.getByText('+ Add provider'));
+
+    // Provider dropdown should only contain the openai_compatible option
+    const select = screen.getByLabelText('Provider') as HTMLSelectElement;
+    const optionValues = Array.from(select.options).map((o) => o.value);
+    expect(optionValues).toEqual(['openai_compatible']);
+  });
+
+  it('reads the DJ-scoped policy endpoint (not the admin one)', async () => {
+    vi.spyOn(api, 'listLlmConnectors').mockResolvedValue([]);
+    const adminPolicySpy = vi
+      .spyOn(api, 'getAdminLlmPolicy')
+      .mockRejectedValue(new Error('should not be called'));
+    const policySpy = vi
+      .spyOn(api, 'getLlmPolicy')
+      .mockResolvedValue(makePolicy(true, true));
+
+    render(<AiProvidersSection />);
+
+    await waitFor(() => expect(policySpy).toHaveBeenCalled());
+    expect(adminPolicySpy).not.toHaveBeenCalled();
+  });
+
+  it('fails closed: hides all provider types when policy fetch fails', async () => {
+    vi.spyOn(api, 'listLlmConnectors').mockResolvedValue([]);
+    // Simulate the DJ policy endpoint being unavailable.
+    vi.spyOn(api, 'getLlmPolicy').mockRejectedValue(new Error('unavailable'));
+
+    render(<AiProvidersSection />);
+
+    // No "+ Add provider" button — the picker is hidden entirely.
+    await waitFor(() =>
+      expect(
+        screen.getByText('Connector creation is currently disabled by admin policy.'),
+      ).toBeInTheDocument(),
+    );
+    expect(screen.queryByText('+ Add provider')).not.toBeInTheDocument();
+    expect(screen.queryByLabelText('Provider')).not.toBeInTheDocument();
+  });
+
+  it('fails closed: only api-key types when compatible is disabled (no leak of all)', async () => {
+    vi.spyOn(api, 'listLlmConnectors').mockResolvedValue([]);
+    vi.spyOn(api, 'getLlmPolicy').mockResolvedValue(makePolicy(true, false));
+
+    render(<AiProvidersSection />);
+
+    await waitFor(() => expect(screen.getByText('+ Add provider')).toBeInTheDocument());
+    fireEvent.click(screen.getByText('+ Add provider'));
+
+    const select = screen.getByLabelText('Provider') as HTMLSelectElement;
+    const optionValues = Array.from(select.options).map((o) => o.value);
+    expect(optionValues).not.toContain('openai_compatible');
+    expect(optionValues).toContain('openai_apikey');
+  });
+
+  it('offers Azure OpenAI and reveals its config fields', async () => {
+    vi.spyOn(api, 'listLlmConnectors').mockResolvedValue([]);
+    vi.spyOn(api, 'getLlmPolicy').mockResolvedValue(makePolicy(true, true));
+
+    render(<AiProvidersSection />);
+
+    await waitFor(() => expect(screen.getByText('+ Add provider')).toBeInTheDocument());
+    fireEvent.click(screen.getByText('+ Add provider'));
+
+    const select = screen.getByLabelText('Provider') as HTMLSelectElement;
+    const optionValues = Array.from(select.options).map((o) => o.value);
+    expect(optionValues).toContain('azure_openai');
+
+    // Switching to Azure surfaces the resource/deployment/api-version inputs.
+    fireEvent.change(select, { target: { value: 'azure_openai' } });
+    expect(screen.getByLabelText('API key')).toBeInTheDocument();
+    expect(screen.getByLabelText('Resource name')).toBeInTheDocument();
+    expect(screen.getByLabelText('Deployment name')).toBeInTheDocument();
+    expect(screen.getByLabelText('API version')).toBeInTheDocument();
+  });
+
+  it('sends Azure config fields on create', async () => {
+    vi.spyOn(api, 'listLlmConnectors').mockResolvedValue([]);
+    vi.spyOn(api, 'getLlmPolicy').mockResolvedValue(makePolicy(true, true));
+    const createSpy = vi
+      .spyOn(api, 'createLlmConnector')
+      .mockResolvedValue(makeConnector({ connector_type: 'azure_openai' }));
+
+    render(<AiProvidersSection />);
+
+    await waitFor(() => expect(screen.getByText('+ Add provider')).toBeInTheDocument());
+    fireEvent.click(screen.getByText('+ Add provider'));
+
+    fireEvent.change(screen.getByLabelText('Provider'), {
+      target: { value: 'azure_openai' },
+    });
+    fireEvent.change(screen.getByLabelText('Display name'), {
+      target: { value: 'Venue Azure' },
+    });
+    fireEvent.change(screen.getByLabelText('API key'), {
+      target: { value: 'azure-secret' },
+    });
+    fireEvent.change(screen.getByLabelText('Resource name'), {
+      target: { value: 'venue-co' },
+    });
+    fireEvent.change(screen.getByLabelText('Deployment name'), {
+      target: { value: 'gpt4o-prod' },
+    });
+    fireEvent.change(screen.getByLabelText('API version'), {
+      target: { value: '2024-06-01' },
+    });
+
+    fireEvent.click(screen.getByRole('button', { name: 'Save' }));
+
+    await waitFor(() => expect(createSpy).toHaveBeenCalled());
+    expect(createSpy).toHaveBeenCalledWith(
+      expect.objectContaining({
+        connector_type: 'azure_openai',
+        api_key: 'azure-secret',
+        azure_resource_name: 'venue-co',
+        azure_deployment_name: 'gpt4o-prod',
+        azure_api_version: '2024-06-01',
+      }),
+    );
+  });
+
+  it('offers AWS Bedrock when api-key connectors are enabled', async () => {
+    vi.spyOn(api, 'listLlmConnectors').mockResolvedValue([]);
+    vi.spyOn(api, 'getLlmPolicy').mockResolvedValue(makePolicy(true, false));
+
+    render(<AiProvidersSection />);
+
+    await waitFor(() => expect(screen.getByText('+ Add provider')).toBeInTheDocument());
+    fireEvent.click(screen.getByText('+ Add provider'));
+
+    const select = screen.getByLabelText('Provider') as HTMLSelectElement;
+    const optionValues = Array.from(select.options).map((o) => o.value);
+    expect(optionValues).toContain('bedrock');
+    expect(optionValues).not.toContain('openai_compatible');
+
+    // Selecting Bedrock reveals the four AWS credential inputs.
+    fireEvent.change(select, { target: { value: 'bedrock' } });
+    expect(screen.getByLabelText('AWS access key ID')).toBeInTheDocument();
+    expect(screen.getByLabelText('AWS secret access key')).toBeInTheDocument();
+    expect(screen.getByLabelText('AWS region')).toBeInTheDocument();
+    expect(screen.getByLabelText('Bedrock model ID')).toBeInTheDocument();
+  });
+
+  it('runs Test and surfaces the result', async () => {
+    const row = makeConnector();
+    vi.spyOn(api, 'listLlmConnectors').mockResolvedValue([row]);
+    vi.spyOn(api, 'getLlmPolicy').mockResolvedValue(makePolicy(true, true));
+    const testSpy = vi.spyOn(api, 'testLlmConnector').mockResolvedValue({
+      ok: true,
+      error_code: null,
+      message: null,
+    });
+    // The refresh after Test re-lists connectors
+    vi.spyOn(api, 'listLlmConnectors').mockResolvedValue([row]);
+
+    render(<AiProvidersSection />);
+
+    await waitFor(() => expect(screen.getByText('My OpenAI')).toBeInTheDocument());
+    fireEvent.click(screen.getByRole('button', { name: 'Test' }));
+    await waitFor(() => {
+      expect(testSpy).toHaveBeenCalledWith(1);
+    });
+  });
+
+  it('runs Stream test and renders the streamed text live', async () => {
+    const row = makeConnector();
+    vi.spyOn(api, 'listLlmConnectors').mockResolvedValue([row]);
+    vi.spyOn(api, 'getLlmPolicy').mockResolvedValue(makePolicy(true, true));
+    const streamSpy = vi
+      .spyOn(api, 'streamConnectorTest')
+      .mockImplementation(async (_id, onChunk) => {
+        onChunk({ text_delta: 'Online' });
+        onChunk({ text_delta: ' and ready', done: false });
+        onChunk({ stop_reason: 'end_turn', done: true });
+      });
+
+    render(<AiProvidersSection />);
+
+    await waitFor(() => expect(screen.getByText('My OpenAI')).toBeInTheDocument());
+    fireEvent.click(screen.getByRole('button', { name: 'Stream test' }));
+    await waitFor(() => {
+      expect(streamSpy).toHaveBeenCalledWith(1, expect.any(Function));
+    });
+    await waitFor(() =>
+      expect(screen.getByText('Online and ready')).toBeInTheDocument(),
+    );
+  });
+
+  it('offers OpenRouter and fetches its model dropdown', async () => {
+    vi.spyOn(api, 'listLlmConnectors').mockResolvedValue([]);
+    vi.spyOn(api, 'getLlmPolicy').mockResolvedValue(makePolicy(true, false));
+    const modelsSpy = vi.spyOn(api, 'listOpenRouterModels').mockResolvedValue({
+      models: [
+        { id: 'openai/gpt-4o-mini', name: 'GPT-4o mini' },
+        { id: 'anthropic/claude-3.5-sonnet', name: 'Claude 3.5 Sonnet' },
+      ],
+    });
+
+    render(<AiProvidersSection />);
+
+    await waitFor(() => expect(screen.getByText('+ Add provider')).toBeInTheDocument());
+    fireEvent.click(screen.getByText('+ Add provider'));
+
+    const select = screen.getByLabelText('Provider') as HTMLSelectElement;
+    const optionValues = Array.from(select.options).map((o) => o.value);
+    expect(optionValues).toContain('openrouter_apikey');
+
+    // Switch to OpenRouter — the model catalogue should be fetched and rendered.
+    fireEvent.change(select, { target: { value: 'openrouter_apikey' } });
+    await waitFor(() => expect(modelsSpy).toHaveBeenCalled());
+
+    // The dropdown options appear once the (async) fetch resolves.
+    await screen.findByRole('option', { name: /GPT-4o mini/ });
+    const modelSelect = screen.getByLabelText('Model (optional)') as HTMLSelectElement;
+    const modelValues = Array.from(modelSelect.options).map((o) => o.value);
+    expect(modelValues).toContain('openai/gpt-4o-mini');
+    expect(modelValues).toContain('anthropic/claude-3.5-sonnet');
+  });
+
+  it('creates an OpenRouter connector with the selected model', async () => {
+    vi.spyOn(api, 'listLlmConnectors').mockResolvedValue([]);
+    vi.spyOn(api, 'getLlmPolicy').mockResolvedValue(makePolicy(true, false));
+    vi.spyOn(api, 'listOpenRouterModels').mockResolvedValue({
+      models: [{ id: 'openai/gpt-4o-mini', name: 'GPT-4o mini' }],
+    });
+    const createSpy = vi.spyOn(api, 'createLlmConnector').mockResolvedValue(
+      makeConnector({
+        connector_type: 'openrouter_apikey',
+        display_name: 'My OpenRouter',
+        model_hint: 'openai/gpt-4o-mini',
+      }),
+    );
+
+    render(<AiProvidersSection />);
+    await waitFor(() => expect(screen.getByText('+ Add provider')).toBeInTheDocument());
+    fireEvent.click(screen.getByText('+ Add provider'));
+
+    fireEvent.change(screen.getByLabelText('Provider'), {
+      target: { value: 'openrouter_apikey' },
+    });
+    fireEvent.change(screen.getByLabelText('Display name'), {
+      target: { value: 'My OpenRouter' },
+    });
+    fireEvent.change(screen.getByLabelText('API key'), {
+      target: { value: 'sk-or-v1-1234567890abcdef1234567890abcdef' },
+    });
+
+    await screen.findByRole('option', { name: /GPT-4o mini/ });
+    const modelSelect = screen.getByLabelText('Model (optional)') as HTMLSelectElement;
+    fireEvent.change(modelSelect, { target: { value: 'openai/gpt-4o-mini' } });
+
+    fireEvent.click(screen.getByRole('button', { name: 'Save' }));
+
+    await waitFor(() => expect(createSpy).toHaveBeenCalled());
+    expect(createSpy).toHaveBeenCalledWith(
+      expect.objectContaining({
+        connector_type: 'openrouter_apikey',
+        display_name: 'My OpenRouter',
+        api_key: 'sk-or-v1-1234567890abcdef1234567890abcdef',
+        base_url: null,
+        bearer: null,
+        model_hint: 'openai/gpt-4o-mini',
+      }),
+    );
+  });
+
+  // ---------- per-DJ default (issue #336) ----------
+
+  it('shows the Default badge on the pinned connector', async () => {
+    vi.spyOn(api, 'listLlmConnectors').mockResolvedValue([
+      makeConnector({ id: 1, display_name: 'Pinned', is_default: true }),
+      makeConnector({ id: 2, display_name: 'Other', is_default: false }),
+    ]);
+    vi.spyOn(api, 'getLlmPolicy').mockRejectedValue(new Error('forbidden'));
+
+    render(<AiProvidersSection />);
+
+    await waitFor(() => expect(screen.getByText('Pinned')).toBeInTheDocument());
+    // The badge is rendered next to the display name.
+    expect(screen.getByText('Default')).toBeInTheDocument();
+  });
+
+  it('clicking the radio on an unpinned connector calls setDefault', async () => {
+    vi.spyOn(api, 'listLlmConnectors').mockResolvedValue([
+      makeConnector({ id: 1, display_name: 'A', is_default: true }),
+      makeConnector({ id: 2, display_name: 'B', is_default: false }),
+    ]);
+    vi.spyOn(api, 'getLlmPolicy').mockRejectedValue(new Error('forbidden'));
+    const setSpy = vi
+      .spyOn(api, 'setLlmConnectorDefault')
+      .mockResolvedValue(
+        makeConnector({ id: 2, display_name: 'B', is_default: true }),
+      );
+
+    render(<AiProvidersSection />);
+
+    await waitFor(() => expect(screen.getByText('B')).toBeInTheDocument());
+    // The radio for connector B is unchecked; click to pin it.
+    const radioB = screen.getByLabelText('Set as default');
+    fireEvent.click(radioB);
+
+    await waitFor(() => expect(setSpy).toHaveBeenCalledWith(2));
+  });
+
+  it('clicking Unpin on the pinned connector calls unsetDefault', async () => {
+    vi.spyOn(api, 'listLlmConnectors').mockResolvedValue([
+      makeConnector({ id: 1, display_name: 'A', is_default: true }),
+    ]);
+    vi.spyOn(api, 'getLlmPolicy').mockRejectedValue(new Error('forbidden'));
+    const unsetSpy = vi
+      .spyOn(api, 'unsetLlmConnectorDefault')
+      .mockResolvedValue(makeConnector({ id: 1, display_name: 'A', is_default: false }));
+
+    render(<AiProvidersSection />);
+
+    await waitFor(() => expect(screen.getByText('A')).toBeInTheDocument());
+    fireEvent.click(screen.getByRole('button', { name: 'Unpin' }));
+
+    await waitFor(() => expect(unsetSpy).toHaveBeenCalledWith(1));
+  });
+
+  it('disables the radio on inactive connectors', async () => {
+    vi.spyOn(api, 'listLlmConnectors').mockResolvedValue([
+      makeConnector({
+        id: 1,
+        display_name: 'Broken',
+        status: 'auth_invalid',
+        is_default: false,
+      }),
+    ]);
+    vi.spyOn(api, 'getLlmPolicy').mockRejectedValue(new Error('forbidden'));
+
+    render(<AiProvidersSection />);
+
+    await waitFor(() => expect(screen.getByText('Broken')).toBeInTheDocument());
+    const radio = screen.getByLabelText('Set as default') as HTMLInputElement;
+    expect(radio).toBeDisabled();
+  });
+
+  it('optimistically clears the previous default when pinning a new one', async () => {
+    vi.spyOn(api, 'listLlmConnectors').mockResolvedValue([
+      makeConnector({ id: 1, user_id: 42, display_name: 'A', is_default: true }),
+      makeConnector({ id: 2, user_id: 42, display_name: 'B', is_default: false }),
+    ]);
+    vi.spyOn(api, 'getLlmPolicy').mockRejectedValue(new Error('forbidden'));
+    vi.spyOn(api, 'setLlmConnectorDefault').mockResolvedValue(
+      makeConnector({ id: 2, user_id: 42, display_name: 'B', is_default: true }),
+    );
+
+    render(<AiProvidersSection />);
+
+    await waitFor(() => expect(screen.getByText('B')).toBeInTheDocument());
+    fireEvent.click(screen.getByLabelText('Set as default'));
+
+    // After the optimistic update, the Default badge should sit next to B, not A.
+    await waitFor(() => {
+      const badge = screen.getByText('Default');
+      // Badge is right beside the display name — walk up to the card.
+      const card = badge.closest('.card');
+      expect(card?.textContent).toContain('B');
+    });
+  });
+
+  it('deletes after confirmation', async () => {
+    vi.spyOn(api, 'listLlmConnectors').mockResolvedValue([makeConnector()]);
+    vi.spyOn(api, 'getLlmPolicy').mockRejectedValue(new Error('nope'));
+    const delSpy = vi.spyOn(api, 'deleteLlmConnector').mockResolvedValue();
+    vi.spyOn(window, 'confirm').mockReturnValue(true);
+
+    render(<AiProvidersSection />);
+
+    await waitFor(() => expect(screen.getByText('My OpenAI')).toBeInTheDocument());
+    fireEvent.click(screen.getByRole('button', { name: 'Delete' }));
+    await waitFor(() => expect(delSpy).toHaveBeenCalledWith(1));
+  });
+});
diff --git a/dashboard/lib/__tests__/api.test.ts b/dashboard/lib/__tests__/api.test.ts
index b7126f09..655bbe1c 100644
--- a/dashboard/lib/__tests__/api.test.ts
+++ b/dashboard/lib/__tests__/api.test.ts
@@ -520,6 +520,127 @@ describe('ApiClient', () => {
     });
   });
 
+  describe('LLM Gateway API', () => {
+    beforeEach(() => {
+      api.setToken('test-token');
+    });
+
+    it('lists per-DJ connectors', async () => {
+      mockFetch.mockResolvedValueOnce({
+        ok: true,
+        json: async () => [
+          {
+            id: 1,
+            user_id: 42,
+            connector_type: 'openai_apikey',
+            display_name: 'My OpenAI',
+            status: 'active',
+            base_url_plain: null,
+            model_hint: 'gpt-5-mini',
+            created_at: '2026-01-01T00:00:00Z',
+            updated_at: '2026-01-01T00:00:00Z',
+            last_used_at: null,
+            last_error: null,
+          },
+        ],
+      });
+
+      const result = await api.listLlmConnectors();
+      expect(result).toHaveLength(1);
+      expect(result[0].connector_type).toBe('openai_apikey');
+    });
+
+    it('creates a connector via POST', async () => {
+      mockFetch.mockResolvedValueOnce({
+        ok: true,
+        json: async () => ({
+          id: 2,
+          user_id: 42,
+          connector_type: 'openai_compatible',
+          display_name: 'Hermes',
+          status: 'active',
+          base_url_plain: 'http://127.0.0.1:11434/v1',
+          model_hint: null,
+          created_at: '2026-01-01T00:00:00Z',
+          updated_at: '2026-01-01T00:00:00Z',
+          last_used_at: null,
+          last_error: null,
+        }),
+      });
+
+      const result = await api.createLlmConnector({
+        connector_type: 'openai_compatible',
+        display_name: 'Hermes',
+        base_url: 'http://127.0.0.1:11434/v1',
+        bearer: null,
+        api_key: null,
+        model_hint: null,
+      });
+      expect(result.id).toBe(2);
+
+      const [, options] = mockFetch.mock.calls[0];
+      expect(options.method).toBe('POST');
+    });
+
+    it('updates admin LLM policy via PATCH', async () => {
+      mockFetch.mockResolvedValueOnce({
+        ok: true,
+        json: async () => ({
+          llm_apikey_connectors_enabled: false,
+          llm_compatible_connector_enabled: true,
+          llm_default_connector_id: null,
+        }),
+      });
+      const result = await api.updateAdminLlmPolicy({
+        llm_apikey_connectors_enabled: false,
+        llm_compatible_connector_enabled: null,
+        llm_default_connector_id: null,
+        clear_default: true,
+      });
+      expect(result.llm_apikey_connectors_enabled).toBe(false);
+
+      const [, options] = mockFetch.mock.calls[0];
+      expect(options.method).toBe('PATCH');
+    });
+
+    it('fetches admin usage with days param', async () => {
+      mockFetch.mockResolvedValueOnce({
+        ok: true,
+        json: async () => ({ days: 30, rows: [] }),
+      });
+
+      await api.getAdminLlmUsage(30);
+      const [url] = mockFetch.mock.calls[0];
+      expect(url).toContain('/api/admin/llm/usage?days=30');
+    });
+
+    it('sets a connector monthly cap via PATCH', async () => {
+      mockFetch.mockResolvedValueOnce({
+        ok: true,
+        json: async () => ({ id: 7, monthly_token_cap: 5000, current_month_tokens: 200 }),
+      });
+
+      const result = await api.setAdminLlmConnectorCap(7, 5000);
+      expect(result.monthly_token_cap).toBe(5000);
+
+      const [url, options] = mockFetch.mock.calls[0];
+      expect(url).toContain('/api/admin/llm/connectors/7/cap');
+      expect(options.method).toBe('PATCH');
+      expect(JSON.parse(options.body)).toEqual({ monthly_token_cap: 5000 });
+    });
+
+    it('clears a connector cap by passing null', async () => {
+      mockFetch.mockResolvedValueOnce({
+        ok: true,
+        json: async () => ({ id: 7, monthly_token_cap: null, current_month_tokens: 0 }),
+      });
+
+      await api.setAdminLlmConnectorCap(7, null);
+      const [, options] = mockFetch.mock.calls[0];
+      expect(JSON.parse(options.body)).toEqual({ monthly_token_cap: null });
+    });
+  });
+
   describe('Activity Log API', () => {
     beforeEach(() => {
       api.setToken('test-token');
@@ -2293,6 +2414,107 @@ describe('ApiClient', () => {
     });
   });
 
+  describe('streamConnectorTest', () => {
+    it('parses SSE data frames and invokes onChunk per frame', async () => {
+      const sse =
+        'data: {"text_delta":"Hi","done":false}\n\n' +
+        'data: {"text_delta":" there","done":false}\n\n' +
+        'data: {"text_delta":"","stop_reason":"end_turn","done":true}\n\n';
+      const encoder = new TextEncoder();
+      const stream = new ReadableStream<Uint8Array>({
+        start(controller) {
+          controller.enqueue(encoder.encode(sse));
+          controller.close();
+        },
+      });
+      const fetchMock = vi.spyOn(global, 'fetch').mockResolvedValueOnce(
+        new Response(stream, {
+          status: 200,
+          headers: { 'Content-Type': 'text/event-stream' },
+        }),
+      );
+
+      api.setToken('jwt-token');
+      const chunks: Array<{ text_delta?: string; done?: boolean }> = [];
+      await api.streamConnectorTest(7, (c) => chunks.push(c));
+
+      expect(chunks.map((c) => c.text_delta).join('')).toBe('Hi there');
+      expect(chunks.at(-1)?.done).toBe(true);
+
+      const init = fetchMock.mock.calls[0][1] as RequestInit;
+      const headers = new Headers(init.headers);
+      expect(headers.get('Authorization')).toBe('Bearer jwt-token');
+      expect(init.method).toBe('POST');
+    });
+
+    it('parses CRLF-delimited SSE frames, including event: error (#354)', async () => {
+      // A spec-compliant server or proxy may frame SSE with CRLF (\r\n\r\n)
+      // rather than LF. The parser must split frames and lines on either, or it
+      // silently drops every frame — including the typed `event: error`.
+      const sse =
+        'data: {"text_delta":"Hi","done":false}\r\n\r\n' +
+        'event: error\r\ndata: {"code":"ProviderUnavailable"}\r\n\r\n';
+      const encoder = new TextEncoder();
+      const stream = new ReadableStream<Uint8Array>({
+        start(controller) {
+          controller.enqueue(encoder.encode(sse));
+          controller.close();
+        },
+      });
+      vi.spyOn(global, 'fetch').mockResolvedValueOnce(
+        new Response(stream, {
+          status: 200,
+          headers: { 'Content-Type': 'text/event-stream' },
+        }),
+      );
+
+      api.setToken('jwt-token');
+      const chunks: Array<{ text_delta?: string }> = [];
+      await expect(
+        api.streamConnectorTest(7, (c) => chunks.push(c)),
+      ).rejects.toThrowError(/ProviderUnavailable/);
+      // The CRLF-framed data frame before the error was still parsed.
+      expect(chunks.map((c) => c.text_delta).join('')).toBe('Hi');
+    });
+
+    it('throws ApiError on non-OK response', async () => {
+      vi.spyOn(global, 'fetch').mockResolvedValueOnce(
+        new Response('nope', { status: 500 }),
+      );
+      api.setToken('jwt-token');
+      await expect(api.streamConnectorTest(7, () => {})).rejects.toBeInstanceOf(ApiError);
+    });
+
+    it('surfaces an SSE event: error frame as a thrown ApiError (#379)', async () => {
+      // The backend emits `event: error` + a sanitised `{code}` data line for
+      // typed gateway failures; the consumer must reject, not swallow it.
+      const sse =
+        'data: {"text_delta":"partial","done":false}\n\n' +
+        'event: error\ndata: {"code":"ProviderUnavailable"}\n\n';
+      const encoder = new TextEncoder();
+      const stream = new ReadableStream<Uint8Array>({
+        start(controller) {
+          controller.enqueue(encoder.encode(sse));
+          controller.close();
+        },
+      });
+      vi.spyOn(global, 'fetch').mockResolvedValueOnce(
+        new Response(stream, {
+          status: 200,
+          headers: { 'Content-Type': 'text/event-stream' },
+        }),
+      );
+
+      api.setToken('jwt-token');
+      const chunks: Array<{ text_delta?: string }> = [];
+      await expect(
+        api.streamConnectorTest(7, (c) => chunks.push(c)),
+      ).rejects.toThrowError(/ProviderUnavailable/);
+      // The leading valid chunk was still delivered before the error surfaced.
+      expect(chunks.map((c) => c.text_delta).join('')).toBe('partial');
+    });
+  });
+
   describe('frictionless join api', () => {
     it('getJoinConfig hits the public collect endpoint', async () => {
       mockFetch.mockResolvedValueOnce(
diff --git a/dashboard/lib/api-types.generated.ts b/dashboard/lib/api-types.generated.ts
index e6af9f56..72bc6c28 100644
--- a/dashboard/lib/api-types.generated.ts
+++ b/dashboard/lib/api-types.generated.ts
@@ -169,6 +169,149 @@ export interface paths {
         patch?: never;
         trace?: never;
     };
+    "/api/admin/llm/audit": {
+        parameters: {
+            query?: never;
+            header?: never;
+            path?: never;
+            cookie?: never;
+        };
+        /**
+         * List Audit Events
+         * @description Browse the LLM audit trail (admin-only).
+         *
+         *     Read-only view over ``llm_audit_event`` with optional filters and
+         *     pagination. The target connector's display name is joined in — credential
+         *     material is never read or returned.
+         */
+        get: operations["list_audit_events_api_admin_llm_audit_get"];
+        put?: never;
+        post?: never;
+        delete?: never;
+        options?: never;
+        head?: never;
+        patch?: never;
+        trace?: never;
+    };
+    "/api/admin/llm/audit.csv": {
+        parameters: {
+            query?: never;
+            header?: never;
+            path?: never;
+            cookie?: never;
+        };
+        /**
+         * Export Audit Events Csv
+         * @description Export the (filtered) audit trail as CSV (admin-only).
+         *
+         *     Honors the same filters as ``GET /audit``. Capped at
+         *     ``_AUDIT_CSV_ROW_CAP`` rows to avoid unbounded streaming. Columns:
+         *     timestamp, actor, event_type, target_connector, notes. Never includes
+         *     credential material.
+         */
+        get: operations["export_audit_events_csv_api_admin_llm_audit_csv_get"];
+        put?: never;
+        post?: never;
+        delete?: never;
+        options?: never;
+        head?: never;
+        patch?: never;
+        trace?: never;
+    };
+    "/api/admin/llm/connectors": {
+        parameters: {
+            query?: never;
+            header?: never;
+            path?: never;
+            cookie?: never;
+        };
+        /** List Connectors Admin */
+        get: operations["list_connectors_admin_api_admin_llm_connectors_get"];
+        put?: never;
+        post?: never;
+        delete?: never;
+        options?: never;
+        head?: never;
+        patch?: never;
+        trace?: never;
+    };
+    "/api/admin/llm/connectors/{connector_id}/cap": {
+        parameters: {
+            query?: never;
+            header?: never;
+            path?: never;
+            cookie?: never;
+        };
+        get?: never;
+        put?: never;
+        post?: never;
+        delete?: never;
+        options?: never;
+        head?: never;
+        /**
+         * Set Connector Cap Admin
+         * @description Set or clear a connector's monthly token cap (admin-only, issue #339).
+         *
+         *     ``monthly_token_cap = null`` clears the cap (unlimited). The change is
+         *     pre-flight only: an in-flight gateway call already past its cap check is
+         *     unaffected. Pydantic enforces the non-negative bound (``ge=0``); the
+         *     service layer re-validates defensively.
+         */
+        patch: operations["set_connector_cap_admin_api_admin_llm_connectors__connector_id__cap_patch"];
+        trace?: never;
+    };
+    "/api/admin/llm/connectors/{connector_id}/revoke": {
+        parameters: {
+            query?: never;
+            header?: never;
+            path?: never;
+            cookie?: never;
+        };
+        get?: never;
+        put?: never;
+        /** Revoke Connector Admin */
+        post: operations["revoke_connector_admin_api_admin_llm_connectors__connector_id__revoke_post"];
+        delete?: never;
+        options?: never;
+        head?: never;
+        patch?: never;
+        trace?: never;
+    };
+    "/api/admin/llm/policy": {
+        parameters: {
+            query?: never;
+            header?: never;
+            path?: never;
+            cookie?: never;
+        };
+        /** Get Policy */
+        get: operations["get_policy_api_admin_llm_policy_get"];
+        put?: never;
+        post?: never;
+        delete?: never;
+        options?: never;
+        head?: never;
+        /** Patch Policy */
+        patch: operations["patch_policy_api_admin_llm_policy_patch"];
+        trace?: never;
+    };
+    "/api/admin/llm/usage": {
+        parameters: {
+            query?: never;
+            header?: never;
+            path?: never;
+            cookie?: never;
+        };
+        /** Get Usage */
+        get: operations["get_usage_api_admin_llm_usage_get"];
+        put?: never;
+        post?: never;
+        delete?: never;
+        options?: never;
+        head?: never;
+        patch?: never;
+        trace?: never;
+    };
     "/api/admin/settings": {
         parameters: {
             query?: never;
@@ -1299,24 +1442,25 @@ export interface paths {
         patch: operations["assign_kiosk_api_kiosk__kiosk_id__assign_patch"];
         trace?: never;
     };
-    "/api/public/collect/{code}": {
+    "/api/llm/connectors": {
         parameters: {
             query?: never;
             header?: never;
             path?: never;
             cookie?: never;
         };
-        /** Preview */
-        get: operations["preview_api_public_collect__code__get"];
+        /** List Connectors */
+        get: operations["list_connectors_api_llm_connectors_get"];
         put?: never;
-        post?: never;
+        /** Create Connector Endpoint */
+        post: operations["create_connector_endpoint_api_llm_connectors_post"];
         delete?: never;
         options?: never;
         head?: never;
         patch?: never;
         trace?: never;
     };
-    "/api/public/collect/{code}/enrich-preview": {
+    "/api/llm/connectors/{connector_id}": {
         parameters: {
             query?: never;
             header?: never;
@@ -1325,18 +1469,16 @@ export interface paths {
         };
         get?: never;
         put?: never;
-        /**
-         * Enrich Preview
-         * @description Lightweight Beatport BPM/key lookup for search-time vibes — no DB writes.
-         */
-        post: operations["enrich_preview_api_public_collect__code__enrich_preview_post"];
-        delete?: never;
+        post?: never;
+        /** Delete Connector Endpoint */
+        delete: operations["delete_connector_endpoint_api_llm_connectors__connector_id__delete"];
         options?: never;
         head?: never;
-        patch?: never;
+        /** Update Connector Metadata */
+        patch: operations["update_connector_metadata_api_llm_connectors__connector_id__patch"];
         trace?: never;
     };
-    "/api/public/collect/{code}/guest/ensure-name": {
+    "/api/llm/connectors/{connector_id}/credentials": {
         parameters: {
             query?: never;
             header?: never;
@@ -1344,148 +1486,196 @@ export interface paths {
             cookie?: never;
         };
         get?: never;
-        put?: never;
-        /**
-         * Ensure Name
-         * @description Frictionless-join name management. Auto-generates a nickname when none is
-         *     set, or applies a manual rename. Gated on event.frictionless_join so it can
-         *     never bypass email verification on a hardened (non-frictionless) event.
-         *
-         *     Not anonymous: requires the `wrzdj_human` HMAC-signed verified-human cookie
-         *     (set via Turnstile) through `require_verified_human_soft`. Calls without a
-         *     resolvable verified-human guest are rejected with 403
-         *     `human_verification_required`.
-         */
-        post: operations["ensure_name_api_public_collect__code__guest_ensure_name_post"];
+        /** Rotate Connector Credentials */
+        put: operations["rotate_connector_credentials_api_llm_connectors__connector_id__credentials_put"];
+        post?: never;
         delete?: never;
         options?: never;
         head?: never;
         patch?: never;
         trace?: never;
     };
-    "/api/public/collect/{code}/join-config": {
+    "/api/llm/connectors/{connector_id}/default": {
         parameters: {
             query?: never;
             header?: never;
             path?: never;
             cookie?: never;
         };
+        get?: never;
+        put?: never;
         /**
-         * Join Config
-         * @description Public, unauthenticated: lets the join page decide its gate mode on load.
+         * Set Connector As Default
+         * @description Pin this connector as the DJ's explicit default (issue #336).
+         *
+         *     Atomically clears any other defaults the DJ owns before flipping this row,
+         *     so the partial unique index never sees two True rows for the same user.
+         *
+         *     Setting a disabled / auth_invalid connector as default is rejected with 400
+         *     so DJs don't silently break their own routing — a default that the gateway
+         *     would skip anyway is a footgun.
          */
-        get: operations["join_config_api_public_collect__code__join_config_get"];
-        put?: never;
-        post?: never;
-        delete?: never;
+        post: operations["set_connector_as_default_api_llm_connectors__connector_id__default_post"];
+        /**
+         * Unset Connector As Default
+         * @description Clear the explicit default — gateway resolution falls back to MRU.
+         */
+        delete: operations["unset_connector_as_default_api_llm_connectors__connector_id__default_delete"];
         options?: never;
         head?: never;
         patch?: never;
         trace?: never;
     };
-    "/api/public/collect/{code}/leaderboard": {
+    "/api/llm/connectors/{connector_id}/stream-test": {
         parameters: {
             query?: never;
             header?: never;
             path?: never;
             cookie?: never;
         };
-        /** Leaderboard */
-        get: operations["leaderboard_api_public_collect__code__leaderboard_get"];
+        get?: never;
         put?: never;
-        post?: never;
+        /**
+         * Stream Test Connector
+         * @description Stream a short sentence through the connector as ``text/event-stream``.
+         *
+         *     Validates ownership up front (404 for connectors the DJ doesn't own — never
+         *     leaks existence). Each SSE ``data:`` frame is a JSON ``ChatResponseChunk``.
+         *     On a typed gateway error an ``event: error`` frame is emitted carrying only a
+         *     sanitised code (never the upstream payload), then the stream ends. Client
+         *     disconnect cancels the upstream provider request — the gateway generator's
+         *     ``finally`` writes the counts-only call log and closes the adapter.
+         *
+         *     Unlike the public guest SSE stream (``api/sse.py``), this endpoint is
+         *     authenticated, rate-limited (10/min), and strictly bounded (max 64 output
+         *     tokens), so it holds the request-scoped DB session for the brief stream
+         *     lifetime rather than opening a detached ``SessionLocal`` — the pool-pinning
+         *     concern that drove ``api/sse.py``'s pattern applies to unauthenticated,
+         *     indefinitely-open guest connections, not a short admin health probe.
+         */
+        post: operations["stream_test_connector_api_llm_connectors__connector_id__stream_test_post"];
         delete?: never;
         options?: never;
         head?: never;
         patch?: never;
         trace?: never;
     };
-    "/api/public/collect/{code}/live-join-code": {
+    "/api/llm/connectors/{connector_id}/test": {
         parameters: {
             query?: never;
             header?: never;
             path?: never;
             cookie?: never;
         };
+        get?: never;
+        put?: never;
         /**
-         * Get Live Join Code
-         * @description Return the live join_code for an event that has entered the live phase.
+         * Test Connector
+         * @description Run a health check and return a sanitised result.
          *
-         *     Requires a verified human cookie (not email verification) so the join_code
-         *     is never leaked to unverified bots scraping /collect during the
-         *     collection-to-live transition. The join_code is otherwise revealed only
-         *     via the QR code at the event venue.
+         *     Behaviour identical to the background monitor (issue #340), so the
+         *     ``last_health_check_at`` / ``last_health_check_status`` columns and audit
+         *     rows are written the same way on every invocation regardless of trigger
+         *     source. See ``services/llm/health_check.py`` for the shared helper.
          */
-        get: operations["get_live_join_code_api_public_collect__code__live_join_code_get"];
-        put?: never;
-        post?: never;
+        post: operations["test_connector_api_llm_connectors__connector_id__test_post"];
         delete?: never;
         options?: never;
         head?: never;
         patch?: never;
         trace?: never;
     };
-    "/api/public/collect/{code}/profile": {
+    "/api/llm/feature-preferences": {
         parameters: {
             query?: never;
             header?: never;
             path?: never;
             cookie?: never;
         };
-        /** Get Profile */
-        get: operations["get_profile_api_public_collect__code__profile_get"];
+        /**
+         * List Feature Preferences
+         * @description List the DJ's per-feature connector pins (issue #337).
+         */
+        get: operations["list_feature_preferences_api_llm_feature_preferences_get"];
         put?: never;
-        /** Set Profile */
-        post: operations["set_profile_api_public_collect__code__profile_post"];
+        /**
+         * Set Feature Preference Endpoint
+         * @description Pin (or re-pin) a connector to a feature for the current DJ.
+         *
+         *     Validates connector ownership server-side (404 for IDs the DJ doesn't own,
+         *     so another DJ's connector existence is never leaked) and rejects pinning a
+         *     non-active connector (400) — the gateway would skip it anyway, so silently
+         *     accepting it is a footgun.
+         */
+        post: operations["set_feature_preference_endpoint_api_llm_feature_preferences_post"];
         delete?: never;
         options?: never;
         head?: never;
         patch?: never;
         trace?: never;
     };
-    "/api/public/collect/{code}/profile/me": {
+    "/api/llm/feature-preferences/{feature}": {
         parameters: {
             query?: never;
             header?: never;
             path?: never;
             cookie?: never;
         };
-        /** My Picks */
-        get: operations["my_picks_api_public_collect__code__profile_me_get"];
+        get?: never;
         put?: never;
         post?: never;
-        delete?: never;
+        /**
+         * Clear Feature Preference Endpoint
+         * @description Clear the DJ's pin for ``feature`` (no-op if unset). Returns the new list.
+         */
+        delete: operations["clear_feature_preference_endpoint_api_llm_feature_preferences__feature__delete"];
         options?: never;
         head?: never;
         patch?: never;
         trace?: never;
     };
-    "/api/public/collect/{code}/requests": {
+    "/api/llm/openrouter/models": {
         parameters: {
             query?: never;
             header?: never;
             path?: never;
             cookie?: never;
         };
-        get?: never;
+        /**
+         * List Openrouter Models
+         * @description Return the OpenRouter model catalogue for the model-hint dropdown.
+         *
+         *     Served from a process-wide TTL cache (refreshed hourly). The OpenRouter
+         *     ``/models`` endpoint is public, so no connector credentials are required.
+         *     Returns an empty list if the catalogue is unavailable — the frontend then
+         *     falls back to a free-text model input.
+         */
+        get: operations["list_openrouter_models_api_llm_openrouter_models_get"];
         put?: never;
-        /** Submit */
-        post: operations["submit_api_public_collect__code__requests_post"];
+        post?: never;
         delete?: never;
         options?: never;
         head?: never;
         patch?: never;
         trace?: never;
     };
-    "/api/public/collect/{code}/requests/{request_id}/preview": {
+    "/api/llm/policy": {
         parameters: {
             query?: never;
             header?: never;
             path?: never;
             cookie?: never;
         };
-        /** Request Preview */
-        get: operations["request_preview_api_public_collect__code__requests__request_id__preview_get"];
+        /**
+         * Get Dj Policy
+         * @description DJ-readable connector policy (non-sensitive subset).
+         *
+         *     The settings/ai page consumes this to fail *closed* — hiding connector
+         *     types the admin has disabled rather than showing every provider and only
+         *     discovering the block when the create call returns 403. Admin-only fields
+         *     (e.g. ``llm_default_connector_id``) are intentionally excluded.
+         */
+        get: operations["get_dj_policy_api_llm_policy_get"];
         put?: never;
         post?: never;
         delete?: never;
@@ -1494,71 +1684,71 @@ export interface paths {
         patch?: never;
         trace?: never;
     };
-    "/api/public/collect/{code}/vote": {
+    "/api/public/collect/{code}": {
         parameters: {
             query?: never;
             header?: never;
             path?: never;
             cookie?: never;
         };
-        get?: never;
+        /** Preview */
+        get: operations["preview_api_public_collect__code__get"];
         put?: never;
-        /** Vote */
-        post: operations["vote_api_public_collect__code__vote_post"];
+        post?: never;
         delete?: never;
         options?: never;
         head?: never;
         patch?: never;
         trace?: never;
     };
-    "/api/public/e/{code}/bridge-status": {
+    "/api/public/collect/{code}/enrich-preview": {
         parameters: {
             query?: never;
             header?: never;
             path?: never;
             cookie?: never;
         };
+        get?: never;
+        put?: never;
         /**
-         * Get Public Bridge Status
-         * @description Get bridge connection status for public display.
-         *
-         *     Independent of track data — returns bridge connectivity even when
-         *     no track is currently playing. Resolves by join_code: serves guest-facing
-         *     kiosk display + overlay pages.
+         * Enrich Preview
+         * @description Lightweight Beatport BPM/key lookup for search-time vibes — no DB writes.
          */
-        get: operations["get_public_bridge_status_api_public_e__code__bridge_status_get"];
-        put?: never;
-        post?: never;
+        post: operations["enrich_preview_api_public_collect__code__enrich_preview_post"];
         delete?: never;
         options?: never;
         head?: never;
         patch?: never;
         trace?: never;
     };
-    "/api/public/e/{code}/history": {
+    "/api/public/collect/{code}/guest/ensure-name": {
         parameters: {
             query?: never;
             header?: never;
             path?: never;
             cookie?: never;
         };
+        get?: never;
+        put?: never;
         /**
-         * Get Public History
-         * @description Get play history for public display.
+         * Ensure Name
+         * @description Frictionless-join name management. Auto-generates a nickname when none is
+         *     set, or applies a manual rename. Gated on event.frictionless_join so it can
+         *     never bypass email verification on a hardened (non-frictionless) event.
          *
-         *     Returns the list of tracks played during the event, newest first.
-         *     Resolves by join_code: serves guest-facing kiosk display.
+         *     Not anonymous: requires the `wrzdj_human` HMAC-signed verified-human cookie
+         *     (set via Turnstile) through `require_verified_human_soft`. Calls without a
+         *     resolvable verified-human guest are rejected with 403
+         *     `human_verification_required`.
          */
-        get: operations["get_public_history_api_public_e__code__history_get"];
-        put?: never;
-        post?: never;
+        post: operations["ensure_name_api_public_collect__code__guest_ensure_name_post"];
         delete?: never;
         options?: never;
         head?: never;
         patch?: never;
         trace?: never;
     };
-    "/api/public/e/{code}/nowplaying": {
+    "/api/public/collect/{code}/join-config": {
         parameters: {
             query?: never;
             header?: never;
@@ -1566,15 +1756,10 @@ export interface paths {
             cookie?: never;
         };
         /**
-         * Get Public Now Playing
-         * @description Get current now-playing track for public display.
-         *
-         *     Returns the track currently playing from StageLinQ, or None if nothing playing.
-         *
-         *     Resolves by join_code: this endpoint serves the kiosk display + OBS overlay
-         *     pages, which route by join_code per the post-PR-#324 public/guest URL contract.
+         * Join Config
+         * @description Public, unauthenticated: lets the join page decide its gate mode on load.
          */
-        get: operations["get_public_now_playing_api_public_e__code__nowplaying_get"];
+        get: operations["join_config_api_public_collect__code__join_config_get"];
         put?: never;
         post?: never;
         delete?: never;
@@ -1583,7 +1768,207 @@ export interface paths {
         patch?: never;
         trace?: never;
     };
-    "/api/public/events/{code}": {
+    "/api/public/collect/{code}/leaderboard": {
+        parameters: {
+            query?: never;
+            header?: never;
+            path?: never;
+            cookie?: never;
+        };
+        /** Leaderboard */
+        get: operations["leaderboard_api_public_collect__code__leaderboard_get"];
+        put?: never;
+        post?: never;
+        delete?: never;
+        options?: never;
+        head?: never;
+        patch?: never;
+        trace?: never;
+    };
+    "/api/public/collect/{code}/live-join-code": {
+        parameters: {
+            query?: never;
+            header?: never;
+            path?: never;
+            cookie?: never;
+        };
+        /**
+         * Get Live Join Code
+         * @description Return the live join_code for an event that has entered the live phase.
+         *
+         *     Requires a verified human cookie (not email verification) so the join_code
+         *     is never leaked to unverified bots scraping /collect during the
+         *     collection-to-live transition. The join_code is otherwise revealed only
+         *     via the QR code at the event venue.
+         */
+        get: operations["get_live_join_code_api_public_collect__code__live_join_code_get"];
+        put?: never;
+        post?: never;
+        delete?: never;
+        options?: never;
+        head?: never;
+        patch?: never;
+        trace?: never;
+    };
+    "/api/public/collect/{code}/profile": {
+        parameters: {
+            query?: never;
+            header?: never;
+            path?: never;
+            cookie?: never;
+        };
+        /** Get Profile */
+        get: operations["get_profile_api_public_collect__code__profile_get"];
+        put?: never;
+        /** Set Profile */
+        post: operations["set_profile_api_public_collect__code__profile_post"];
+        delete?: never;
+        options?: never;
+        head?: never;
+        patch?: never;
+        trace?: never;
+    };
+    "/api/public/collect/{code}/profile/me": {
+        parameters: {
+            query?: never;
+            header?: never;
+            path?: never;
+            cookie?: never;
+        };
+        /** My Picks */
+        get: operations["my_picks_api_public_collect__code__profile_me_get"];
+        put?: never;
+        post?: never;
+        delete?: never;
+        options?: never;
+        head?: never;
+        patch?: never;
+        trace?: never;
+    };
+    "/api/public/collect/{code}/requests": {
+        parameters: {
+            query?: never;
+            header?: never;
+            path?: never;
+            cookie?: never;
+        };
+        get?: never;
+        put?: never;
+        /** Submit */
+        post: operations["submit_api_public_collect__code__requests_post"];
+        delete?: never;
+        options?: never;
+        head?: never;
+        patch?: never;
+        trace?: never;
+    };
+    "/api/public/collect/{code}/requests/{request_id}/preview": {
+        parameters: {
+            query?: never;
+            header?: never;
+            path?: never;
+            cookie?: never;
+        };
+        /** Request Preview */
+        get: operations["request_preview_api_public_collect__code__requests__request_id__preview_get"];
+        put?: never;
+        post?: never;
+        delete?: never;
+        options?: never;
+        head?: never;
+        patch?: never;
+        trace?: never;
+    };
+    "/api/public/collect/{code}/vote": {
+        parameters: {
+            query?: never;
+            header?: never;
+            path?: never;
+            cookie?: never;
+        };
+        get?: never;
+        put?: never;
+        /** Vote */
+        post: operations["vote_api_public_collect__code__vote_post"];
+        delete?: never;
+        options?: never;
+        head?: never;
+        patch?: never;
+        trace?: never;
+    };
+    "/api/public/e/{code}/bridge-status": {
+        parameters: {
+            query?: never;
+            header?: never;
+            path?: never;
+            cookie?: never;
+        };
+        /**
+         * Get Public Bridge Status
+         * @description Get bridge connection status for public display.
+         *
+         *     Independent of track data — returns bridge connectivity even when
+         *     no track is currently playing. Resolves by join_code: serves guest-facing
+         *     kiosk display + overlay pages.
+         */
+        get: operations["get_public_bridge_status_api_public_e__code__bridge_status_get"];
+        put?: never;
+        post?: never;
+        delete?: never;
+        options?: never;
+        head?: never;
+        patch?: never;
+        trace?: never;
+    };
+    "/api/public/e/{code}/history": {
+        parameters: {
+            query?: never;
+            header?: never;
+            path?: never;
+            cookie?: never;
+        };
+        /**
+         * Get Public History
+         * @description Get play history for public display.
+         *
+         *     Returns the list of tracks played during the event, newest first.
+         *     Resolves by join_code: serves guest-facing kiosk display.
+         */
+        get: operations["get_public_history_api_public_e__code__history_get"];
+        put?: never;
+        post?: never;
+        delete?: never;
+        options?: never;
+        head?: never;
+        patch?: never;
+        trace?: never;
+    };
+    "/api/public/e/{code}/nowplaying": {
+        parameters: {
+            query?: never;
+            header?: never;
+            path?: never;
+            cookie?: never;
+        };
+        /**
+         * Get Public Now Playing
+         * @description Get current now-playing track for public display.
+         *
+         *     Returns the track currently playing from StageLinQ, or None if nothing playing.
+         *
+         *     Resolves by join_code: this endpoint serves the kiosk display + OBS overlay
+         *     pages, which route by join_code per the post-PR-#324 public/guest URL contract.
+         */
+        get: operations["get_public_now_playing_api_public_e__code__nowplaying_get"];
+        put?: never;
+        post?: never;
+        delete?: never;
+        options?: never;
+        head?: never;
+        patch?: never;
+        trace?: never;
+    };
+    "/api/public/events/{code}": {
         parameters: {
             query?: never;
             header?: never;
@@ -1701,6 +2086,14 @@ export interface paths {
          *     unauthenticated DoS (unlimited long-lived connections exhausting FDs)
          *     and passive eavesdropping via 6-char event-code brute force.
          *
+         *     POOL SAFETY (issue #356): the one-shot existence/auth check runs inside a
+         *     short-lived ``with SessionLocal()`` block whose pooled connection is
+         *     returned BEFORE the EventSourceResponse is returned. An EventSource
+         *     connection can stay open indefinitely, so we must NOT hold a
+         *     request-scoped ``get_db`` session across the stream lifetime — doing so
+         *     pinned one pooled connection per open stream and exhausted the QueuePool
+         *     (size 5 + overflow 10 = 15 connections) under modest guest load.
+         *
          *     Event types:
          *     - request_created: New request submitted
          *     - request_status_changed: Request status update
@@ -2019,6 +2412,58 @@ export interface paths {
         patch?: never;
         trace?: never;
     };
+    "/api/setbuilder/sets": {
+        parameters: {
+            query?: never;
+            header?: never;
+            path?: never;
+            cookie?: never;
+        };
+        /**
+         * List Sets
+         * @description List the current DJ's sets, newest first.
+         */
+        get: operations["list_sets_api_setbuilder_sets_get"];
+        put?: never;
+        /**
+         * Create Set
+         * @description Create a new empty set owned by the current DJ.
+         */
+        post: operations["create_set_api_setbuilder_sets_post"];
+        delete?: never;
+        options?: never;
+        head?: never;
+        patch?: never;
+        trace?: never;
+    };
+    "/api/setbuilder/sets/{set_id}": {
+        parameters: {
+            query?: never;
+            header?: never;
+            path?: never;
+            cookie?: never;
+        };
+        /**
+         * Get Set
+         * @description Get one of the current DJ's sets, or 404.
+         */
+        get: operations["get_set_api_setbuilder_sets__set_id__get"];
+        put?: never;
+        post?: never;
+        /**
+         * Delete Set
+         * @description Delete one of the current DJ's sets, or 404.
+         */
+        delete: operations["delete_set_api_setbuilder_sets__set_id__delete"];
+        options?: never;
+        head?: never;
+        /**
+         * Rename Set
+         * @description Rename one of the current DJ's sets, or 404.
+         */
+        patch: operations["rename_set_api_setbuilder_sets__set_id__patch"];
+        trace?: never;
+    };
     "/api/tidal/auth/cancel": {
         parameters: {
             query?: never;
@@ -2288,13 +2733,101 @@ export interface components {
             /** Source */
             source: string;
         };
-        /** AdminEventOut */
-        AdminEventOut: {
-            /** Code */
-            code: string;
+        /**
+         * AdminAuditOut
+         * @description Paginated audit-event browse response.
+         */
+        AdminAuditOut: {
+            /** Limit */
+            limit: number;
+            /** Offset */
+            offset: number;
+            /** Rows */
+            rows: components["schemas"]["AuditEventRow"][];
+            /** Total */
+            total: number;
+        };
+        /**
+         * AdminConnectorCapPatch
+         * @description Admin set/clear a connector's monthly token cap (issue #339).
+         *
+         *     ``monthly_token_cap`` is **required** so intent is always explicit: an
+         *     integer sets the cap, ``null`` clears it (unlimited). Omitting the field
+         *     (an empty ``{}`` body) is rejected with 422 rather than silently treated as
+         *     ``null`` — that would let an accidental no-field PATCH wipe a configured
+         *     cap. A non-null value must be a non-negative integer; ``0`` means "no
+         *     further calls this month". The upper bound is a sanity ceiling, not a
+         *     billing limit.
+         */
+        AdminConnectorCapPatch: {
+            /** Monthly Token Cap */
+            monthly_token_cap: number | null;
+        };
+        /**
+         * AdminConnectorOut
+         * @description Admin view — adds the DJ's username for display.
+         */
+        AdminConnectorOut: {
+            /** Base Url Plain */
+            base_url_plain: string | null;
             /**
-             * Created At
-             * Format: date-time
+             * Connector Type
+             * @enum {string}
+             */
+            connector_type: "openai_apikey" | "anthropic_apikey" | "openai_compatible" | "openrouter_apikey" | "xai_apikey" | "bedrock" | "azure_openai" | "gemini_apikey";
+            /**
+             * Created At
+             * Format: date-time
+             */
+            created_at: string;
+            /**
+             * Current Month Tokens
+             * @default 0
+             */
+            current_month_tokens: number;
+            /** Display Name */
+            display_name: string;
+            /** Dj Username */
+            dj_username: string;
+            /** Id */
+            id: number;
+            /**
+             * Is Default
+             * @default false
+             */
+            is_default: boolean;
+            /** Last Error */
+            last_error: string | null;
+            /** Last Health Check At */
+            last_health_check_at: string | null;
+            /** Last Health Check Status */
+            last_health_check_status: ("ok" | "auth_invalid" | "rate_limited" | "quota_exceeded" | "provider_unavailable" | "error") | null;
+            /** Last Used At */
+            last_used_at: string | null;
+            /** Model Hint */
+            model_hint: string | null;
+            /** Monthly Token Cap */
+            monthly_token_cap: number | null;
+            /**
+             * Status
+             * @enum {string}
+             */
+            status: "active" | "auth_invalid" | "disabled";
+            /**
+             * Updated At
+             * Format: date-time
+             */
+            updated_at: string;
+            /** User Id */
+            user_id: number;
+        };
+        /** AdminEventOut */
+        AdminEventOut: {
+            /** Code */
+            code: string;
+            /**
+             * Created At
+             * Format: date-time
              */
             created_at: string;
             /**
@@ -2320,6 +2853,40 @@ export interface components {
              */
             request_count: number;
         };
+        /** AdminPolicyOut */
+        AdminPolicyOut: {
+            /** Llm Apikey Connectors Enabled */
+            llm_apikey_connectors_enabled: boolean;
+            /** Llm Call Log Retention Days */
+            llm_call_log_retention_days: number;
+            /** Llm Compatible Connector Enabled */
+            llm_compatible_connector_enabled: boolean;
+            /** Llm Default Connector Id */
+            llm_default_connector_id: number | null;
+        };
+        /** AdminPolicyPatch */
+        AdminPolicyPatch: {
+            /**
+             * Clear Default
+             * @default false
+             */
+            clear_default: boolean;
+            /** Llm Apikey Connectors Enabled */
+            llm_apikey_connectors_enabled?: boolean | null;
+            /** Llm Call Log Retention Days */
+            llm_call_log_retention_days?: number | null;
+            /** Llm Compatible Connector Enabled */
+            llm_compatible_connector_enabled?: boolean | null;
+            /** Llm Default Connector Id */
+            llm_default_connector_id?: number | null;
+        };
+        /** AdminUsageOut */
+        AdminUsageOut: {
+            /** Days */
+            days: number;
+            /** Rows */
+            rows: components["schemas"]["UsageRow"][];
+        };
         /** AdminUserCreate */
         AdminUserCreate: {
             /** Password */
@@ -2362,6 +2929,34 @@ export interface components {
             /** Role */
             role?: string | null;
         };
+        /**
+         * AuditEventRow
+         * @description A single audit-trail row with joined display labels.
+         *
+         *     Never includes credential material — only the target connector's
+         *     human-readable display name (joined from ``llm_connectors``).
+         */
+        AuditEventRow: {
+            /** Actor User Id */
+            actor_user_id: number;
+            /** Actor Username */
+            actor_username: string;
+            /**
+             * Created At
+             * Format: date-time
+             */
+            created_at: string;
+            /** Event Type */
+            event_type: string;
+            /** Id */
+            id: number;
+            /** Notes */
+            notes: string | null;
+            /** Target Connector Display Name */
+            target_connector_display_name: string | null;
+            /** Target Connector Id */
+            target_connector_id: number | null;
+        };
         /**
          * BeatportEventSettings
          * @description Beatport sync settings for an event.
@@ -2805,6 +3400,156 @@ export interface components {
             /** Request Id */
             request_id: number;
         };
+        /**
+         * ConnectorCreate
+         * @description Provider-agnostic create payload.
+         *
+         *     Field requirements vary by ``connector_type``:
+         *
+         *     - ``openai_apikey`` / ``anthropic_apikey`` / ``openrouter_apikey`` /
+         *       ``xai_apikey`` / ``gemini_apikey``: ``api_key`` required; ``base_url``
+         *       and ``bearer`` are ignored.
+         *     - ``openai_compatible``: ``base_url`` required; ``bearer`` optional;
+         *       ``api_key`` is ignored.
+         *     - ``bedrock``: ``aws_access_key_id``, ``aws_secret_access_key``,
+         *       ``aws_region`` and ``aws_model_id`` required; other fields ignored.
+         *     - ``azure_openai``: ``api_key``, ``azure_resource_name``,
+         *       ``azure_deployment_name`` and ``azure_api_version`` all required.
+         *
+         *     The combination is enforced by :meth:`_require_credentials_for_type`.
+         *     See ``build_create_payload`` in ``services/llm/connector_storage.py``
+         *     for the full validation flow (including key shape checks).
+         */
+        ConnectorCreate: {
+            /** Api Key */
+            api_key?: string | null;
+            /** Aws Access Key Id */
+            aws_access_key_id?: string | null;
+            /** Aws Model Id */
+            aws_model_id?: string | null;
+            /** Aws Region */
+            aws_region?: string | null;
+            /** Aws Secret Access Key */
+            aws_secret_access_key?: string | null;
+            /** Azure Api Version */
+            azure_api_version?: string | null;
+            /** Azure Deployment Name */
+            azure_deployment_name?: string | null;
+            /** Azure Resource Name */
+            azure_resource_name?: string | null;
+            /** Base Url */
+            base_url?: string | null;
+            /** Bearer */
+            bearer?: string | null;
+            /**
+             * Connector Type
+             * @enum {string}
+             */
+            connector_type: "openai_apikey" | "anthropic_apikey" | "openai_compatible" | "openrouter_apikey" | "xai_apikey" | "bedrock" | "azure_openai" | "gemini_apikey";
+            /** Display Name */
+            display_name: string;
+            /** Model Hint */
+            model_hint?: string | null;
+        };
+        /**
+         * ConnectorCredentialsRotate
+         * @description Rotation payload — at least one credential field must be supplied.
+         *
+         *     Field semantics mirror :class:`ConnectorCreate`. The actual field required
+         *     depends on the connector being rotated (validated in ``rotate_credentials``).
+         */
+        ConnectorCredentialsRotate: {
+            /** Api Key */
+            api_key?: string | null;
+            /** Aws Access Key Id */
+            aws_access_key_id?: string | null;
+            /** Aws Model Id */
+            aws_model_id?: string | null;
+            /** Aws Region */
+            aws_region?: string | null;
+            /** Aws Secret Access Key */
+            aws_secret_access_key?: string | null;
+            /** Azure Api Version */
+            azure_api_version?: string | null;
+            /** Azure Deployment Name */
+            azure_deployment_name?: string | null;
+            /** Azure Resource Name */
+            azure_resource_name?: string | null;
+            /** Base Url */
+            base_url?: string | null;
+            /** Bearer */
+            bearer?: string | null;
+        };
+        /**
+         * ConnectorOut
+         * @description Public-safe connector view — never includes the credential blob.
+         */
+        ConnectorOut: {
+            /** Base Url Plain */
+            base_url_plain: string | null;
+            /**
+             * Connector Type
+             * @enum {string}
+             */
+            connector_type: "openai_apikey" | "anthropic_apikey" | "openai_compatible" | "openrouter_apikey" | "xai_apikey" | "bedrock" | "azure_openai" | "gemini_apikey";
+            /**
+             * Created At
+             * Format: date-time
+             */
+            created_at: string;
+            /** Display Name */
+            display_name: string;
+            /** Id */
+            id: number;
+            /**
+             * Is Default
+             * @default false
+             */
+            is_default: boolean;
+            /** Last Error */
+            last_error: string | null;
+            /** Last Health Check At */
+            last_health_check_at: string | null;
+            /** Last Health Check Status */
+            last_health_check_status: ("ok" | "auth_invalid" | "rate_limited" | "quota_exceeded" | "provider_unavailable" | "error") | null;
+            /** Last Used At */
+            last_used_at: string | null;
+            /** Model Hint */
+            model_hint: string | null;
+            /** Monthly Token Cap */
+            monthly_token_cap: number | null;
+            /**
+             * Status
+             * @enum {string}
+             */
+            status: "active" | "auth_invalid" | "disabled";
+            /**
+             * Updated At
+             * Format: date-time
+             */
+            updated_at: string;
+            /** User Id */
+            user_id: number;
+        };
+        /**
+         * ConnectorPatch
+         * @description Metadata-only patch (no credential rotation here).
+         */
+        ConnectorPatch: {
+            /** Display Name */
+            display_name?: string | null;
+            /** Model Hint */
+            model_hint?: string | null;
+        };
+        /** ConnectorTestResult */
+        ConnectorTestResult: {
+            /** Error Code */
+            error_code: string | null;
+            /** Message */
+            message: string | null;
+            /** Ok */
+            ok: boolean;
+        };
         /**
          * DisplaySettingsResponse
          * @description Response for display settings update.
@@ -2847,6 +3592,28 @@ export interface components {
             /** Requests Open */
             requests_open?: boolean | null;
         };
+        /**
+         * DjPolicyOut
+         * @description DJ-readable connector policy — the non-sensitive subset of the admin
+         *     policy surface.
+         *
+         *     Lets the settings/ai page fail *closed*: a normal DJ can learn which
+         *     connector types the admin has enabled (so disallowed providers are hidden
+         *     in the picker) without exposing admin-only fields such as
+         *     ``llm_default_connector_id``.
+         *
+         *     ``allowed_connector_types`` is the pre-computed set of connector types a DJ
+         *     may create given the two toggles, so the frontend doesn't have to hard-code
+         *     the api-key-vs-compatible mapping.
+         */
+        DjPolicyOut: {
+            /** Allowed Connector Types */
+            allowed_connector_types: ("openai_apikey" | "anthropic_apikey" | "openai_compatible" | "openrouter_apikey" | "xai_apikey" | "bedrock" | "azure_openai" | "gemini_apikey")[];
+            /** Llm Apikey Connectors Enabled */
+            llm_apikey_connectors_enabled: boolean;
+            /** Llm Compatible Connector Enabled */
+            llm_compatible_connector_enabled: boolean;
+        };
         /** EnrichPreviewItem */
         EnrichPreviewItem: {
             /** Artist */
@@ -3012,6 +3779,42 @@ export interface components {
             /** Name */
             name?: string | null;
         };
+        /**
+         * FeaturePreferenceOut
+         * @description A single per-feature connector pin (issue #337).
+         */
+        FeaturePreferenceOut: {
+            /** Connector Id */
+            connector_id: number;
+            /**
+             * Feature
+             * @enum {string}
+             */
+            feature: "recommendation" | "set_builder";
+        };
+        /**
+         * FeaturePreferenceSet
+         * @description Set/change a per-feature pin. Upsert — replaces any existing pin.
+         */
+        FeaturePreferenceSet: {
+            /** Connector Id */
+            connector_id: number;
+            /**
+             * Feature
+             * @enum {string}
+             */
+            feature: "recommendation" | "set_builder";
+        };
+        /**
+         * FeaturePreferencesListOut
+         * @description All of a DJ's per-feature pins + the catalogue of pinnable features.
+         */
+        FeaturePreferencesListOut: {
+            /** Known Features */
+            known_features: ("recommendation" | "set_builder")[];
+            /** Preferences */
+            preferences: components["schemas"]["FeaturePreferenceOut"][];
+        };
         /** GuestNowPlaying */
         GuestNowPlaying: {
             /** Album Art Url */
@@ -3767,6 +4570,102 @@ export interface components {
             catalog_search: components["schemas"]["CapabilityStatus"];
             playlist_sync: components["schemas"]["CapabilityStatus"];
         };
+        /**
+         * SetCreate
+         * @description Body for creating a new (empty) set.
+         */
+        SetCreate: {
+            /** Event Id */
+            event_id?: number | null;
+            /** Name */
+            name: string;
+        };
+        /**
+         * SetDetail
+         * @description Full set record (Phase 0: no slot/curve expansion yet).
+         */
+        SetDetail: {
+            /** Bpm Ceiling */
+            bpm_ceiling: number | null;
+            /** Bpm Floor */
+            bpm_floor: number | null;
+            /**
+             * Created At
+             * Format: date-time
+             */
+            created_at: string;
+            /** Event Id */
+            event_id: number | null;
+            /** Exported At */
+            exported_at: string | null;
+            /** Id */
+            id: number;
+            /** Key Strictness */
+            key_strictness: number;
+            /** Name */
+            name: string;
+            /**
+             * Sharing Mode
+             * @enum {string}
+             */
+            sharing_mode: "private" | "invite_only";
+            /**
+             * Status
+             * @enum {string}
+             */
+            status: "draft" | "locked" | "exported";
+            /** Target Duration Sec */
+            target_duration_sec: number | null;
+            /** Tidal Playlist Id */
+            tidal_playlist_id: string | null;
+            /**
+             * Updated At
+             * Format: date-time
+             */
+            updated_at: string;
+            /** Vibe Theme */
+            vibe_theme: string | null;
+        };
+        /**
+         * SetRename
+         * @description Body for renaming a set.
+         */
+        SetRename: {
+            /** Name */
+            name: string;
+        };
+        /**
+         * SetSummary
+         * @description Set list item (no children).
+         */
+        SetSummary: {
+            /**
+             * Created At
+             * Format: date-time
+             */
+            created_at: string;
+            /** Event Id */
+            event_id: number | null;
+            /** Id */
+            id: number;
+            /** Name */
+            name: string;
+            /**
+             * Sharing Mode
+             * @enum {string}
+             */
+            sharing_mode: "private" | "invite_only";
+            /**
+             * Status
+             * @enum {string}
+             */
+            status: "draft" | "locked" | "exported";
+            /**
+             * Updated At
+             * Format: date-time
+             */
+            updated_at: string;
+        };
         /** StatusMessageResponse */
         StatusMessageResponse: {
             /** Message */
@@ -3995,6 +4894,30 @@ export interface components {
             /** Tidal Sync Enabled */
             tidal_sync_enabled?: boolean | null;
         };
+        /** UsageRow */
+        UsageRow: {
+            /** Connector Id */
+            connector_id: number;
+            /**
+             * Connector Type
+             * @enum {string}
+             */
+            connector_type: "openai_apikey" | "anthropic_apikey" | "openai_compatible" | "openrouter_apikey" | "xai_apikey" | "bedrock" | "azure_openai" | "gemini_apikey";
+            /** Display Name */
+            display_name: string;
+            /** Dj Username */
+            dj_username: string;
+            /** Error Count */
+            error_count: number;
+            /** Error Rate */
+            error_rate: number;
+            /** Total Calls */
+            total_calls: number;
+            /** Total Tokens In */
+            total_tokens_in: number;
+            /** Total Tokens Out */
+            total_tokens_out: number;
+        };
         /** UserOut */
         UserOut: {
             /**
@@ -4403,9 +5326,16 @@ export interface operations {
             };
         };
     };
-    admin_get_settings_api_admin_settings_get: {
+    list_audit_events_api_admin_llm_audit_get: {
         parameters: {
-            query?: never;
+            query?: {
+                event_type?: string | null;
+                actor_user_id?: number | null;
+                target_connector_id?: number | null;
+                days?: number;
+                limit?: number;
+                offset?: number;
+            };
             header?: never;
             path?: never;
             cookie?: never;
@@ -4418,31 +5348,41 @@ export interface operations {
                     [name: string]: unknown;
                 };
                 content: {
-                    "application/json": components["schemas"]["SystemSettingsOut"];
+                    "application/json": components["schemas"]["AdminAuditOut"];
+                };
+            };
+            /** @description Validation Error */
+            422: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["HTTPValidationError"];
                 };
             };
         };
     };
-    admin_update_settings_api_admin_settings_patch: {
+    export_audit_events_csv_api_admin_llm_audit_csv_get: {
         parameters: {
-            query?: never;
+            query?: {
+                event_type?: string | null;
+                actor_user_id?: number | null;
+                target_connector_id?: number | null;
+                days?: number;
+            };
             header?: never;
             path?: never;
             cookie?: never;
         };
-        requestBody: {
-            content: {
-                "application/json": components["schemas"]["SystemSettingsUpdate"];
-            };
-        };
+        requestBody?: never;
         responses: {
-            /** @description Successful Response */
+            /** @description CSV export of the filtered audit trail. */
             200: {
                 headers: {
                     [name: string]: unknown;
                 };
                 content: {
-                    "application/json": components["schemas"]["SystemSettingsOut"];
+                    "text/csv": string;
                 };
             };
             /** @description Validation Error */
@@ -4456,7 +5396,7 @@ export interface operations {
             };
         };
     };
-    admin_stats_api_admin_stats_get: {
+    list_connectors_admin_api_admin_llm_connectors_get: {
         parameters: {
             query?: never;
             header?: never;
@@ -4471,23 +5411,25 @@ export interface operations {
                     [name: string]: unknown;
                 };
                 content: {
-                    "application/json": components["schemas"]["SystemStats"];
+                    "application/json": components["schemas"]["AdminConnectorOut"][];
                 };
             };
         };
     };
-    admin_list_users_api_admin_users_get: {
+    set_connector_cap_admin_api_admin_llm_connectors__connector_id__cap_patch: {
         parameters: {
-            query?: {
-                page?: number;
-                limit?: number;
-                role?: string | null;
-            };
+            query?: never;
             header?: never;
-            path?: never;
+            path: {
+                connector_id: number;
+            };
             cookie?: never;
         };
-        requestBody?: never;
+        requestBody: {
+            content: {
+                "application/json": components["schemas"]["AdminConnectorCapPatch"];
+            };
+        };
         responses: {
             /** @description Successful Response */
             200: {
@@ -4495,7 +5437,7 @@ export interface operations {
                     [name: string]: unknown;
                 };
                 content: {
-                    "application/json": components["schemas"]["PaginatedResponse"];
+                    "application/json": components["schemas"]["AdminConnectorOut"];
                 };
             };
             /** @description Validation Error */
@@ -4509,26 +5451,24 @@ export interface operations {
             };
         };
     };
-    admin_create_user_api_admin_users_post: {
+    revoke_connector_admin_api_admin_llm_connectors__connector_id__revoke_post: {
         parameters: {
             query?: never;
             header?: never;
-            path?: never;
-            cookie?: never;
-        };
-        requestBody: {
-            content: {
-                "application/json": components["schemas"]["AdminUserCreate"];
+            path: {
+                connector_id: number;
             };
+            cookie?: never;
         };
+        requestBody?: never;
         responses: {
             /** @description Successful Response */
-            201: {
+            200: {
                 headers: {
                     [name: string]: unknown;
                 };
                 content: {
-                    "application/json": components["schemas"]["AdminUserOut"];
+                    "application/json": components["schemas"]["AdminConnectorOut"];
                 };
             };
             /** @description Validation Error */
@@ -4542,40 +5482,263 @@ export interface operations {
             };
         };
     };
-    admin_delete_user_api_admin_users__user_id__delete: {
+    get_policy_api_admin_llm_policy_get: {
         parameters: {
             query?: never;
             header?: never;
-            path: {
-                user_id: number;
-            };
+            path?: never;
             cookie?: never;
         };
         requestBody?: never;
         responses: {
             /** @description Successful Response */
-            204: {
-                headers: {
-                    [name: string]: unknown;
-                };
-                content?: never;
-            };
-            /** @description Validation Error */
-            422: {
+            200: {
                 headers: {
                     [name: string]: unknown;
                 };
                 content: {
-                    "application/json": components["schemas"]["HTTPValidationError"];
+                    "application/json": components["schemas"]["AdminPolicyOut"];
                 };
             };
         };
     };
-    admin_update_user_api_admin_users__user_id__patch: {
+    patch_policy_api_admin_llm_policy_patch: {
         parameters: {
             query?: never;
             header?: never;
-            path: {
+            path?: never;
+            cookie?: never;
+        };
+        requestBody: {
+            content: {
+                "application/json": components["schemas"]["AdminPolicyPatch"];
+            };
+        };
+        responses: {
+            /** @description Successful Response */
+            200: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["AdminPolicyOut"];
+                };
+            };
+            /** @description Validation Error */
+            422: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["HTTPValidationError"];
+                };
+            };
+        };
+    };
+    get_usage_api_admin_llm_usage_get: {
+        parameters: {
+            query?: {
+                days?: number;
+            };
+            header?: never;
+            path?: never;
+            cookie?: never;
+        };
+        requestBody?: never;
+        responses: {
+            /** @description Successful Response */
+            200: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["AdminUsageOut"];
+                };
+            };
+            /** @description Validation Error */
+            422: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["HTTPValidationError"];
+                };
+            };
+        };
+    };
+    admin_get_settings_api_admin_settings_get: {
+        parameters: {
+            query?: never;
+            header?: never;
+            path?: never;
+            cookie?: never;
+        };
+        requestBody?: never;
+        responses: {
+            /** @description Successful Response */
+            200: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["SystemSettingsOut"];
+                };
+            };
+        };
+    };
+    admin_update_settings_api_admin_settings_patch: {
+        parameters: {
+            query?: never;
+            header?: never;
+            path?: never;
+            cookie?: never;
+        };
+        requestBody: {
+            content: {
+                "application/json": components["schemas"]["SystemSettingsUpdate"];
+            };
+        };
+        responses: {
+            /** @description Successful Response */
+            200: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["SystemSettingsOut"];
+                };
+            };
+            /** @description Validation Error */
+            422: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["HTTPValidationError"];
+                };
+            };
+        };
+    };
+    admin_stats_api_admin_stats_get: {
+        parameters: {
+            query?: never;
+            header?: never;
+            path?: never;
+            cookie?: never;
+        };
+        requestBody?: never;
+        responses: {
+            /** @description Successful Response */
+            200: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["SystemStats"];
+                };
+            };
+        };
+    };
+    admin_list_users_api_admin_users_get: {
+        parameters: {
+            query?: {
+                page?: number;
+                limit?: number;
+                role?: string | null;
+            };
+            header?: never;
+            path?: never;
+            cookie?: never;
+        };
+        requestBody?: never;
+        responses: {
+            /** @description Successful Response */
+            200: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["PaginatedResponse"];
+                };
+            };
+            /** @description Validation Error */
+            422: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["HTTPValidationError"];
+                };
+            };
+        };
+    };
+    admin_create_user_api_admin_users_post: {
+        parameters: {
+            query?: never;
+            header?: never;
+            path?: never;
+            cookie?: never;
+        };
+        requestBody: {
+            content: {
+                "application/json": components["schemas"]["AdminUserCreate"];
+            };
+        };
+        responses: {
+            /** @description Successful Response */
+            201: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["AdminUserOut"];
+                };
+            };
+            /** @description Validation Error */
+            422: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["HTTPValidationError"];
+                };
+            };
+        };
+    };
+    admin_delete_user_api_admin_users__user_id__delete: {
+        parameters: {
+            query?: never;
+            header?: never;
+            path: {
+                user_id: number;
+            };
+            cookie?: never;
+        };
+        requestBody?: never;
+        responses: {
+            /** @description Successful Response */
+            204: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content?: never;
+            };
+            /** @description Validation Error */
+            422: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["HTTPValidationError"];
+                };
+            };
+        };
+    };
+    admin_update_user_api_admin_users__user_id__patch: {
+        parameters: {
+            query?: never;
+            header?: never;
+            path: {
                 user_id: number;
             };
             cookie?: never;
@@ -6168,7 +7331,461 @@ export interface operations {
                     [name: string]: unknown;
                 };
                 content: {
-                    "application/json": components["schemas"]["AcceptAllResponse"];
+                    "application/json": components["schemas"]["AcceptAllResponse"];
+                };
+            };
+            /** @description Validation Error */
+            422: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["HTTPValidationError"];
+                };
+            };
+        };
+    };
+    bulk_delete_requests_endpoint_api_events__code__requests_bulk_delete: {
+        parameters: {
+            query?: {
+                status?: string | null;
+            };
+            header?: never;
+            path: {
+                code: string;
+            };
+            cookie?: never;
+        };
+        requestBody?: never;
+        responses: {
+            /** @description Successful Response */
+            200: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["BulkActionResponse"];
+                };
+            };
+            /** @description Validation Error */
+            422: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["HTTPValidationError"];
+                };
+            };
+        };
+    };
+    reject_all_requests_endpoint_api_events__code__requests_reject_all_post: {
+        parameters: {
+            query?: never;
+            header?: never;
+            path: {
+                code: string;
+            };
+            cookie?: never;
+        };
+        requestBody?: never;
+        responses: {
+            /** @description Successful Response */
+            200: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["BulkActionResponse"];
+                };
+            };
+            /** @description Validation Error */
+            422: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["HTTPValidationError"];
+                };
+            };
+        };
+    };
+    event_search_api_events__code__search_get: {
+        parameters: {
+            query: {
+                q: string;
+            };
+            header?: never;
+            path: {
+                code: string;
+            };
+            cookie?: never;
+        };
+        requestBody?: never;
+        responses: {
+            /** @description Successful Response */
+            200: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["SearchResult"][];
+                };
+            };
+            /** @description Validation Error */
+            422: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["HTTPValidationError"];
+                };
+            };
+        };
+    };
+    unarchive_event_endpoint_api_events__code__unarchive_post: {
+        parameters: {
+            query?: never;
+            header?: never;
+            path: {
+                code: string;
+            };
+            cookie?: never;
+        };
+        requestBody?: never;
+        responses: {
+            /** @description Successful Response */
+            200: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["EventOut"];
+                };
+            };
+            /** @description Validation Error */
+            422: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["HTTPValidationError"];
+                };
+            };
+        };
+    };
+    api_health_check_api_health_get: {
+        parameters: {
+            query?: never;
+            header?: never;
+            path?: never;
+            cookie?: never;
+        };
+        requestBody?: never;
+        responses: {
+            /** @description Successful Response */
+            200: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": unknown;
+                };
+            };
+        };
+    };
+    list_my_kiosks_api_kiosk_mine_get: {
+        parameters: {
+            query?: never;
+            header?: never;
+            path?: never;
+            cookie?: never;
+        };
+        requestBody?: never;
+        responses: {
+            /** @description Successful Response */
+            200: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["KioskOut"][];
+                };
+            };
+        };
+    };
+    complete_kiosk_pairing_api_kiosk_pair__pair_code__complete_post: {
+        parameters: {
+            query?: never;
+            header?: never;
+            path: {
+                pair_code: string;
+            };
+            cookie?: never;
+        };
+        requestBody: {
+            content: {
+                "application/json": components["schemas"]["KioskCompletePairingRequest"];
+            };
+        };
+        responses: {
+            /** @description Successful Response */
+            200: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["KioskOut"];
+                };
+            };
+            /** @description Validation Error */
+            422: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["HTTPValidationError"];
+                };
+            };
+        };
+    };
+    delete_kiosk_endpoint_api_kiosk__kiosk_id__delete: {
+        parameters: {
+            query?: never;
+            header?: never;
+            path: {
+                kiosk_id: number;
+            };
+            cookie?: never;
+        };
+        requestBody?: never;
+        responses: {
+            /** @description Successful Response */
+            204: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content?: never;
+            };
+            /** @description Validation Error */
+            422: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["HTTPValidationError"];
+                };
+            };
+        };
+    };
+    rename_kiosk_endpoint_api_kiosk__kiosk_id__patch: {
+        parameters: {
+            query?: never;
+            header?: never;
+            path: {
+                kiosk_id: number;
+            };
+            cookie?: never;
+        };
+        requestBody: {
+            content: {
+                "application/json": components["schemas"]["KioskRenameRequest"];
+            };
+        };
+        responses: {
+            /** @description Successful Response */
+            200: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["KioskOut"];
+                };
+            };
+            /** @description Validation Error */
+            422: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["HTTPValidationError"];
+                };
+            };
+        };
+    };
+    assign_kiosk_api_kiosk__kiosk_id__assign_patch: {
+        parameters: {
+            query?: never;
+            header?: never;
+            path: {
+                kiosk_id: number;
+            };
+            cookie?: never;
+        };
+        requestBody: {
+            content: {
+                "application/json": components["schemas"]["KioskAssignRequest"];
+            };
+        };
+        responses: {
+            /** @description Successful Response */
+            200: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["KioskOut"];
+                };
+            };
+            /** @description Validation Error */
+            422: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["HTTPValidationError"];
+                };
+            };
+        };
+    };
+    list_connectors_api_llm_connectors_get: {
+        parameters: {
+            query?: never;
+            header?: never;
+            path?: never;
+            cookie?: never;
+        };
+        requestBody?: never;
+        responses: {
+            /** @description Successful Response */
+            200: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["ConnectorOut"][];
+                };
+            };
+        };
+    };
+    create_connector_endpoint_api_llm_connectors_post: {
+        parameters: {
+            query?: never;
+            header?: never;
+            path?: never;
+            cookie?: never;
+        };
+        requestBody: {
+            content: {
+                "application/json": components["schemas"]["ConnectorCreate"];
+            };
+        };
+        responses: {
+            /** @description Successful Response */
+            201: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["ConnectorOut"];
+                };
+            };
+            /** @description Validation Error */
+            422: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["HTTPValidationError"];
+                };
+            };
+        };
+    };
+    delete_connector_endpoint_api_llm_connectors__connector_id__delete: {
+        parameters: {
+            query?: never;
+            header?: never;
+            path: {
+                connector_id: number;
+            };
+            cookie?: never;
+        };
+        requestBody?: never;
+        responses: {
+            /** @description Successful Response */
+            204: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content?: never;
+            };
+            /** @description Validation Error */
+            422: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["HTTPValidationError"];
+                };
+            };
+        };
+    };
+    update_connector_metadata_api_llm_connectors__connector_id__patch: {
+        parameters: {
+            query?: never;
+            header?: never;
+            path: {
+                connector_id: number;
+            };
+            cookie?: never;
+        };
+        requestBody: {
+            content: {
+                "application/json": components["schemas"]["ConnectorPatch"];
+            };
+        };
+        responses: {
+            /** @description Successful Response */
+            200: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["ConnectorOut"];
+                };
+            };
+            /** @description Validation Error */
+            422: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["HTTPValidationError"];
+                };
+            };
+        };
+    };
+    rotate_connector_credentials_api_llm_connectors__connector_id__credentials_put: {
+        parameters: {
+            query?: never;
+            header?: never;
+            path: {
+                connector_id: number;
+            };
+            cookie?: never;
+        };
+        requestBody: {
+            content: {
+                "application/json": components["schemas"]["ConnectorCredentialsRotate"];
+            };
+        };
+        responses: {
+            /** @description Successful Response */
+            200: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["ConnectorOut"];
                 };
             };
             /** @description Validation Error */
@@ -6182,14 +7799,12 @@ export interface operations {
             };
         };
     };
-    bulk_delete_requests_endpoint_api_events__code__requests_bulk_delete: {
+    set_connector_as_default_api_llm_connectors__connector_id__default_post: {
         parameters: {
-            query?: {
-                status?: string | null;
-            };
+            query?: never;
             header?: never;
             path: {
-                code: string;
+                connector_id: number;
             };
             cookie?: never;
         };
@@ -6201,8 +7816,22 @@ export interface operations {
                     [name: string]: unknown;
                 };
                 content: {
-                    "application/json": components["schemas"]["BulkActionResponse"];
+                    "application/json": components["schemas"]["ConnectorOut"];
+                };
+            };
+            /** @description Connector cannot be set as default (e.g. disabled or auth_invalid). */
+            400: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content?: never;
+            };
+            /** @description Connector not found for current user. */
+            404: {
+                headers: {
+                    [name: string]: unknown;
                 };
+                content?: never;
             };
             /** @description Validation Error */
             422: {
@@ -6215,12 +7844,12 @@ export interface operations {
             };
         };
     };
-    reject_all_requests_endpoint_api_events__code__requests_reject_all_post: {
+    unset_connector_as_default_api_llm_connectors__connector_id__default_delete: {
         parameters: {
             query?: never;
             header?: never;
             path: {
-                code: string;
+                connector_id: number;
             };
             cookie?: never;
         };
@@ -6232,8 +7861,15 @@ export interface operations {
                     [name: string]: unknown;
                 };
                 content: {
-                    "application/json": components["schemas"]["BulkActionResponse"];
+                    "application/json": components["schemas"]["ConnectorOut"];
+                };
+            };
+            /** @description Connector not found for current user. */
+            404: {
+                headers: {
+                    [name: string]: unknown;
                 };
+                content?: never;
             };
             /** @description Validation Error */
             422: {
@@ -6246,14 +7882,12 @@ export interface operations {
             };
         };
     };
-    event_search_api_events__code__search_get: {
+    stream_test_connector_api_llm_connectors__connector_id__stream_test_post: {
         parameters: {
-            query: {
-                q: string;
-            };
+            query?: never;
             header?: never;
             path: {
-                code: string;
+                connector_id: number;
             };
             cookie?: never;
         };
@@ -6265,7 +7899,7 @@ export interface operations {
                     [name: string]: unknown;
                 };
                 content: {
-                    "application/json": components["schemas"]["SearchResult"][];
+                    "application/json": unknown;
                 };
             };
             /** @description Validation Error */
@@ -6279,12 +7913,12 @@ export interface operations {
             };
         };
     };
-    unarchive_event_endpoint_api_events__code__unarchive_post: {
+    test_connector_api_llm_connectors__connector_id__test_post: {
         parameters: {
             query?: never;
             header?: never;
             path: {
-                code: string;
+                connector_id: number;
             };
             cookie?: never;
         };
@@ -6296,7 +7930,7 @@ export interface operations {
                     [name: string]: unknown;
                 };
                 content: {
-                    "application/json": components["schemas"]["EventOut"];
+                    "application/json": components["schemas"]["ConnectorTestResult"];
                 };
             };
             /** @description Validation Error */
@@ -6310,7 +7944,7 @@ export interface operations {
             };
         };
     };
-    api_health_check_api_health_get: {
+    list_feature_preferences_api_llm_feature_preferences_get: {
         parameters: {
             query?: never;
             header?: never;
@@ -6325,19 +7959,23 @@ export interface operations {
                     [name: string]: unknown;
                 };
                 content: {
-                    "application/json": unknown;
+                    "application/json": components["schemas"]["FeaturePreferencesListOut"];
                 };
             };
         };
     };
-    list_my_kiosks_api_kiosk_mine_get: {
+    set_feature_preference_endpoint_api_llm_feature_preferences_post: {
         parameters: {
             query?: never;
             header?: never;
             path?: never;
             cookie?: never;
         };
-        requestBody?: never;
+        requestBody: {
+            content: {
+                "application/json": components["schemas"]["FeaturePreferenceSet"];
+            };
+        };
         responses: {
             /** @description Successful Response */
             200: {
@@ -6345,34 +7983,22 @@ export interface operations {
                     [name: string]: unknown;
                 };
                 content: {
-                    "application/json": components["schemas"]["KioskOut"][];
+                    "application/json": components["schemas"]["FeaturePreferencesListOut"];
                 };
             };
-        };
-    };
-    complete_kiosk_pairing_api_kiosk_pair__pair_code__complete_post: {
-        parameters: {
-            query?: never;
-            header?: never;
-            path: {
-                pair_code: string;
-            };
-            cookie?: never;
-        };
-        requestBody: {
-            content: {
-                "application/json": components["schemas"]["KioskCompletePairingRequest"];
-            };
-        };
-        responses: {
-            /** @description Successful Response */
-            200: {
+            /** @description Connector is not active and cannot be pinned. */
+            400: {
                 headers: {
                     [name: string]: unknown;
                 };
-                content: {
-                    "application/json": components["schemas"]["KioskOut"];
+                content?: never;
+            };
+            /** @description Connector not found for current user. */
+            404: {
+                headers: {
+                    [name: string]: unknown;
                 };
+                content?: never;
             };
             /** @description Validation Error */
             422: {
@@ -6385,23 +8011,25 @@ export interface operations {
             };
         };
     };
-    delete_kiosk_endpoint_api_kiosk__kiosk_id__delete: {
+    clear_feature_preference_endpoint_api_llm_feature_preferences__feature__delete: {
         parameters: {
             query?: never;
             header?: never;
             path: {
-                kiosk_id: number;
+                feature: "recommendation" | "set_builder";
             };
             cookie?: never;
         };
         requestBody?: never;
         responses: {
             /** @description Successful Response */
-            204: {
+            200: {
                 headers: {
                     [name: string]: unknown;
                 };
-                content?: never;
+                content: {
+                    "application/json": components["schemas"]["FeaturePreferencesListOut"];
+                };
             };
             /** @description Validation Error */
             422: {
@@ -6414,20 +8042,14 @@ export interface operations {
             };
         };
     };
-    rename_kiosk_endpoint_api_kiosk__kiosk_id__patch: {
+    list_openrouter_models_api_llm_openrouter_models_get: {
         parameters: {
             query?: never;
             header?: never;
-            path: {
-                kiosk_id: number;
-            };
+            path?: never;
             cookie?: never;
         };
-        requestBody: {
-            content: {
-                "application/json": components["schemas"]["KioskRenameRequest"];
-            };
-        };
+        requestBody?: never;
         responses: {
             /** @description Successful Response */
             200: {
@@ -6435,34 +8057,19 @@ export interface operations {
                     [name: string]: unknown;
                 };
                 content: {
-                    "application/json": components["schemas"]["KioskOut"];
-                };
-            };
-            /** @description Validation Error */
-            422: {
-                headers: {
-                    [name: string]: unknown;
-                };
-                content: {
-                    "application/json": components["schemas"]["HTTPValidationError"];
+                    "application/json": components["schemas"]["AIModelsResponse"];
                 };
             };
         };
     };
-    assign_kiosk_api_kiosk__kiosk_id__assign_patch: {
+    get_dj_policy_api_llm_policy_get: {
         parameters: {
             query?: never;
             header?: never;
-            path: {
-                kiosk_id: number;
-            };
+            path?: never;
             cookie?: never;
         };
-        requestBody: {
-            content: {
-                "application/json": components["schemas"]["KioskAssignRequest"];
-            };
-        };
+        requestBody?: never;
         responses: {
             /** @description Successful Response */
             200: {
@@ -6470,17 +8077,22 @@ export interface operations {
                     [name: string]: unknown;
                 };
                 content: {
-                    "application/json": components["schemas"]["KioskOut"];
+                    "application/json": components["schemas"]["DjPolicyOut"];
                 };
             };
-            /** @description Validation Error */
-            422: {
+            /** @description Not authenticated (missing or invalid bearer token). */
+            401: {
                 headers: {
                     [name: string]: unknown;
                 };
-                content: {
-                    "application/json": components["schemas"]["HTTPValidationError"];
+                content?: never;
+            };
+            /** @description Authenticated but not an active DJ (e.g. pending approval). */
+            403: {
+                headers: {
+                    [name: string]: unknown;
                 };
+                content?: never;
             };
         };
     };
@@ -7617,6 +9229,154 @@ export interface operations {
             };
         };
     };
+    list_sets_api_setbuilder_sets_get: {
+        parameters: {
+            query?: never;
+            header?: never;
+            path?: never;
+            cookie?: never;
+        };
+        requestBody?: never;
+        responses: {
+            /** @description Successful Response */
+            200: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["SetSummary"][];
+                };
+            };
+        };
+    };
+    create_set_api_setbuilder_sets_post: {
+        parameters: {
+            query?: never;
+            header?: never;
+            path?: never;
+            cookie?: never;
+        };
+        requestBody: {
+            content: {
+                "application/json": components["schemas"]["SetCreate"];
+            };
+        };
+        responses: {
+            /** @description Successful Response */
+            201: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["SetDetail"];
+                };
+            };
+            /** @description Validation Error */
+            422: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["HTTPValidationError"];
+                };
+            };
+        };
+    };
+    get_set_api_setbuilder_sets__set_id__get: {
+        parameters: {
+            query?: never;
+            header?: never;
+            path: {
+                set_id: number;
+            };
+            cookie?: never;
+        };
+        requestBody?: never;
+        responses: {
+            /** @description Successful Response */
+            200: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["SetDetail"];
+                };
+            };
+            /** @description Validation Error */
+            422: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["HTTPValidationError"];
+                };
+            };
+        };
+    };
+    delete_set_api_setbuilder_sets__set_id__delete: {
+        parameters: {
+            query?: never;
+            header?: never;
+            path: {
+                set_id: number;
+            };
+            cookie?: never;
+        };
+        requestBody?: never;
+        responses: {
+            /** @description Successful Response */
+            204: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content?: never;
+            };
+            /** @description Validation Error */
+            422: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["HTTPValidationError"];
+                };
+            };
+        };
+    };
+    rename_set_api_setbuilder_sets__set_id__patch: {
+        parameters: {
+            query?: never;
+            header?: never;
+            path: {
+                set_id: number;
+            };
+            cookie?: never;
+        };
+        requestBody: {
+            content: {
+                "application/json": components["schemas"]["SetRename"];
+            };
+        };
+        responses: {
+            /** @description Successful Response */
+            200: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["SetDetail"];
+                };
+            };
+            /** @description Validation Error */
+            422: {
+                headers: {
+                    [name: string]: unknown;
+                };
+                content: {
+                    "application/json": components["schemas"]["HTTPValidationError"];
+                };
+            };
+        };
+    };
     cancel_auth_api_tidal_auth_cancel_post: {
         parameters: {
             query?: never;
diff --git a/dashboard/lib/api-types.ts b/dashboard/lib/api-types.ts
index c177b05b..c132e30a 100644
--- a/dashboard/lib/api-types.ts
+++ b/dashboard/lib/api-types.ts
@@ -52,6 +52,32 @@ export type AIModelInfo = Schemas['AIModelInfo'];
 export type AIModelsResponse = Schemas['AIModelsResponse'];
 export type AISettings = Schemas['AISettingsOut'];
 export type AISettingsUpdate = Schemas['AISettingsUpdate'];
+
+// LLM gateway (issue #329)
+export type LlmConnector = Schemas['ConnectorOut'];
+export type LlmAdminConnector = Schemas['AdminConnectorOut'];
+export type LlmConnectorCreate = Schemas['ConnectorCreate'];
+export type LlmConnectorPatch = Schemas['ConnectorPatch'];
+export type LlmConnectorCredentialsRotate = Schemas['ConnectorCredentialsRotate'];
+export type LlmConnectorTestResult = Schemas['ConnectorTestResult'];
+export type LlmAdminPolicy = Schemas['AdminPolicyOut'];
+export type LlmAdminPolicyPatch = Schemas['AdminPolicyPatch'];
+// Monthly token cap (issue #339)
+export type LlmAdminConnectorCapPatch = Schemas['AdminConnectorCapPatch'];
+export type LlmDjPolicy = Schemas['DjPolicyOut'];
+export type LlmAdminUsage = Schemas['AdminUsageOut'];
+export type LlmUsageRow = Schemas['UsageRow'];
+// LLM audit trail (issue #341)
+export type LlmAdminAudit = Schemas['AdminAuditOut'];
+export type LlmAuditRow = Schemas['AuditEventRow'];
+// Per-feature connector preference (issue #337)
+export type LlmFeaturePreference = Schemas['FeaturePreferenceOut'];
+export type LlmFeaturePreferences = Schemas['FeaturePreferencesListOut'];
+export type LlmFeaturePreferenceSet = Schemas['FeaturePreferenceSet'];
+export type LlmFeatureKey = Schemas['FeaturePreferenceOut']['feature'];
+// Derive from schema so backend enum changes propagate to TS automatically.
+export type LlmConnectorType = Schemas['ConnectorOut']['connector_type'];
+export type LlmConnectorStatus = Schemas['ConnectorOut']['status'];
 export type ActivityLogEntry = Schemas['ActivityLogEntry'];
 export type CapabilityStatus = Schemas['CapabilityStatus'];
 export type ServiceCapabilities = Schemas['ServiceCapabilities'];
diff --git a/dashboard/lib/api.ts b/dashboard/lib/api.ts
index 6c4f7d3e..8db9635f 100644
--- a/dashboard/lib/api.ts
+++ b/dashboard/lib/api.ts
@@ -5,6 +5,20 @@ import type {
   AISettings,
   AISettingsUpdate,
   ActivityLogEntry,
+  LlmAdminAudit,
+  LlmAdminConnector,
+  LlmAdminPolicy,
+  LlmAdminPolicyPatch,
+  LlmAdminUsage,
+  LlmConnector,
+  LlmConnectorCreate,
+  LlmConnectorCredentialsRotate,
+  LlmConnectorPatch,
+  LlmConnectorTestResult,
+  LlmDjPolicy,
+  LlmFeatureKey,
+  LlmFeaturePreferences,
+  LlmFeaturePreferenceSet,
   ArchivedEvent,
   BeatportEventSettings,
   BeatportSearchResult,
@@ -52,6 +66,25 @@ export type {
   AIModelsResponse,
   AISettings,
   AISettingsUpdate,
+  LlmAdminAudit,
+  LlmAdminConnector,
+  LlmAdminPolicy,
+  LlmAdminPolicyPatch,
+  LlmAdminUsage,
+  LlmAuditRow,
+  LlmConnector,
+  LlmConnectorCreate,
+  LlmConnectorCredentialsRotate,
+  LlmConnectorPatch,
+  LlmConnectorStatus,
+  LlmConnectorTestResult,
+  LlmConnectorType,
+  LlmDjPolicy,
+  LlmFeatureKey,
+  LlmFeaturePreference,
+  LlmFeaturePreferences,
+  LlmFeaturePreferenceSet,
+  LlmUsageRow,
   ArchivedEvent,
   BeatportEventSettings,
   BeatportSearchResult,
@@ -103,6 +136,17 @@ export type {
   VoteResponse,
 } from './api-types';
 
+// ========== Admin LLM audit trail filters (issue #341) ==========
+
+export interface AdminLlmAuditFilters {
+  event_type?: string;
+  actor_user_id?: number;
+  target_connector_id?: number;
+  days?: number;
+  limit?: number;
+  offset?: number;
+}
+
 // ========== Pre-Event Collection Types ==========
 
 export interface CollectEventPreview {
@@ -231,6 +275,26 @@ export class HumanVerificationRequiredError extends ApiError {
   }
 }
 
+/**
+ * One incremental chunk of a streamed LLM response (mirrors the backend
+ * `ChatResponseChunk`). Non-final chunks carry `text_delta` and/or
+ * `tool_call_deltas`; the final chunk has `done: true` plus `stop_reason` and
+ * (when reported) `usage`. Hand-written client type — SSE chunks are not part of
+ * the REST OpenAPI schema.
+ */
+export interface LlmStreamChunk {
+  text_delta?: string;
+  tool_call_deltas?: Array<{
+    index: number;
+    id?: string | null;
+    name?: string | null;
+    input_json_fragment?: string;
+  }>;
+  stop_reason?: 'end_turn' | 'tool_use' | 'max_tokens' | 'error' | null;
+  usage?: { prompt: number; completion: number } | null;
+  done?: boolean;
+}
+
 /**
  * Wrap a guest-public fetch in 403-human-verification-required retry logic.
  * Caller passes a `reverify` async function that re-runs the Turnstile
@@ -1173,6 +1237,244 @@ class ApiClient {
     });
   }
 
+  // ========== LLM connectors (per-DJ) ==========
+
+  async listLlmConnectors(): Promise<LlmConnector[]> {
+    return this.fetch('/api/llm/connectors');
+  }
+
+  // DJ-readable connector policy (non-sensitive subset). The settings/ai page
+  // uses this to fail closed — hiding connector types the admin disabled —
+  // instead of falling back to "all types allowed" on the admin-only endpoint.
+  async getLlmPolicy(): Promise<LlmDjPolicy> {
+    return this.fetch('/api/llm/policy');
+  }
+
+  async listOpenRouterModels(): Promise<AIModelsResponse> {
+    return this.fetch('/api/llm/openrouter/models');
+  }
+
+  async createLlmConnector(data: LlmConnectorCreate): Promise<LlmConnector> {
+    return this.fetch('/api/llm/connectors', {
+      method: 'POST',
+      body: JSON.stringify(data),
+    });
+  }
+
+  async updateLlmConnector(id: number, data: LlmConnectorPatch): Promise<LlmConnector> {
+    return this.fetch(`/api/llm/connectors/${id}`, {
+      method: 'PATCH',
+      body: JSON.stringify(data),
+    });
+  }
+
+  async rotateLlmConnectorCredentials(
+    id: number,
+    data: LlmConnectorCredentialsRotate,
+  ): Promise<LlmConnector> {
+    return this.fetch(`/api/llm/connectors/${id}/credentials`, {
+      method: 'PUT',
+      body: JSON.stringify(data),
+    });
+  }
+
+  async testLlmConnector(id: number): Promise<LlmConnectorTestResult> {
+    return this.fetch(`/api/llm/connectors/${id}/test`, { method: 'POST' });
+  }
+
+  /**
+   * Stream a short health-check sentence through a connector via SSE.
+   *
+   * Uses fetch + ReadableStream rather than EventSource because EventSource
+   * cannot send the Authorization header this authenticated endpoint requires.
+   * Pass an AbortSignal to cancel — aborting closes the connection, which the
+   * backend treats as a client disconnect and cancels the upstream provider
+   * request. `onChunk` is invoked for every parsed SSE data frame.
+   */
+  async streamConnectorTest(
+    id: number,
+    onChunk: (chunk: LlmStreamChunk) => void,
+    signal?: AbortSignal,
+  ): Promise<void> {
+    const headers = new Headers({ Accept: 'text/event-stream' });
+    if (this.token) headers.set('Authorization', `Bearer ${this.token}`);
+
+    const response = await fetch(`${getApiUrl()}/api/llm/connectors/${id}/stream-test`, {
+      method: 'POST',
+      headers,
+      signal,
+    });
+    if (!response.ok || !response.body) {
+      if (response.status === 401 && this.onUnauthorized) this.onUnauthorized();
+      throw new ApiError('Stream test failed', response.status);
+    }
+
+    const reader = response.body.getReader();
+    const decoder = new TextDecoder();
+    let buffer = '';
+    // SSE frames are separated by a blank line. The spec allows LF (`\n\n`) or
+    // CRLF (`\r\n\r\n`) terminators, so match either — a CRLF-emitting server or
+    // proxy must not leave frames (including `event: error`) unparsed.
+    const frameBoundary = /\r?\n\r?\n/;
+    try {
+      for (;;) {
+        const { done, value } = await reader.read();
+        if (done) break;
+        buffer += decoder.decode(value, { stream: true });
+        let sep: number;
+        while ((sep = buffer.search(frameBoundary)) !== -1) {
+          const frame = buffer.slice(0, sep);
+          const boundary = buffer.slice(sep).match(frameBoundary)?.[0] ?? '\n\n';
+          buffer = buffer.slice(sep + boundary.length);
+          // A frame may carry an `event:` name plus one or more `data:` lines.
+          // The backend emits `event: error` for typed gateway failures, so we
+          // must inspect the event type — not just blindly parse `data:`.
+          let eventType = 'message';
+          const dataLines: string[] = [];
+          for (const line of frame.split(/\r?\n/)) {
+            if (line.startsWith('event:')) {
+              eventType = line.slice('event:'.length).trim();
+            } else if (line.startsWith('data:')) {
+              dataLines.push(line.slice('data:'.length).trim());
+            }
+          }
+          const data = dataLines.join('\n').trim();
+          if (!data || data === '[DONE]') continue;
+
+          if (eventType === 'error') {
+            // Surface the sanitised backend error code as a thrown failure
+            // rather than passing it through as an inert chunk.
+            let code: string | undefined;
+            try {
+              code = (JSON.parse(data) as { code?: string }).code;
+            } catch {
+              code = undefined;
+            }
+            throw new ApiError(`Stream test failed${code ? `: ${code}` : ''}`, 500);
+          }
+
+          try {
+            onChunk(JSON.parse(data) as LlmStreamChunk);
+          } catch {
+            // Ignore unparseable keepalive frames.
+          }
+        }
+      }
+    } finally {
+      reader.releaseLock();
+    }
+  }
+
+  async deleteLlmConnector(id: number): Promise<void> {
+    await this.fetch(`/api/llm/connectors/${id}`, { method: 'DELETE' });
+  }
+
+  // Pin / unpin a connector as the DJ's explicit default (issue #336). When
+  // pinned, the gateway routes through this connector regardless of which one
+  // is most-recently-used.
+  async setLlmConnectorDefault(id: number): Promise<LlmConnector> {
+    return this.fetch(`/api/llm/connectors/${id}/default`, { method: 'POST' });
+  }
+
+  async unsetLlmConnectorDefault(id: number): Promise<LlmConnector> {
+    return this.fetch(`/api/llm/connectors/${id}/default`, { method: 'DELETE' });
+  }
+
+  // ========== Per-feature connector preferences (issue #337) ==========
+
+  async listLlmFeaturePreferences(): Promise<LlmFeaturePreferences> {
+    return this.fetch('/api/llm/feature-preferences');
+  }
+
+  async setLlmFeaturePreference(data: LlmFeaturePreferenceSet): Promise<LlmFeaturePreferences> {
+    return this.fetch('/api/llm/feature-preferences', {
+      method: 'POST',
+      body: JSON.stringify(data),
+    });
+  }
+
+  async clearLlmFeaturePreference(feature: LlmFeatureKey): Promise<LlmFeaturePreferences> {
+    return this.fetch(`/api/llm/feature-preferences/${feature}`, {
+      method: 'DELETE',
+    });
+  }
+
+  // ========== Admin LLM policy + oversight ==========
+
+  async getAdminLlmPolicy(): Promise<LlmAdminPolicy> {
+    return this.fetch('/api/admin/llm/policy');
+  }
+
+  async updateAdminLlmPolicy(data: LlmAdminPolicyPatch): Promise<LlmAdminPolicy> {
+    return this.fetch('/api/admin/llm/policy', {
+      method: 'PATCH',
+      body: JSON.stringify(data),
+    });
+  }
+
+  async listAllLlmConnectors(): Promise<LlmAdminConnector[]> {
+    return this.fetch('/api/admin/llm/connectors');
+  }
+
+  async revokeAdminLlmConnector(id: number): Promise<LlmAdminConnector> {
+    return this.fetch(`/api/admin/llm/connectors/${id}/revoke`, { method: 'POST' });
+  }
+
+  async getAdminLlmUsage(days = 30): Promise<LlmAdminUsage> {
+    return this.fetch(`/api/admin/llm/usage?days=${days}`);
+  }
+
+  /**
+   * Set or clear a connector's monthly token cap (admin-only, issue #339).
+   * Pass `null` to clear the cap (unlimited).
+   */
+  async setAdminLlmConnectorCap(
+    id: number,
+    monthlyTokenCap: number | null,
+  ): Promise<LlmAdminConnector> {
+    return this.fetch(`/api/admin/llm/connectors/${id}/cap`, {
+      method: 'PATCH',
+      body: JSON.stringify({ monthly_token_cap: monthlyTokenCap }),
+    });
+  }
+
+  // ========== Admin LLM audit trail (issue #341) ==========
+
+  private buildAuditQuery(filters: AdminLlmAuditFilters = {}): URLSearchParams {
+    const params = new URLSearchParams();
+    if (filters.event_type) params.set('event_type', filters.event_type);
+    if (filters.actor_user_id != null) {
+      params.set('actor_user_id', String(filters.actor_user_id));
+    }
+    if (filters.target_connector_id != null) {
+      params.set('target_connector_id', String(filters.target_connector_id));
+    }
+    if (filters.days != null) params.set('days', String(filters.days));
+    if (filters.limit != null) params.set('limit', String(filters.limit));
+    if (filters.offset != null) params.set('offset', String(filters.offset));
+    return params;
+  }
+
+  async getAdminLlmAudit(filters: AdminLlmAuditFilters = {}): Promise<LlmAdminAudit> {
+    const params = this.buildAuditQuery(filters);
+    return this.fetch(`/api/admin/llm/audit?${params.toString()}`);
+  }
+
+  /**
+   * Download the (filtered) audit trail as a CSV Blob. Pagination params are
+   * ignored server-side for the export — it honors only the filter fields.
+   */
+  async downloadAdminLlmAuditCsv(filters: AdminLlmAuditFilters = {}): Promise<Blob> {
+    const params = this.buildAuditQuery({
+      event_type: filters.event_type,
+      actor_user_id: filters.actor_user_id,
+      target_connector_id: filters.target_connector_id,
+      days: filters.days,
+    });
+    const response = await this.rawFetch(`/api/admin/llm/audit.csv?${params.toString()}`);
+    return response.blob();
+  }
+
   // ========== Kiosk Pairing ==========
 
   async getKioskPairChallenge(): Promise<{ nonce: string; expires_in: number }> {
diff --git a/dashboard/next.config.js b/dashboard/next.config.js
index 44585cf6..185e530c 100644
--- a/dashboard/next.config.js
+++ b/dashboard/next.config.js
@@ -15,6 +15,13 @@ const csp = [
 const nextConfig = {
   output: 'standalone',
   allowedDevOrigins: ['192.168.*.*'],
+  async redirects() {
+    return [
+      // DJ AI connector/model settings moved into the account page (#357).
+      // Keep old bookmarks/links working with a permanent (308) redirect.
+      { source: '/settings/ai', destination: '/account', permanent: true },
+    ];
+  },
   async headers() {
     return [
       {
diff --git a/docs/LLM-PLUGIN.md b/docs/LLM-PLUGIN.md
new file mode 100644
index 00000000..6d03f304
--- /dev/null
+++ b/docs/LLM-PLUGIN.md
@@ -0,0 +1,323 @@
+# LLM Adapter Plug-in Guide
+
+The WrzDJ backend dispatches every LLM call through the **LLM Gateway**, which
+selects a connector for the calling user and routes the request through a
+provider-specific **adapter**. The set of adapters is open: forks and
+third-party deployments can add new providers without modifying any file
+under `server/app/services/llm/`.
+
+This document is the contract that third-party plug-ins write against.
+
+> Companion guide: [`docs/PLUGIN-ARCHITECTURE.md`](PLUGIN-ARCHITECTURE.md)
+> describes the bridge-side equipment plug-in system. The LLM plug-in surface
+> follows the same shape: a small ABC, a registry, and a strict typed-error
+> contract.
+
+## Architecture Overview
+
+```text
+Caller (recommendation engine, agentic feature)
+        │
+        ▼
+Gateway.dispatch(db, actor, request, *, purpose)
+        │   1. Resolve LlmConnector (per-DJ MRU → org default)
+        │   2. registry.get_adapter_class(connector_type)
+        │   3. adapter = cls(connector); await adapter.chat(request)
+        │   4. Log call + handle fallback policy
+        ▼
+LlmAdapter (your plug-in)
+        │   1. Parse connector.credentials (encrypted JSON blob)
+        │   2. Translate ChatRequest → provider-native request
+        │   3. Translate provider response → ChatResponse
+        │   4. Map provider errors → typed LlmError subclasses
+        ▼
+Provider HTTP endpoint / SDK
+```
+
+| Layer | File | Responsibility |
+|-------|------|----------------|
+| Adapter | `app/services/llm/adapters/*.py` (built-in) <br> `LLM_PLUGIN_DIR/*.py` (third-party) | Convert between canonical and provider-native shapes; map errors |
+| Registry | `app/services/llm/registry.py` | `connector_type` → adapter class lookup |
+| Tool translation | `app/services/llm/tool_translation.py` | JSON-Schema `ToolSpec` ↔ provider tool/function shape |
+| Gateway | `app/services/llm/gateway.py` | Resolve connector, call adapter, log, handle fallback |
+| Models | `app/models/llm_connector.py` | `LlmConnector` row (encrypted credentials), call log, audit log |
+| Exceptions | `app/services/llm/exceptions.py` | Typed error hierarchy adapters must raise |
+
+The connector row stores credentials as **encrypted JSON** via the
+`EncryptedText` SQLAlchemy column type — accessing
+`connector.credentials` returns the decrypted plaintext blob. Your adapter is
+responsible for parsing that blob.
+
+## The `LlmAdapter` ABC
+
+Defined in [`app/services/llm/base.py`](../server/app/services/llm/base.py).
+
+```python
+class LlmAdapter(ABC):
+    connector_type: str = ""  # set on the subclass — registry key
+
+    def __init__(self, connector) -> None:
+        self.connector = connector
+
+    @abstractmethod
+    async def chat(self, request: ChatRequest) -> ChatResponse: ...
+
+    @abstractmethod
+    async def health_check(self) -> None: ...
+```
+
+### Required Class Attribute: `connector_type`
+
+A short, lowercase, snake-case string. The DB column that stores it is 40
+characters; pick something unique and stable (e.g. `mistral_apikey`,
+`groq_apikey`, `local_vllm`). The registry **refuses to bind the same
+`connector_type` to two different classes** — that prevents silent shadowing
+of built-in adapters.
+
+### Required Method: `chat()`
+
+| Property | Contract |
+|----------|----------|
+| Coroutine | Yes — `async def`. The gateway always awaits. |
+| Input | A canonical `ChatRequest`. |
+| Output | A canonical `ChatResponse`. |
+| Errors | One of the typed `LlmError` subclasses (see below). Never a raw HTTP / SDK exception. |
+| Side effects | None other than the upstream network call. Do **not** mutate the connector row. |
+| Logging | Do not log full prompts, completions, or any credential material. |
+
+### Required Method: `health_check()`
+
+Validate the credential against the provider. The gateway calls this from the
+admin "Test connector" path. Returns `None` on success; raises the same typed
+exceptions as `chat()` on failure.
+
+Pattern: issue the cheapest possible call (e.g. `max_tokens=1`). The shared
+helper `build_healthcheck_request()` in
+`app/services/llm/adapters/_httpx_openai.py` is reusable for OpenAI-shaped
+endpoints.
+
+## Canonical Types
+
+Defined in [`app/services/llm/base.py`](../server/app/services/llm/base.py).
+These are **stable** Pydantic models — fields may be added in a minor release
+but never renamed or removed without a major-version bump.
+
+### `ChatRequest`
+
+| Field | Type | Notes |
+|-------|------|-------|
+| `messages` | `list[Message]` | Required. `role ∈ {"system", "user", "assistant", "tool"}`. Tool messages carry `tool_call_id`. |
+| `tools` | `list[ToolSpec] \| None` | JSON-Schema shape. Translate via `tool_translation.to_*_tools()`. |
+| `force_tool` | `str \| None` | Forces a specific tool name; raise `ToolTranslationError` if not in `tools`. |
+| `max_tokens` | `int \| None` | Adapters supply a default if `None`. |
+| `temperature` | `float \| None` | Pass through verbatim when not `None`. |
+| `model` | `str \| None` | Overrides `connector.model_hint`. |
+| `timeout_seconds` | `float \| None` | Adapters MAY clamp to a max. |
+| `system` | `str \| None` | Provider-native system prompt. Map to the right surface (OpenAI: first system message; Anthropic: top-level `system`). |
+| `fallback_policy` | `Literal["none", "org_default", "retry_then_org_default"]` | Handled by the gateway, not the adapter. Ignore. |
+
+### `ChatResponse`
+
+| Field | Type | Notes |
+|-------|------|-------|
+| `text` | `str` | The textual assistant reply. Empty string if the model only emitted tool calls. |
+| `tool_calls` | `list[ToolCall]` | Empty list when no tools were called. |
+| `stop_reason` | `Literal["end_turn", "tool_use", "max_tokens", "error"]` | Required. Map from the provider's native stop reason. |
+| `usage` | `TokenUsage \| None` | Counts only — never prompt content. Optional. |
+| `model` | `str \| None` | Provider-reported model id (for telemetry). Recommended. |
+
+### `ToolSpec`, `ToolCall`, `Message`
+
+See the source. `ToolSpec.input_schema` is a JSON-Schema dict;
+`tool_translation.py` knows how to translate it for OpenAI / Anthropic /
+Bedrock and parse the response back into canonical `ToolCall` objects.
+Reuse those helpers rather than reimplementing them per adapter.
+
+## Exception Contract
+
+Defined in [`app/services/llm/exceptions.py`](../server/app/services/llm/exceptions.py).
+Every error from the adapter must be one of these. The gateway translates
+them into telemetry, audit events, and HTTP response codes; raw provider
+errors **must not** reach the caller (they often contain bearer tokens in
+error messages — a credential-leak vector).
+
+| Exception | When to raise | Status hint |
+|-----------|---------------|-------------|
+| `AuthInvalid` | Credentials are malformed, missing, or rejected (`401`/`403`). Includes "failed to parse the credential JSON". | Marks connector `status="auth_invalid"`; writes audit event. |
+| `RateLimited(retry_after_seconds=...)` | Provider returned `429`. Pass through `Retry-After` if present. | Gateway logs and surfaces as `429` to the caller. |
+| `QuotaExceeded` | Billing failure (`402`) or provider-specific quota error. | Logged, surfaced as `402` to caller. |
+| `ProviderUnavailable` | `5xx`, network failure, timeout, generic SDK error. | Logged, surfaced as `502`. Eligible for fallback. |
+| `ToolTranslationError` | Unable to translate input tools or parse the response. | Logged, surfaced as `502`. **Not** a fallback trigger. |
+| `NoLlmConfigured` | **Gateway-only.** Adapters should not raise this. | – |
+
+### Mapping example (OpenAI HTTP shape)
+
+```python
+status = response.status_code
+if status in (401, 403):
+    raise AuthInvalid(f"Auth failed (HTTP {status})")
+if status == 402:
+    raise QuotaExceeded("Quota or billing failure")
+if status == 429:
+    retry = response.headers.get("retry-after")
+    raise RateLimited("Rate limited", retry_after_seconds=int(float(retry)) if retry else None)
+if 500 <= status < 600:
+    raise ProviderUnavailable(f"Upstream error (HTTP {status})")
+# 4xx other than the above → almost certainly a translation problem.
+raise ToolTranslationError(f"Upstream rejected request (HTTP {status})")
+```
+
+## Tool Translation
+
+The canonical `ToolSpec` is JSON-Schema. Adapters should delegate to
+[`app/services/llm/tool_translation.py`](../server/app/services/llm/tool_translation.py)
+rather than re-implementing the conversion. The module exposes:
+
+| Helper | Direction |
+|--------|-----------|
+| `to_openai_tools(tools, force)` | Canonical → OpenAI `tools` + `tool_choice` |
+| `parse_openai_response(payload)` | OpenAI body → `ChatResponse` |
+| `to_anthropic_tools(tools, force)` | Canonical → Anthropic `tools` + `tool_choice` |
+| `parse_anthropic_response(message)` | Anthropic SDK message → `ChatResponse` |
+| `to_bedrock_tools(tools, force)` | Canonical → Bedrock Converse `toolConfig` |
+| `parse_bedrock_response(payload)` | Bedrock body → `ChatResponse` |
+
+Adding a new translation pair for a provider whose tool shape genuinely
+differs is allowed — open a PR adding helpers under the same naming
+convention. Until then, do not silently re-shape tools inside your adapter.
+
+## Registration
+
+Register the adapter as the **last statement** of your module:
+
+```python
+register_adapter(MyAdapter.connector_type, MyAdapter)
+```
+
+That call:
+
+- Validates the class subclasses `LlmAdapter`.
+- Rejects empty `connector_type`.
+- Rejects double-binding (a different class trying to take an already-bound
+  key — surfaced as `ValueError` at startup).
+
+Re-registering the *same* class is a no-op (safe for test re-imports).
+
+## Loading Third-Party Plug-ins
+
+There are two supported mechanisms:
+
+1. **Import from your own code.** Add the file to your fork of the backend
+   and ensure it gets imported at startup (e.g. add it to the
+   `app/services/llm/registry.py::_bootstrap` block, or import it from
+   `app/main.py`). This is the recommended path for forks.
+
+2. **`LLM_PLUGIN_DIR` env var.** Set the environment variable to a directory
+   path. At startup the loader
+   ([`app/services/llm/plugin_loader.py`](../server/app/services/llm/plugin_loader.py))
+   imports every `*.py` file in that directory (non-recursive; files starting
+   with `_` are skipped). Each plug-in is responsible for calling
+   `register_adapter()` on import. A broken plug-in is logged with a full
+   stack trace and skipped — it does **not** prevent the rest of the directory
+   or the backend itself from starting.
+
+### Security posture for `LLM_PLUGIN_DIR`
+
+Loading a plug-in grants it the **full privileges of the backend process**.
+There is no sandbox; this is the same trust boundary as `pip install`.
+Operators must:
+
+- Treat the plug-in directory as a privileged path. Only the backend's
+  service account should have write access to it.
+- Audit every plug-in's source the same way they would audit a third-party
+  Python dependency.
+- Never set `LLM_PLUGIN_DIR` to a world-writable or multi-tenant path.
+
+In production we recommend leaving `LLM_PLUGIN_DIR` unset and packaging
+trusted plug-ins as ordinary Python modules. The env-var loader exists to
+make local experimentation and forks ergonomic.
+
+## Stable vs Internal API
+
+The plug-in surface is **the surface listed in this document**. Everything
+else under `app/services/llm/` is internal — including helper modules,
+private functions, and adapter base-class internals not enumerated above.
+
+| Surface | Stability |
+|---------|-----------|
+| `LlmAdapter` ABC method signatures (`chat`, `health_check`, `connector_type`) | **Stable.** Breaking change → major version bump. |
+| `ChatRequest`, `ChatResponse`, `Message`, `ToolSpec`, `ToolCall`, `TokenUsage` field names + types | **Stable.** Field additions in minor versions; never renames/removals without a major bump. |
+| Exception types and their constructor signatures | **Stable.** |
+| `register_adapter`, `get_adapter_class`, `list_connector_types`, `is_registered` | **Stable.** |
+| `tool_translation.to_*_tools` / `parse_*_response` | **Stable** for the providers documented above. |
+| `_httpx_openai`, `url_validator`, `connector_storage` | **Internal.** Reuse at your own risk; may change without notice. |
+| `gateway.dispatch` internals (fallback, logging, audit) | **Internal.** Callers must use the public `Gateway.dispatch` entrypoint. |
+| `LlmConnector` ORM model | **Internal.** Adapters touch only `connector.credentials`, `connector.model_hint`, and `connector.base_url_plain`. |
+
+Schema changes to the `LlmConnector` storage shape (encrypted JSON blob keys)
+are versioned by `connector_type`. Each provider chooses its own blob keys
+in its own migration; the only invariant is that **the blob is a JSON object**.
+
+## Test Matrix
+
+Every registered adapter — built-in or third-party — must pass the
+parametrised contract tests in
+[`server/tests/test_llm_adapter_contract.py`](../server/tests/test_llm_adapter_contract.py).
+The contract covers:
+
+1. The class subclasses `LlmAdapter`.
+2. `connector_type` is non-empty and matches the registration key.
+3. `chat` and `health_check` are async callables.
+4. The constructor accepts a connector row without raising.
+5. `chat()` raises `AuthInvalid` (or another `LlmError`) for malformed
+   credential blobs — never a raw `JSONDecodeError`, `KeyError`, or HTTP
+   exception.
+6. The registry returns classes (not instances) and raises `KeyError` on
+   unknown lookups.
+
+Adapter-specific HTTP and parsing behaviour belongs in a separate test file
+(see the built-in adapters' tests in `test_llm_adapters.py` for the pattern).
+
+Run the contract test against your adapter:
+
+```bash
+cd server
+.venv/bin/pytest tests/test_llm_adapter_contract.py
+```
+
+If a contract test fails on your adapter, **fix the adapter** — do not
+modify the contract. The contract is what lets the gateway dispatch
+generically.
+
+## Reference Skeleton
+
+The minimum working adapter lives at
+[`docs/examples/echo_adapter.py`](examples/echo_adapter.py). It is exercised
+by `test_skeleton_echo_adapter_*` in the contract test file, so any change
+that breaks the documented surface fails CI immediately.
+
+## Adding a Plug-in in 5 Minutes
+
+```bash
+# 1. Copy the skeleton.
+cp docs/examples/echo_adapter.py /opt/wrzdj/llm_plugins/mistral_apikey.py
+
+# 2. Edit it:
+#    - Change `connector_type` to a unique value (e.g. "mistral_apikey").
+#    - Replace the echo body with your provider call.
+#    - Map provider errors to the typed exceptions.
+
+# 3. Point the backend at the plug-in directory.
+export LLM_PLUGIN_DIR=/opt/wrzdj/llm_plugins
+uvicorn app.main:app
+
+# 4. Verify the registry sees it.
+python -c "from app.services.llm.registry import list_connector_types; print(list_connector_types())"
+
+# 5. Run the contract tests.
+cd server && .venv/bin/pytest tests/test_llm_adapter_contract.py
+```
+
+Once your adapter is registered, DJs can create a connector row via
+`POST /api/llm/connectors` with `connector_type="mistral_apikey"` and the
+gateway will route their requests through your adapter automatically.
diff --git a/docs/examples/echo_adapter.py b/docs/examples/echo_adapter.py
new file mode 100644
index 00000000..40930948
--- /dev/null
+++ b/docs/examples/echo_adapter.py
@@ -0,0 +1,174 @@
+"""Echo adapter — minimal reference implementation of ``LlmAdapter``.
+
+This skeleton is the canonical "blank slate" for third-party LLM provider
+plug-ins. It implements the full :class:`~app.services.llm.base.LlmAdapter`
+contract without making any network calls — every request is echoed back as
+the assistant message body.
+
+Usage in tests::
+
+    # Self-test against the contract — no production import.
+    from docs.examples import echo_adapter  # noqa: F401  (side-effect: register)
+    from app.services.llm.registry import get_adapter_class
+
+    cls = get_adapter_class("echo")
+    response = await cls(connector).chat(request)
+
+Usage in production (third-party plug-ins)::
+
+    # 1. Copy this file under any module path you control.
+    # 2. Customize ``connector_type`` and the body of ``chat()``.
+    # 3. Either:
+    #    a) drop the .py file into the directory pointed to by ``LLM_PLUGIN_DIR``,
+    #       or
+    #    b) import the module from your own bootstrap code at startup.
+    # 4. The :func:`register_adapter` call at the bottom binds the class to the
+    #    registry the moment the module is imported.
+
+See ``docs/LLM-PLUGIN.md`` for the full extension contract.
+
+Security note: this skeleton intentionally does not validate or sanitise the
+input it echoes. Real adapters must:
+- Treat ``connector.credentials`` as untrusted (the encrypted blob can be
+  malformed; raise :class:`AuthInvalid` rather than letting :class:`json.JSONDecodeError`
+  bubble up).
+- Translate upstream HTTP/SDK errors into the typed exception hierarchy
+  (``AuthInvalid`` / ``RateLimited`` / ``QuotaExceeded`` / ``ProviderUnavailable``
+  / ``ToolTranslationError``). Raw provider errors must not reach the caller.
+- Never log secrets, full prompts, or completion bodies (the gateway only
+  logs counts).
+"""
+
+from __future__ import annotations
+
+import json
+import logging
+from typing import Any
+
+from app.services.llm.base import (
+    ChatRequest,
+    ChatResponse,
+    ContentBlock,
+    LlmAdapter,
+    Message,
+    TokenUsage,
+)
+from app.services.llm.exceptions import AuthInvalid
+from app.services.llm.registry import register_adapter
+
+logger = logging.getLogger(__name__)
+
+
+class EchoAdapter(LlmAdapter):
+    """An adapter that echoes the last user message back as the assistant reply.
+
+    Useful for:
+    - Wiring tests for the gateway / connector storage layer end-to-end
+      without depending on a live provider.
+    - Showing third-party plug-in authors the minimum required surface.
+    """
+
+    # The registry key for this adapter. Plug-in authors must change this to a
+    # unique string before publishing — the registry refuses to register two
+    # different classes under the same ``connector_type``.
+    connector_type = "echo"
+
+    # ------------------------------------------------------------------
+    # Credential handling
+    # ------------------------------------------------------------------
+    def _read_credentials(self) -> dict[str, Any]:
+        """Parse the encrypted credential blob, raising AuthInvalid on failure.
+
+        The :class:`~app.models.llm_connector.LlmConnector` row stores
+        credentials as an encrypted JSON string. Accessing ``self.connector.credentials``
+        triggers decryption transparently via the ``EncryptedText`` column
+        type. After that, parsing is the adapter's responsibility — and every
+        failure mode here must surface as :class:`AuthInvalid` so the gateway
+        can mark the connector and emit a clean audit event.
+        """
+        raw = self.connector.credentials or ""
+        try:
+            blob = json.loads(raw)
+        except (json.JSONDecodeError, TypeError) as exc:
+            raise AuthInvalid("Connector credentials are malformed") from exc
+        if not isinstance(blob, dict):
+            raise AuthInvalid("Connector credentials shape is invalid")
+        return blob
+
+    # ------------------------------------------------------------------
+    # LlmAdapter — required methods
+    # ------------------------------------------------------------------
+    async def chat(self, request: ChatRequest) -> ChatResponse:
+        """Echo the most recent user message back as the assistant reply.
+
+        Real adapters should:
+        - Translate ``request.messages`` to the provider's native message shape.
+        - Call ``to_<provider>_tools(request.tools, request.force_tool)`` from
+          ``app.services.llm.tool_translation`` to translate tools.
+        - Call ``parse_<provider>_response(...)`` from that same module to
+          translate the response back to ``ChatResponse``.
+        - Map provider HTTP / SDK errors to the typed exception hierarchy.
+        """
+        # We deliberately read credentials before doing any echoing — that way
+        # this skeleton exercises the same boundary (malformed creds raise
+        # AuthInvalid) that real adapters depend on.
+        self._read_credentials()
+
+        last_user = next(
+            (m for m in reversed(request.messages) if m.role == "user"),
+            None,
+        )
+        if last_user is None:
+            text = ""
+        else:
+            text = _flatten_message_text(last_user)
+
+        return ChatResponse(
+            text=text,
+            tool_calls=[],
+            stop_reason="end_turn",
+            usage=TokenUsage(prompt=len(text.split()), completion=len(text.split())),
+            # Surface the resolved model name (request override → connector hint
+            # → adapter default) so call logs and recommendation telemetry stay
+            # accurate. Real adapters should set this to the *provider-reported*
+            # model id from the response payload, not the requested model.
+            model=request.model or self.connector.model_hint or "echo-1",
+        )
+
+    async def health_check(self) -> None:
+        """Validate the credential without exercising the (nonexistent) provider.
+
+        Real adapters should issue a cheap, low-token call (e.g. ``max_tokens=1``)
+        and raise the same typed exceptions as :meth:`chat`.
+        """
+        # No provider to ping — the credential parse step is enough proof that
+        # the connector is wired correctly.
+        self._read_credentials()
+
+
+def _flatten_message_text(msg: Message) -> str:
+    """Collapse a possibly-multi-block message to plain text.
+
+    Real provider adapters typically keep the block structure; this skeleton
+    flattens because a string return matches the simplest possible echo.
+    """
+    content = msg.content
+    if isinstance(content, str):
+        return content
+    parts: list[str] = []
+    for block in content:
+        if isinstance(block, ContentBlock):
+            parts.append(block.text)
+        elif isinstance(block, dict):
+            parts.append(block.get("text") or "")
+    return "".join(parts)
+
+
+# The registry call here is what makes the skeleton "live" — importing this
+# module registers the adapter under the ``connector_type`` declared above.
+#
+# Third-party plug-ins follow the same pattern. The registry refuses to bind
+# the same ``connector_type`` to two different classes, so plug-in authors
+# must pick a unique value (the ``LlmConnector.connector_type`` column is 40
+# chars; keep it short, lowercase, snake-case, e.g. ``mistral_apikey``).
+register_adapter(EchoAdapter.connector_type, EchoAdapter)
diff --git a/docs/superpowers/plans/2026-05-25-llm-audit-trail-admin-ui.md b/docs/superpowers/plans/2026-05-25-llm-audit-trail-admin-ui.md
new file mode 100644
index 00000000..51474357
--- /dev/null
+++ b/docs/superpowers/plans/2026-05-25-llm-audit-trail-admin-ui.md
@@ -0,0 +1,62 @@
+# LLM Audit-Trail Admin UI (#341) Implementation Plan
+
+> **For agentic workers:** Steps use checkbox (`- [ ]`) syntax for tracking. TDD throughout.
+
+**Goal:** Add an admin-only browse/filter/export UI for the existing `llm_audit_event` table on the `/admin/ai` page.
+
+**Architecture:** New read-only backend endpoints on `admin_llm.py` (`GET /api/admin/llm/audit` paginated JSON + `GET /api/admin/llm/audit.csv` streaming CSV), both joining actor username + target connector display name (never credentials). New Pydantic schemas. New API-client methods + a new "Audit trail" card section on the existing `/admin/ai` page (the page uses cards as sections — no tab component exists).
+
+**Tech Stack:** FastAPI, SQLAlchemy 2.0, slowapi, Pydantic v2, Next.js/React 19 + vanilla CSS, vitest.
+
+**Scope fences:** Edit only `server/app/api/admin_llm.py`, `server/app/schemas/llm.py`, `server/tests/*`, `dashboard/app/admin/ai/page.tsx` (+ `__tests__`), `dashboard/lib/api.ts` (add-only), `dashboard/lib/api-types.ts` (add-only). NO migration. READ-ONLY on `llm_audit_event`.
+
+---
+
+## Task 1: Backend schemas + paginated audit endpoint
+
+**Files:**
+- Modify: `server/app/schemas/llm.py` (add `AuditEventRow`, `AdminAuditOut`)
+- Modify: `server/app/api/admin_llm.py` (add `GET /audit`)
+- Test: `server/tests/test_llm_admin_audit.py`
+
+- [ ] Step 1: Write failing tests covering: basic list (admin), 403 for non-admin, filter by event_type, filter by actor_user_id, filter by target_connector_id, days window, pagination (limit/offset + total), joined actor_username + target_connector_display_name, no credentials leaked.
+- [ ] Step 2: Run → FAIL (404 / no endpoint).
+- [ ] Step 3: Add schemas + endpoint. Query `LlmAuditEvent` left-joined to User (actor) and LlmConnector (target). Filters all optional. `days` default 30, range 1..3650. limit 1..200 default 50, offset >=0. Return rows newest-first + `total`.
+- [ ] Step 4: Run → PASS.
+- [ ] Step 5: Commit.
+
+## Task 2: CSV export endpoint
+
+**Files:**
+- Modify: `server/app/api/admin_llm.py` (add `GET /audit.csv`)
+- Test: `server/tests/test_llm_admin_audit.py`
+
+- [ ] Step 1: Write failing tests: CSV content-type + header row + a data row; honors event_type filter; 403 non-admin; cap rows.
+- [ ] Step 2: Run → FAIL.
+- [ ] Step 3: Implement StreamingResponse with `csv` module; same filter helper as Task 1; cap at 10000 rows. Columns: timestamp, actor, event_type, target_connector, notes (notes column reserved/empty — schema has no notes field; emit blank to honor issue's column list).
+- [ ] Step 4: Run → PASS.
+- [ ] Step 5: Commit.
+
+## Task 3: Frontend API client + types
+
+**Files:**
+- Modify: `dashboard/lib/api-types.ts` (add `LlmAdminAudit`, `LlmAuditRow`)
+- Modify: `dashboard/lib/api.ts` (add `getAdminLlmAudit`, `getAdminLlmAuditCsvUrl`/download helper)
+- Regenerate: `dashboard/lib/api-types.generated.ts` via `npm run types:export && npm run types:generate`
+
+- [ ] Step 1: Regenerate OpenAPI types so new schemas appear.
+- [ ] Step 2: Add manual aliases + client methods.
+- [ ] Step 3: tsc passes.
+- [ ] Step 4: Commit.
+
+## Task 4: Audit trail card on /admin/ai page + tests
+
+**Files:**
+- Modify: `dashboard/app/admin/ai/page.tsx`
+- Test: `dashboard/app/admin/ai/__tests__/page.test.tsx`
+
+- [ ] Step 1: Write failing test: renders "Audit trail" heading + a seeded row; filter inputs present; export button present.
+- [ ] Step 2: Run → FAIL.
+- [ ] Step 3: Implement card: filters (event type select, actor, target connector, days), table (timestamp, actor, event type, connector, notes), pagination (prev/next), CSV export button.
+- [ ] Step 4: Run → PASS. Full frontend CI.
+- [ ] Step 5: Commit.
diff --git a/docs/superpowers/plans/2026-05-26-move-dj-ai-settings-to-account.md b/docs/superpowers/plans/2026-05-26-move-dj-ai-settings-to-account.md
new file mode 100644
index 00000000..72ae4cd0
--- /dev/null
+++ b/docs/superpowers/plans/2026-05-26-move-dj-ai-settings-to-account.md
@@ -0,0 +1,96 @@
+# Move DJ AI connector/model settings into the account page Implementation Plan
+
+> **For agentic workers:** REQUIRED SUB-SKILL: Use superpowers:subagent-driven-development (recommended) or superpowers:executing-plans to implement this plan task-by-task. Steps use checkbox (`- [ ]`) syntax for tracking.
+
+**Goal:** Relocate the DJ-facing AI connector UI (connect/test/rotate/delete, model hint, Hermes onboarding) from `/settings/ai` into the existing `/account` page, redirect the old route, and update tests — keeping the admin `/admin/ai` UI untouched.
+
+**Architecture:** Extract the existing `/settings/ai` page body into a reusable client component `components/AiProvidersSection.tsx`. Render it as a third inline card section inside `/account`. Delete the old `/settings/ai` route and add a server-side redirect in `next.config.js` so bookmarks 308 to `/account`. Preserve fail-closed policy behavior verbatim (it moves with the component).
+
+**Tech Stack:** Next.js 16 (App Router), React 19, TypeScript (strict), vanilla CSS + inline styles, Vitest + Testing Library.
+
+---
+
+### Task 1: Extract AI providers UI into a reusable component
+
+**Files:**
+- Create: `dashboard/components/AiProvidersSection.tsx`
+- Reference (source of logic): `dashboard/app/(dj)/settings/ai/page.tsx`
+
+The component contains ALL connector logic from the current page: policy fetch (`fetchPolicySoft` → `getLlmPolicy`), `allowedTypes` fail-closed memo, connectors list, create form (all provider types incl. bedrock/azure/openai_compatible/openrouter dropdown), test, delete. It must NOT include the page-level `<main>` wrapper, the "← Dashboard" link header, the `useAuth`/`useRouter` auth-redirect (those stay at the page level — `/account` already does the auth gate). It exports a default React component `AiProvidersSection` rendering a `<section>` that begins with an `<h2>AI / Model providers</h2>` and the existing intro paragraph, then "Connected providers" and the add-provider form.
+
+- [ ] **Step 1: Create the component** by moving the body. Keep every form field, label text (e.g. `Provider`, `Display name`, `API key`, `Resource name`, `Bedrock model ID`, `Model (optional)`), the OpenRouter model fetch effect, and the fail-closed `allowedTypes` logic identical so existing test assertions still hold. The top of the rendered output is an intro `<h2>` + `<p>`; the rest is the two `<section>`s. Wrap all of it in a single fragment/section with `style={{ marginTop: '2rem' }}` matching the account-page card rhythm (it will live inside its own card in Task 2, so use a plain wrapper, not a `.card`).
+
+- [ ] **Step 2: Type-check** — `cd dashboard && npx tsc --noEmit`. Expected: PASS.
+
+- [ ] **Step 3: Commit**
+
+```bash
+git add dashboard/components/AiProvidersSection.tsx
+git commit -m "refactor(ai): extract AI providers UI into reusable component"
+```
+
+---
+
+### Task 2: Render the AI section inside /account and delete old route
+
+**Files:**
+- Modify: `dashboard/app/(dj)/account/page.tsx`
+- Modify: `dashboard/next.config.js` (add `redirects()`)
+- Delete: `dashboard/app/(dj)/settings/ai/page.tsx`
+- Delete: `dashboard/app/(dj)/settings/ai/__tests__/page.test.tsx` (logic re-tested via component in Task 3)
+- Delete dir if empty: `dashboard/app/(dj)/settings/`
+
+- [ ] **Step 1: Import and render** `AiProvidersSection` in `/account`. Add a third card `<div>` (same wrapper style as Change Email card: `{ background: 'var(--card)', borderRadius: '0.75rem', padding: '1.5rem', marginTop: '1.5rem' }`) below Change Email, containing `<AiProvidersSection />`. Widen the page `<main>` maxWidth from `480px` to `720px` so the provider form (which used `720px`) is not cramped.
+
+- [ ] **Step 2: Add redirect** in `next.config.js`:
+
+```js
+async redirects() {
+  return [
+    { source: '/settings/ai', destination: '/account', permanent: true },
+  ];
+},
+```
+
+- [ ] **Step 3: Delete** the old route file, its test, and the now-empty `settings/` dir.
+
+- [ ] **Step 4: Grep** `grep -rn "/settings/ai" dashboard/ --include="*.ts" --include="*.tsx" | grep -v node_modules` → expect no remaining nav/link hits (only possibly api-types doc comments, which are fine).
+
+- [ ] **Step 5: Type-check + lint** — `cd dashboard && npx tsc --noEmit && npm run lint`. Expected: PASS.
+
+- [ ] **Step 6: Commit**
+
+```bash
+git add dashboard/app/\(dj\)/account/page.tsx dashboard/next.config.js
+git add -u dashboard/app/\(dj\)/settings
+git commit -m "feat(ai): move DJ AI settings into account page; redirect old route (#357)"
+```
+
+---
+
+### Task 3: Move/adapt the AI tests to the component + account page
+
+**Files:**
+- Create: `dashboard/components/__tests__/AiProvidersSection.test.tsx` (port the old settings/ai tests, importing the component instead of the page; drop the `next/navigation`/`useAuth` mocks that the page-level no longer needs but keep `next/link` mock if used)
+- Modify: `dashboard/app/(dj)/account/__tests__/page.test.tsx` (add the AI api methods to the `@/lib/api` mock so the section can mount inside the account page without throwing, and assert the AI heading renders)
+
+- [ ] **Step 1: Port connector tests** to `AiProvidersSection.test.tsx` — same assertions (lists connectors, fail-closed hides providers, policy filtering, azure/bedrock/openrouter fields, test, delete). Render `<AiProvidersSection />` directly. Keep `vi.mock('next/link', ...)` if the component still uses `Link` (it should NOT — Link header stays on the page; remove the import). Mock `@/lib/api` methods used: `listLlmConnectors`, `getLlmPolicy`, `createLlmConnector`, `testLlmConnector`, `deleteLlmConnector`, `listOpenRouterModels`, `getAdminLlmPolicy` (for the "reads DJ-scoped not admin" test).
+
+- [ ] **Step 2: Update account page test** — extend the existing `vi.mock('@/lib/api', ...)` to add `listLlmConnectors: () => Promise.resolve([])` and `getLlmPolicy: () => Promise.reject(new Error('x'))` (fail-closed, no extra UI). Add a test: AI heading `AI / Model providers` is in the document.
+
+- [ ] **Step 3: Run frontend tests** — `cd dashboard && npm test -- --run`. Expected: PASS, coverage thresholds met.
+
+- [ ] **Step 4: Commit**
+
+```bash
+git add dashboard/components/__tests__/AiProvidersSection.test.tsx dashboard/app/\(dj\)/account/__tests__/page.test.tsx
+git commit -m "test(ai): relocate AI provider tests to component + account page (#357)"
+```
+
+---
+
+## Self-Review
+
+- Spec coverage: relocate UI (Task 1+2) ✓; update nav/links (Task 2 grep — only the page itself referenced it) ✓; redirect old route (Task 2) ✓; admin /admin/ai untouched (not touched by any task) ✓; tests moved (Task 3) ✓; fail-closed preserved (logic moved verbatim, retested) ✓.
+- Placeholder scan: none.
+- Type consistency: component name `AiProvidersSection` used consistently in Tasks 1–3.
diff --git a/docs/superpowers/plans/2026-05-26-remove-deprecated-anthropic-env-reads.md b/docs/superpowers/plans/2026-05-26-remove-deprecated-anthropic-env-reads.md
new file mode 100644
index 00000000..a09d7160
--- /dev/null
+++ b/docs/superpowers/plans/2026-05-26-remove-deprecated-anthropic-env-reads.md
@@ -0,0 +1,106 @@
+# Remove deprecated ANTHROPIC_API_KEY env-var reads Implementation Plan
+
+> **For agentic workers:** REQUIRED SUB-SKILL: Use superpowers:subagent-driven-development (recommended) or superpowers:executing-plans to implement this plan task-by-task. Steps use checkbox (`- [ ]`) syntax for tracking.
+
+**Goal:** Remove the now-dead legacy `ANTHROPIC_API_KEY` env-var fallback path in the recommendation engine, since the LLM Gateway connector system has been the source of truth for credentials since the MVP.
+
+**Architecture:** Every production caller of `call_llm` / `generate_llm_suggestions` passes `db` + `actor`, so the gateway path always runs and the `_legacy_call` direct-Anthropic fallback (and its `anthropic_api_key` / `anthropic_max_tokens` / `anthropic_timeout_seconds` config reads) is dead code. We delete that fallback, the unused config fields, and refresh the legacy unit test to drive the gateway path instead. We deliberately KEEP `config.anthropic_api_key` and `config.anthropic_model` because the admin AI-settings/model-listing endpoints and the recommendation response `llm_model` default still read them — removing those is a cross-cutting frontend+API-contract change out of scope for this backend cleanup.
+
+**Tech Stack:** Python 3.11+, FastAPI, pydantic-settings, pytest.
+
+---
+
+## Design decisions (scope reconciliation)
+
+The issue's literal grep target is the **uppercase env-var name** `ANTHROPIC_API_KEY`. In non-test code that string appears only in:
+- `server/alembic/versions/046_admin_ai_oauth.py` — historical one-shot data migration. **MUST stay** (allowable exception).
+- `server/app/services/recommendation/llm_hooks.py:78` — a docstring mention of the dead fallback. **Removed** here.
+
+The actual env-var *reads* go through the pydantic-settings attribute `config.anthropic_api_key` (lowercase). Mapping every read:
+
+| Location | What it does | Decision |
+|---|---|---|
+| `llm_client._legacy_call` | direct-Anthropic fallback when `db is None` | **REMOVE** — dead; all callers pass `db` |
+| `llm_client._resolve_max_tokens` | reads `anthropic_max_tokens` for gateway `ChatRequest.max_tokens` | **KEEP the cap, drop the config dependency** — inline the `1024` default |
+| `llm_hooks.is_llm_available` final fallback | `bool(get_settings().anthropic_api_key)` | **REMOVE** — gateway connector check is authoritative |
+| `admin._list_anthropic_models` / `/ai/settings` | live admin observability of the legacy key | **KEEP** — powers admin UI + API contract + frontend tests; out of scope |
+| `events.py:986` | `result.llm_model or get_settings().anthropic_model` display default | **KEEP** — `anthropic_model` is a model-name default, not a credential fallback |
+
+Config fields:
+- `anthropic_max_tokens`, `anthropic_timeout_seconds` → **REMOVE** (only the deleted `_legacy_call` / `_resolve_max_tokens` used them).
+- `anthropic_api_key`, `anthropic_model` → **KEEP** (still read by admin + events display).
+
+---
+
+## File Structure
+
+- `server/app/services/recommendation/llm_client.py` — delete `_legacy_call`, the `AsyncAnthropic` import, the `db is None` branch; inline max-tokens default.
+- `server/app/services/recommendation/llm_hooks.py` — drop the `db is None` env-var fallback and the docstring `ANTHROPIC_API_KEY` mention; tighten `is_llm_available` to require `db`.
+- `server/app/core/config.py` — remove `anthropic_max_tokens`, `anthropic_timeout_seconds`.
+- `server/tests/test_llm_client.py` — replace the `AsyncAnthropic`-patching legacy tests with gateway-path tests.
+- `server/tests/test_llm_hooks.py` — drop the env-var-availability assertions.
+- `.env.example` — drop the deprecated `ANTHROPIC_*` lines (keep nothing that's dead).
+- `CLAUDE.md` — update the Environment section + LLM Gateway note.
+
+---
+
+### Task 1: Remove the dead `_legacy_call` fallback in `llm_client.py`
+
+**Files:**
+- Modify: `server/app/services/recommendation/llm_client.py`
+- Test: `server/tests/test_llm_client.py`
+
+- [ ] **Step 1: Rewrite `TestCallLLM` to drive the gateway path**
+
+Replace the two `AsyncAnthropic`-patching tests with tests that pass a fake `db` and patch `Gateway.dispatch`, asserting the parse + trim behavior.
+
+- [ ] **Step 2: Run to verify they fail** (`call_llm` still has the `db is None` branch / `Gateway` not yet the sole path)
+
+Run: `.venv/bin/pytest tests/test_llm_client.py -q`
+
+- [ ] **Step 3: Edit `llm_client.py`**
+  - Remove `from anthropic import AsyncAnthropic`.
+  - Remove the `if db is None: result = await _legacy_call(...)` branch — make the gateway path unconditional; raise/parse via gateway always.
+  - Delete `_legacy_call`.
+  - Replace `_resolve_max_tokens()` body to return a module constant default (`DEFAULT_MAX_TOKENS = 1024`) instead of `get_settings().anthropic_max_tokens`.
+  - Remove the now-unused `get_settings` import if nothing else uses it.
+
+- [ ] **Step 4: Run tests** — `.venv/bin/pytest tests/test_llm_client.py -q` → PASS
+
+- [ ] **Step 5: Commit**
+
+### Task 2: Tighten `is_llm_available` in `llm_hooks.py`
+
+**Files:**
+- Modify: `server/app/services/recommendation/llm_hooks.py`
+- Test: `server/tests/test_llm_hooks.py`
+
+- [ ] **Step 1: Update `test_llm_hooks.py`** — remove the two assertions that `is_llm_available()` (no db) keys off `anthropic_api_key`; keep/adjust the db-based connector tests. `is_llm_available()` with no db now returns `False`.
+- [ ] **Step 2: Run to verify fail.**
+- [ ] **Step 3: Edit `llm_hooks.py`** — drop the final `bool(get_settings().anthropic_api_key)` fallback (both the `db is not None` tail and the no-db return → `False`); remove the `ANTHROPIC_API_KEY` docstring bullet and the `db is None` env-var sentence in `generate_llm_suggestions`; remove the now-unused `get_settings` import.
+- [ ] **Step 4: Run tests** → PASS.
+- [ ] **Step 5: Commit.**
+
+### Task 3: Remove dead config fields
+
+**Files:**
+- Modify: `server/app/core/config.py`
+
+- [ ] **Step 1: Remove `anthropic_max_tokens` and `anthropic_timeout_seconds`** from the `Settings` class. Keep `anthropic_api_key` and `anthropic_model` (still used by admin + events).
+- [ ] **Step 2: Grep** `grep -rn "anthropic_max_tokens\|anthropic_timeout" server/app` → zero hits.
+- [ ] **Step 3: Commit.**
+
+### Task 4: Docs + env example
+
+**Files:**
+- Modify: `.env.example`, `CLAUDE.md`
+
+- [ ] **Step 1: `.env.example`** — remove the deprecated `ANTHROPIC_API_KEY` / `ANTHROPIC_MODEL` / `ANTHROPIC_MAX_TOKENS` / `ANTHROPIC_TIMEOUT_SECONDS` lines and rewrite the surrounding comment to state credentials are connector-only.
+- [ ] **Step 2: `CLAUDE.md`** — update the Anthropic env-var line in the Environment section and the LLM Gateway note (legacy fallback removed).
+- [ ] **Step 3: Commit.**
+
+### Task 5: Full backend CI + acceptance grep
+
+- [ ] `cd server && .venv/bin/ruff check . && .venv/bin/ruff format --check . && .venv/bin/bandit -r app -c pyproject.toml -q && .venv/bin/pytest --tb=short -q`
+- [ ] `grep -rn "ANTHROPIC_API_KEY" server/ | grep -v /tests/` → only the alembic migration hits remain.
+- [ ] `.venv/bin/alembic upgrade head && .venv/bin/alembic check` (config field removal must not drift).
diff --git a/docs/superpowers/plans/2026-05-26-sse-stream-pooled-db-connection-leak.md b/docs/superpowers/plans/2026-05-26-sse-stream-pooled-db-connection-leak.md
new file mode 100644
index 00000000..aa35419b
--- /dev/null
+++ b/docs/superpowers/plans/2026-05-26-sse-stream-pooled-db-connection-leak.md
@@ -0,0 +1,333 @@
+# Fix SSE Stream Pooled DB Connection Leak Implementation Plan
+
+> **For agentic workers:** REQUIRED SUB-SKILL: Use superpowers:subagent-driven-development (recommended) or superpowers:executing-plans to implement this plan task-by-task. Steps use checkbox (`- [ ]`) syntax for tracking.
+
+**Goal:** Stop the public SSE `event_stream` endpoint from pinning a pooled DB connection for the entire (potentially unbounded) lifetime of an EventSource connection, which exhausts the pool (size 5 + overflow 10 = 15) under modest guest load.
+
+**Architecture:** Remove the `db: Session = Depends(get_db)` request-scoped dependency from `event_stream`. Run the one-shot existence/auth check inside a short-lived `with SessionLocal() as s:` block that is fully closed (connection returned to the pool) BEFORE the `EventSourceResponse` is returned. The async generator currently performs no per-tick DB access, so it opens no session; if future per-tick DB access is needed it must open its own short-lived `SessionLocal()` session. Existence/auth error responses (404 unknown, 410 archived/expired) are preserved exactly.
+
+**Tech Stack:** FastAPI, SQLAlchemy 2.0 (QueuePool), sse-starlette, pytest.
+
+---
+
+### Task 1: Regression test proving idle SSE streams hold ~0 pooled DB connections
+
+**Files:**
+- Test: `server/tests/test_sse_pool.py` (create)
+
+The existing `client`/`db` fixtures override `get_db` with a single shared `StaticPool` SQLite session, so they cannot measure the production `QueuePool`. This test exercises the real `event_stream` endpoint function directly against a real `SessionLocal`-backed engine, asserting the function returns (existence check done) with the pool fully checked back in, and that the returned generator can be opened/closed without checking out a connection.
+
+- [ ] **Step 1: Write the failing test**
+
+```python
+"""Regression test for issue #356 — SSE event_stream must NOT pin a pooled
+DB connection for the lifetime of the stream.
+
+Before the fix, event_stream declared `db: Session = Depends(get_db)`, so
+FastAPI held the session (and its checked-out QueuePool connection) open
+until the request finished — which for an EventSource never happens while
+the browser holds it open. ~15 concurrent guest viewers exhausted the pool.
+
+These tests bypass the conftest StaticPool override and drive a real
+QueuePool engine so engine.pool.checkedout() is meaningful.
+"""
+
+import asyncio
+from datetime import timedelta
+
+import pytest
+from sqlalchemy import create_engine
+from sqlalchemy.orm import sessionmaker
+from starlette.requests import Request as StarletteRequest
+
+from app.core.time import utcnow
+from app.models.base import Base
+from app.models.user import User
+from app.models.event import Event
+from app.services.auth import get_password_hash
+
+
+@pytest.fixture()
+def pooled_engine(monkeypatch):
+    """A real file-backed SQLite engine using QueuePool (default), so
+    engine.pool.checkedout() reflects actual checked-out connections.
+
+    Patches app.db.session.SessionLocal AND the name already imported into
+    app.api.sse so the endpoint resolves our pooled session factory.
+    """
+    import app.db.session as db_session
+    import app.api.sse as sse_module
+
+    engine = create_engine(
+        "sqlite:///file:sse_pool_test?mode=memory&cache=shared&uri=true",
+        pool_size=5,
+        max_overflow=10,
+    )
+    Base.metadata.create_all(bind=engine)
+    TestSession = sessionmaker(autocommit=False, autoflush=False, bind=engine)
+
+    monkeypatch.setattr(db_session, "SessionLocal", TestSession)
+    monkeypatch.setattr(sse_module, "SessionLocal", TestSession, raising=False)
+
+    # Seed an active event using a short-lived session.
+    with TestSession() as s:
+        user = User(
+            username="pooluser",
+            password_hash=get_password_hash("poolpassword123"),
+            role="dj",
+        )
+        s.add(user)
+        s.commit()
+        s.refresh(user)
+        evt = Event(
+            code="POOL01",
+            join_code="POOLJN",
+            name="Pool Event",
+            created_by_user_id=user.id,
+            expires_at=utcnow() + timedelta(hours=6),
+        )
+        s.add(evt)
+        s.commit()
+
+    try:
+        yield engine, TestSession
+    finally:
+        Base.metadata.drop_all(bind=engine)
+        engine.dispose()
+
+
+def _make_request(code: str) -> StarletteRequest:
+    """Minimal ASGI scope for a GET that reports as connected."""
+    scope = {
+        "type": "http",
+        "method": "GET",
+        "path": f"/api/public/events/{code}/stream",
+        "headers": [],
+        "query_string": b"",
+    }
+
+    async def receive():  # pragma: no cover - never drained in these tests
+        return {"type": "http.disconnect"}
+
+    return StarletteRequest(scope, receive)
+
+
+def test_event_stream_returns_with_pool_checked_in(pooled_engine):
+    """After event_stream() returns, the existence-check connection must be
+    back in the pool (checkedout() == 0)."""
+    from app.api.sse import event_stream
+
+    engine, _ = pooled_engine
+    assert engine.pool.checkedout() == 0
+
+    req = _make_request("POOLJN")
+    response = asyncio.run(event_stream(code="POOLJN", request=req))
+
+    # EventSourceResponse created, generator not yet iterated.
+    assert engine.pool.checkedout() == 0
+
+
+def test_n_concurrent_idle_streams_hold_zero_pool_connections(pooled_engine):
+    """N concurrent open (idle) SSE streams must hold ~0 pooled connections.
+
+    Open N generators (past pool_size + max_overflow = 15), prime each one
+    tick so the generator body is actively suspended on queue.get(), then
+    assert the pool has 0 checked-out connections. Before the fix this would
+    be N (one pinned per stream) and would TimeoutError past 15.
+    """
+    from app.api.sse import event_stream
+
+    engine, _ = pooled_engine
+    n = 25  # well past pool capacity (15)
+
+    async def drive():
+        generators = []
+        for _ in range(n):
+            req = _make_request("POOLJN")
+            resp = await event_stream(code="POOLJN", request=req)
+            gen = resp.body_iterator
+            generators.append(gen)
+
+        # Prime each generator one step so it subscribes and suspends on
+        # queue.get(); give the event loop a tick to settle.
+        primer_tasks = [asyncio.ensure_future(g.__anext__()) for g in generators]
+        await asyncio.sleep(0.05)
+
+        checked_out = engine.pool.checkedout()
+
+        # Cancel the primers and close generators to release subscriptions.
+        for t in primer_tasks:
+            t.cancel()
+        for g in generators:
+            await g.aclose()
+
+        return checked_out
+
+    checked_out = asyncio.run(drive())
+    assert checked_out == 0, (
+        f"Expected 0 pooled connections held by {n} idle SSE streams, "
+        f"got {checked_out} — the stream is pinning DB connections."
+    )
+
+
+def test_event_stream_preserves_404_for_unknown_event(pooled_engine):
+    """Existence check must still reject unknown codes with 404."""
+    from fastapi import HTTPException
+
+    from app.api.sse import event_stream
+
+    req = _make_request("NOEXIS")
+    with pytest.raises(HTTPException) as exc:
+        asyncio.run(event_stream(code="NOEXIS", request=req))
+    assert exc.value.status_code == 404
+```
+
+- [ ] **Step 2: Run test to verify it fails**
+
+Run (from `server/`): `.venv/bin/pytest tests/test_sse_pool.py -v`
+Expected: `test_event_stream_returns_with_pool_checked_in` raises `TypeError` because `event_stream` still requires the `db` parameter (FastAPI `Depends` default is not auto-injected when calling the function directly), and/or the pool assertions fail. RED.
+
+- [ ] **Step 3: Implement the fix in `server/app/api/sse.py`**
+
+Remove the `db: Session = Depends(get_db)` parameter. Import `SessionLocal`. Run the existence check in a short-lived session closed before returning.
+
+```python
+"""SSE streaming endpoint for real-time event updates (no authentication required)."""
+
+import asyncio
+import json
+import logging
+from typing import Any
+
+from fastapi import APIRouter, HTTPException, Request
+from sse_starlette.sse import EventSourceResponse
+
+from app.core.rate_limit import limiter
+from app.db.session import SessionLocal
+from app.services.event import EventLookupResult, get_event_by_join_code_with_status
+from app.services.event_bus import get_event_bus
+
+logger = logging.getLogger(__name__)
+router = APIRouter()
+
+DISCONNECT_CHECK_INTERVAL = 15  # seconds
+
+
+async def _event_generator(
+    request: Request,
+    event_code: str,
+) -> Any:
+    """Yield SSE events for a given event code until the client disconnects.
+
+    Keepalive pings are handled by sse-starlette's built-in ping task (every 15s).
+    This generator only yields actual events. The timeout on queue.get() lets us
+    periodically check for client disconnect without blocking forever.
+
+    NOTE (issue #356): this generator deliberately holds NO DB session. If a
+    future change needs per-tick DB access it MUST open its own short-lived
+    `with SessionLocal() as s:` session per tick and close it before awaiting —
+    never hold a pooled connection across the stream lifetime.
+    """
+    bus = get_event_bus()
+    queue = bus.subscribe(event_code)
+    try:
+        while True:
+            if await request.is_disconnected():
+                break
+            try:
+                message = await asyncio.wait_for(queue.get(), timeout=DISCONNECT_CHECK_INTERVAL)
+                yield {
+                    "event": message["event"],
+                    "data": json.dumps(message["data"]),
+                }
+            except TimeoutError:
+                # No event received — loop to check is_disconnected()
+                continue
+    finally:
+        bus.unsubscribe(event_code, queue)
+
+
+@router.get("/events/{code}/stream")
+@limiter.limit("10/minute")
+async def event_stream(
+    code: str,
+    request: Request,
+) -> EventSourceResponse:
+    """Public SSE endpoint for real-time event updates.
+
+    SECURITY (CRIT-5): rate-limited and existence-checked. Before this fix,
+    the endpoint had no rate limit and no existence check, allowing
+    unauthenticated DoS (unlimited long-lived connections exhausting FDs)
+    and passive eavesdropping via 6-char event-code brute force.
+
+    POOL SAFETY (issue #356): the existence/auth check runs in a short-lived
+    session that is closed (its pooled connection returned) BEFORE the
+    EventSourceResponse is returned. An EventSource connection can stay open
+    indefinitely, so we must NOT hold a request-scoped get_db session across
+    the stream lifetime — doing so pinned one pooled connection per open
+    stream and exhausted the QueuePool (size 5 + overflow 10) under guest load.
+
+    Event types:
+    - request_created: New request submitted
+    - request_status_changed: Request status update
+    - now_playing_changed: Now-playing track update
+    - requests_bulk_update: Batch accept/reject
+    - bridge_status_changed: Bridge connect/disconnect
+    """
+    with SessionLocal() as db:
+        event, result = get_event_by_join_code_with_status(db, code)
+        if result == EventLookupResult.NOT_FOUND:
+            raise HTTPException(status_code=404, detail="Event not found")
+        if result == EventLookupResult.ARCHIVED:
+            raise HTTPException(status_code=410, detail="Event has been archived")
+        if result == EventLookupResult.EXPIRED:
+            raise HTTPException(status_code=410, detail="Event has expired")
+        event_code = event.code
+
+    return EventSourceResponse(
+        _event_generator(request, event_code),
+        media_type="text/event-stream",
+        headers={"X-Accel-Buffering": "no"},
+    )
+```
+
+- [ ] **Step 4: Run the new tests to verify they pass**
+
+Run (from `server/`): `.venv/bin/pytest tests/test_sse_pool.py -v`
+Expected: all 3 tests PASS.
+
+- [ ] **Step 5: Run existing SSE security tests to confirm no regression**
+
+Run (from `server/`): `.venv/bin/pytest tests/test_sse_security.py -v`
+Expected: all PASS (404/410 existence checks + rate limit preserved).
+
+- [ ] **Step 6: Full backend CI gate**
+
+Run (from `server/`):
+```bash
+.venv/bin/ruff check .
+.venv/bin/ruff format --check .
+.venv/bin/bandit -r app -c pyproject.toml -q
+.venv/bin/pytest --tb=short -q
+```
+Expected: all green, coverage >= 80%.
+
+- [ ] **Step 7: Commit**
+
+```bash
+git add server/app/api/sse.py server/tests/test_sse_pool.py docs/superpowers/plans/2026-05-26-sse-stream-pooled-db-connection-leak.md
+git commit -m "fix(sse): don't pin a pooled DB connection for the SSE stream lifetime (#356)"
+```
+
+---
+
+## Self-Review
+
+**Spec coverage:**
+- "Open SSE streams no longer hold a pooled DB connection while idle" → fix removes `Depends(get_db)`, uses `with SessionLocal()` closed before returning; `test_n_concurrent_idle_streams_hold_zero_pool_connections` proves it.
+- "A test confirms N concurrent open streams consume ~0 idle pool connections" → `test_n_concurrent_idle_streams_hold_zero_pool_connections` (N=25 > pool capacity 15).
+- "Existence/auth checks preserved" → `test_event_stream_preserves_404_for_unknown_event` + existing `test_sse_security.py`.
+
+**Placeholder scan:** none.
+
+**Type consistency:** `event_stream(code, request)`, `_event_generator(request, event_code)`, `SessionLocal()` — consistent across plan and fix.
diff --git a/docs/superpowers/plans/2026-05-28-llm-cost-quota-caps.md b/docs/superpowers/plans/2026-05-28-llm-cost-quota-caps.md
new file mode 100644
index 00000000..318aaa01
--- /dev/null
+++ b/docs/superpowers/plans/2026-05-28-llm-cost-quota-caps.md
@@ -0,0 +1,1208 @@
+# LLM Cost / Quota Caps per DJ Implementation Plan
+
+> **For agentic workers:** REQUIRED SUB-SKILL: Use superpowers:subagent-driven-development (recommended) or superpowers:executing-plans to implement this plan task-by-task. Steps use checkbox (`- [ ]`) syntax for tracking.
+
+**Goal:** Let admins set a monthly token cap per DJ LLM connector; the gateway refuses calls that would push the current calendar month over the cap with a clear DJ-facing message.
+
+**Architecture:** Add a nullable `monthly_token_cap` integer column to `LlmConnector` (None = unlimited). A direct aggregation query sums `tokens_in + tokens_out` from `llm_call_log` for the current calendar month per connector. The gateway runs a pre-flight check in `dispatch()`: if current month usage already meets/exceeds the cap, raise a new `QuotaCapReached` exception. Admins set caps via a new PATCH endpoint in `admin_llm.py`; the admin UI adds a cap input + usage-vs-cap progress bar per connector row.
+
+**Tech Stack:** FastAPI, SQLAlchemy 2.0, Alembic, Pydantic v2, Next.js 16 / React 19 (vanilla CSS), pytest, vitest.
+
+**Why direct aggregation (not a rollup table):** At current volume (`llm_call_log` has a 30-365 day retention window, per-DJ DJ-initiated recommendation calls — low hundreds/month at most), a single indexed `SUM(...) WHERE created_at >= month_start GROUP BY connector_id` is correct and cheap. `llm_call_log.created_at` is already indexed. A materialized view or hourly cron rollup adds operational complexity (refresh scheduling, staleness windows, an extra table + migration) with no measurable benefit until call volume is orders of magnitude higher. Documented here and in the PR; revisit if usage telemetry shows the aggregation query becoming hot.
+
+---
+
+## File Structure
+
+**Backend:**
+- `server/app/models/llm_connector.py` — add `monthly_token_cap: Mapped[int | None]` column on `LlmConnector`.
+- `server/alembic/versions/050_llm_connector_monthly_token_cap.py` — new migration (down_revision `049`).
+- `server/app/services/llm/exceptions.py` — add `QuotaCapReached(LlmError)`.
+- `server/app/services/llm/connector_storage.py` — add `current_month_token_usage(db, connector_id)` aggregation helper + `set_monthly_cap(connector, cap)` setter with validation.
+- `server/app/services/llm/gateway.py` — add a pre-flight cap check in `dispatch()` before the primary attempt (and before any fallback attempt against a connector with a cap).
+- `server/app/schemas/llm.py` — add `monthly_token_cap` to `ConnectorOut`; add `AdminConnectorCapPatch` request schema; add `current_month_tokens` to `AdminConnectorOut`.
+- `server/app/api/admin_llm.py` — add `PATCH /connectors/{id}/cap` endpoint; populate `current_month_tokens` in the connectors listing.
+- `server/app/api/events.py` — ensure `QuotaCapReached` from the LLM recommendation endpoint surfaces the DJ-facing 429 message instead of the generic 502.
+
+**Frontend:**
+- `dashboard/lib/api-types.generated.ts` — regenerated from backend OpenAPI (do not hand-edit).
+- `dashboard/lib/api.ts` — add `setAdminLlmConnectorCap(id, cap)` method.
+- `dashboard/app/admin/ai/page.tsx` — add cap input + usage-vs-cap progress bar to each per-DJ connector row.
+
+**Tests:**
+- `server/tests/test_llm_quota_cap.py` — new: aggregation helper, gateway pre-flight enforcement, cap setter validation.
+- `server/tests/test_llm_api.py` — extend: admin cap PATCH endpoint (auth, validation, set/clear).
+- `dashboard/app/admin/ai/__tests__/` or inline — cap UI rendering + progress bar (if an existing test harness for the page exists; otherwise add focused component-free logic test).
+
+---
+
+## Task 1: Add `QuotaCapReached` exception
+
+**Files:**
+- Modify: `server/app/services/llm/exceptions.py`
+- Test: `server/tests/test_llm_quota_cap.py`
+
+- [ ] **Step 1: Write the failing test**
+
+Create `server/tests/test_llm_quota_cap.py`:
+
+```python
+"""Tests for per-DJ monthly token caps (issue #339)."""
+
+from __future__ import annotations
+
+from app.services.llm.exceptions import LlmError, QuotaCapReached
+
+
+def test_quota_cap_reached_is_llm_error():
+    exc = QuotaCapReached("cap reached")
+    assert isinstance(exc, LlmError)
+    assert str(exc) == "cap reached"
+```
+
+- [ ] **Step 2: Run test to verify it fails**
+
+Run: `.venv/bin/pytest tests/test_llm_quota_cap.py -v`
+Expected: FAIL — `ImportError: cannot import name 'QuotaCapReached'`
+
+- [ ] **Step 3: Add the exception**
+
+In `server/app/services/llm/exceptions.py`, after the `QuotaExceeded` class:
+
+```python
+class QuotaCapReached(LlmError):
+    """The DJ's admin-set monthly token cap for this connector is reached.
+
+    Distinct from :class:`QuotaExceeded` (a provider-side billing/quota error):
+    this is a WrzDJ-internal pre-flight refusal raised *before* any provider
+    call, so no tokens are spent. The DJ-facing message is fixed and contains
+    no internal details — see the gateway pre-flight check.
+    """
+```
+
+- [ ] **Step 4: Run test to verify it passes**
+
+Run: `.venv/bin/pytest tests/test_llm_quota_cap.py -v`
+Expected: PASS
+
+- [ ] **Step 5: Commit**
+
+```bash
+git add server/app/services/llm/exceptions.py server/tests/test_llm_quota_cap.py
+git commit -m "feat(llm): add QuotaCapReached exception for monthly token caps"
+```
+
+---
+
+## Task 2: Add `monthly_token_cap` column + migration
+
+**Files:**
+- Modify: `server/app/models/llm_connector.py`
+- Create: `server/alembic/versions/050_llm_connector_monthly_token_cap.py`
+- Test: `server/tests/test_llm_quota_cap.py`
+
+- [ ] **Step 1: Write the failing test**
+
+Append to `server/tests/test_llm_quota_cap.py`:
+
+```python
+import json
+
+from app.models.llm_connector import LlmConnector
+from app.models.user import User
+from app.services.auth import get_password_hash
+
+
+def _make_dj(db, username="capdj"):
+    user = User(username=username, password_hash=get_password_hash("password123"), role="dj")
+    db.add(user)
+    db.commit()
+    db.refresh(user)
+    return user
+
+
+def _make_connector(db, user, *, monthly_token_cap=None):
+    row = LlmConnector(
+        user_id=user.id,
+        connector_type="openai_apikey",
+        display_name="Cap connector",
+        status="active",
+        credentials=json.dumps({"api_key": "sk-fake-key"}),
+        model_hint="gpt-5-mini",
+        monthly_token_cap=monthly_token_cap,
+    )
+    db.add(row)
+    db.commit()
+    db.refresh(row)
+    return row
+
+
+def test_connector_defaults_to_no_cap(db):
+    user = _make_dj(db)
+    connector = _make_connector(db, user)
+    assert connector.monthly_token_cap is None
+
+
+def test_connector_stores_cap(db):
+    user = _make_dj(db, username="capdj2")
+    connector = _make_connector(db, user, monthly_token_cap=100_000)
+    db.refresh(connector)
+    assert connector.monthly_token_cap == 100_000
+```
+
+- [ ] **Step 2: Run test to verify it fails**
+
+Run: `.venv/bin/pytest tests/test_llm_quota_cap.py -v`
+Expected: FAIL — `TypeError: 'monthly_token_cap' is an invalid keyword argument for LlmConnector`
+
+- [ ] **Step 3: Add the model column**
+
+In `server/app/models/llm_connector.py`, inside `LlmConnector`, after the `last_health_check_status` column (before `__table_args__`):
+
+```python
+    # Admin-set monthly token cap (issue #339). NULL = unlimited. When set, the
+    # gateway refuses dispatch once the current calendar month's summed
+    # tokens_in + tokens_out for this connector meets or exceeds the cap. The
+    # cap is admin-only (set via /api/admin/llm/connectors/{id}/cap) and is
+    # checked PRE-FLIGHT only — editing it never disrupts an in-flight call.
+    monthly_token_cap: Mapped[int | None] = mapped_column(Integer, nullable=True)
+```
+
+- [ ] **Step 4: Create the migration**
+
+Create `server/alembic/versions/050_llm_connector_monthly_token_cap.py`:
+
+```python
+"""Add monthly_token_cap to llm_connectors (issue #339).
+
+Revision ID: 050
+Revises: 049
+Create Date: 2026-05-28
+
+Adds an admin-set per-DJ monthly token cap to ``llm_connectors``:
+
+- ``monthly_token_cap`` (Integer, nullable) — NULL means unlimited. When set,
+  the LLM gateway refuses dispatch once the current calendar month's summed
+  ``tokens_in + tokens_out`` for the connector meets or exceeds this value.
+
+Nullable with no server default so existing connectors stay unlimited.
+"""
+
+import sqlalchemy as sa
+
+from alembic import op
+
+revision: str = "050"
+down_revision: str | None = "049"
+branch_labels = None
+depends_on = None
+
+
+def upgrade() -> None:
+    op.add_column(
+        "llm_connectors",
+        sa.Column("monthly_token_cap", sa.Integer(), nullable=True),
+    )
+
+
+def downgrade() -> None:
+    op.drop_column("llm_connectors", "monthly_token_cap")
+```
+
+- [ ] **Step 5: Run test to verify it passes**
+
+Run: `.venv/bin/pytest tests/test_llm_quota_cap.py -v`
+Expected: PASS (SQLite test DB recreates schema from models)
+
+- [ ] **Step 6: Verify alembic on isolated Postgres DB**
+
+Run (isolated DB avoids the shared-DB drift from sibling worktrees):
+```bash
+DATABASE_URL="postgresql+psycopg://wrzdj:wrzdj@localhost:5432/wrzdj_issue339" .venv/bin/alembic upgrade head
+DATABASE_URL="postgresql+psycopg://wrzdj:wrzdj@localhost:5432/wrzdj_issue339" .venv/bin/alembic check
+```
+Expected: `No new upgrade operations detected.`
+
+If the isolated DB was already at head from a prior run, recreate it first:
+```bash
+docker exec wrzdj-db-1 psql -U wrzdj -d postgres -c "DROP DATABASE IF EXISTS wrzdj_issue339;" -c "CREATE DATABASE wrzdj_issue339;"
+```
+
+- [ ] **Step 7: Commit**
+
+```bash
+git add server/app/models/llm_connector.py server/alembic/versions/050_llm_connector_monthly_token_cap.py server/tests/test_llm_quota_cap.py
+git commit -m "feat(llm): add monthly_token_cap column + migration 050"
+```
+
+---
+
+## Task 3: Add current-month usage aggregation + cap setter helpers
+
+**Files:**
+- Modify: `server/app/services/llm/connector_storage.py`
+- Test: `server/tests/test_llm_quota_cap.py`
+
+- [ ] **Step 1: Write the failing test**
+
+Append to `server/tests/test_llm_quota_cap.py`:
+
+```python
+from datetime import timedelta
+
+import pytest
+
+from app.core.time import utcnow
+from app.models.llm_connector import LlmCallLog
+from app.services.llm.connector_storage import (
+    current_month_token_usage,
+    set_monthly_cap,
+)
+
+
+def _log(db, connector_id, *, tokens_in, tokens_out, when=None):
+    row = LlmCallLog(
+        connector_id=connector_id,
+        purpose="test",
+        status="ok",
+        latency_ms=10,
+        tokens_in=tokens_in,
+        tokens_out=tokens_out,
+    )
+    db.add(row)
+    db.flush()
+    if when is not None:
+        row.created_at = when
+    db.commit()
+    return row
+
+
+def test_current_month_usage_sums_in_and_out(db):
+    user = _make_dj(db, username="usagedj")
+    connector = _make_connector(db, user)
+    _log(db, connector.id, tokens_in=100, tokens_out=50)
+    _log(db, connector.id, tokens_in=10, tokens_out=5)
+    assert current_month_token_usage(db, connector.id) == 165
+
+
+def test_current_month_usage_excludes_prior_months(db):
+    user = _make_dj(db, username="usagedj2")
+    connector = _make_connector(db, user)
+    # 40 days ago — previous month, must be excluded.
+    _log(db, connector.id, tokens_in=1000, tokens_out=1000, when=utcnow() - timedelta(days=40))
+    _log(db, connector.id, tokens_in=7, tokens_out=3)
+    assert current_month_token_usage(db, connector.id) == 10
+
+
+def test_current_month_usage_treats_null_tokens_as_zero(db):
+    user = _make_dj(db, username="usagedj3")
+    connector = _make_connector(db, user)
+    _log(db, connector.id, tokens_in=None, tokens_out=None)
+    _log(db, connector.id, tokens_in=5, tokens_out=None)
+    assert current_month_token_usage(db, connector.id) == 5
+
+
+def test_set_monthly_cap_accepts_positive_int(db):
+    user = _make_dj(db, username="capset")
+    connector = _make_connector(db, user)
+    set_monthly_cap(connector, 50_000)
+    assert connector.monthly_token_cap == 50_000
+
+
+def test_set_monthly_cap_accepts_none_to_clear(db):
+    user = _make_dj(db, username="capclear")
+    connector = _make_connector(db, user, monthly_token_cap=10)
+    set_monthly_cap(connector, None)
+    assert connector.monthly_token_cap is None
+
+
+def test_set_monthly_cap_rejects_negative(db):
+    user = _make_dj(db, username="capneg")
+    connector = _make_connector(db, user)
+    with pytest.raises(ValueError):
+        set_monthly_cap(connector, -1)
+```
+
+- [ ] **Step 2: Run test to verify it fails**
+
+Run: `.venv/bin/pytest tests/test_llm_quota_cap.py -v`
+Expected: FAIL — `ImportError: cannot import name 'current_month_token_usage'`
+
+- [ ] **Step 3: Implement the helpers**
+
+In `server/app/services/llm/connector_storage.py`, add a module-level helper for the month boundary and the two functions. Add near the other aggregation helpers (after `get_usage_stats`):
+
+```python
+def _calendar_month_start() -> "datetime":
+    """First instant (UTC, naive) of the current calendar month."""
+    from app.core.time import utcnow
+
+    now = utcnow()
+    return now.replace(day=1, hour=0, minute=0, second=0, microsecond=0)
+
+
+def current_month_token_usage(db: Session, connector_id: int) -> int:
+    """Sum tokens_in + tokens_out for ``connector_id`` in the current month.
+
+    Direct aggregation against the indexed ``llm_call_log.created_at`` column.
+    NULL token counts are coalesced to 0. Returns 0 when there are no rows.
+    Used by the gateway pre-flight cap check + the admin usage-vs-cap display.
+    """
+    month_start = _calendar_month_start()
+    total = db.execute(
+        select(
+            func.coalesce(func.sum(LlmCallLog.tokens_in), 0)
+            + func.coalesce(func.sum(LlmCallLog.tokens_out), 0)
+        ).where(
+            LlmCallLog.connector_id == connector_id,
+            LlmCallLog.created_at >= month_start,
+        )
+    ).scalar_one()
+    return int(total or 0)
+
+
+def set_monthly_cap(connector: LlmConnector, cap: int | None) -> LlmConnector:
+    """Set (or clear) the connector's monthly token cap. Caller commits.
+
+    ``cap=None`` clears the cap (unlimited). A non-None cap must be a
+    non-negative integer; negative values are rejected with ``ValueError``
+    (→ HTTP 400 at the API boundary).
+    """
+    if cap is not None and cap < 0:
+        raise ValueError("monthly_token_cap must be a non-negative integer or null")
+    connector.monthly_token_cap = cap
+    return connector
+```
+
+Add `datetime` to the typing import context — the `_calendar_month_start` return annotation uses a string forward-ref `"datetime"`, but for clarity add `from datetime import datetime` at the top of the module if not already imported. Check the existing imports first; if `datetime` is not imported, add it. Then change the annotation to `-> datetime:` (drop the quotes).
+
+Add both new names to the `__all__` list:
+
+```python
+    "current_month_token_usage",
+    "set_monthly_cap",
+```
+
+- [ ] **Step 4: Run test to verify it passes**
+
+Run: `.venv/bin/pytest tests/test_llm_quota_cap.py -v`
+Expected: PASS
+
+- [ ] **Step 5: Commit**
+
+```bash
+git add server/app/services/llm/connector_storage.py server/tests/test_llm_quota_cap.py
+git commit -m "feat(llm): add current-month usage aggregation + cap setter"
+```
+
+---
+
+## Task 4: Gateway pre-flight cap enforcement
+
+**Files:**
+- Modify: `server/app/services/llm/gateway.py`
+- Test: `server/tests/test_llm_quota_cap.py`
+
+- [ ] **Step 1: Write the failing test**
+
+Append to `server/tests/test_llm_quota_cap.py`:
+
+```python
+from unittest.mock import AsyncMock, patch
+
+from app.services.llm.adapters.openai_apikey import OpenAIApiKeyAdapter
+from app.services.llm.base import ChatRequest, ChatResponse, Message, TokenUsage
+from app.services.llm.exceptions import QuotaCapReached
+from app.services.llm.gateway import Gateway
+
+
+def _req() -> ChatRequest:
+    return ChatRequest(messages=[Message(role="user", content="hi")])
+
+
+@pytest.mark.asyncio
+async def test_dispatch_allows_when_under_cap(db):
+    user = _make_dj(db, username="undercap")
+    connector = _make_connector(db, user, monthly_token_cap=1_000)
+    _log(db, connector.id, tokens_in=100, tokens_out=100)  # 200 used, under 1000
+
+    fake = ChatResponse(text="ok", tool_calls=[], stop_reason="end_turn",
+                         usage=TokenUsage(prompt=5, completion=2))
+    with patch.object(OpenAIApiKeyAdapter, "chat", new=AsyncMock(return_value=fake)):
+        resp = await Gateway.dispatch(db, user, _req(), purpose="test")
+    assert resp.text == "ok"
+
+
+@pytest.mark.asyncio
+async def test_dispatch_refuses_when_cap_reached(db):
+    user = _make_dj(db, username="atcap")
+    connector = _make_connector(db, user, monthly_token_cap=200)
+    _log(db, connector.id, tokens_in=150, tokens_out=50)  # 200 used, == cap
+
+    # The adapter must NOT be called — refusal is pre-flight.
+    chat_mock = AsyncMock()
+    with patch.object(OpenAIApiKeyAdapter, "chat", new=chat_mock):
+        with pytest.raises(QuotaCapReached):
+            await Gateway.dispatch(db, user, _req(), purpose="test")
+    chat_mock.assert_not_called()
+
+
+@pytest.mark.asyncio
+async def test_dispatch_unlimited_when_cap_none(db):
+    user = _make_dj(db, username="nolimit")
+    connector = _make_connector(db, user, monthly_token_cap=None)
+    _log(db, connector.id, tokens_in=10_000, tokens_out=10_000)
+
+    fake = ChatResponse(text="ok", tool_calls=[], stop_reason="end_turn",
+                        usage=TokenUsage(prompt=1, completion=1))
+    with patch.object(OpenAIApiKeyAdapter, "chat", new=AsyncMock(return_value=fake)):
+        resp = await Gateway.dispatch(db, user, _req(), purpose="test")
+    assert resp.text == "ok"
+```
+
+- [ ] **Step 2: Run test to verify it fails**
+
+Run: `.venv/bin/pytest tests/test_llm_quota_cap.py -k cap -v`
+Expected: FAIL — `test_dispatch_refuses_when_cap_reached` fails because the adapter is called and no `QuotaCapReached` is raised.
+
+- [ ] **Step 3: Implement the pre-flight check**
+
+In `server/app/services/llm/gateway.py`:
+
+Add the import for the helper + exception. Update the `from app.services.llm.connector_storage import ...` line:
+
+```python
+from app.services.llm.connector_storage import (
+    audit_event,
+    current_month_token_usage,
+    log_call,
+)
+```
+
+Add `QuotaCapReached` to the exceptions import block:
+
+```python
+from app.services.llm.exceptions import (
+    AuthInvalid,
+    LlmError,
+    NoLlmConfigured,
+    ProviderUnavailable,
+    QuotaCapReached,
+    QuotaExceeded,
+    RateLimited,
+    ToolTranslationError,
+)
+```
+
+Add a module-level helper after `_fallback_trigger`:
+
+```python
+def _enforce_monthly_cap(db: Session, connector: LlmConnector) -> None:
+    """Pre-flight: refuse dispatch when the connector's monthly cap is reached.
+
+    No-op when the connector has no cap (``monthly_token_cap is None``).
+    Compares the current calendar month's summed token usage against the cap;
+    refuses when usage already meets or exceeds it. Raised BEFORE any provider
+    call, so no tokens are spent and editing the cap never disrupts an
+    already-dispatched (in-flight) call.
+
+    The error message is fixed and leaks no internals (usage totals, cap value,
+    connector id) — see issue #339 security note.
+    """
+    cap = connector.monthly_token_cap
+    if cap is None:
+        return
+    used = current_month_token_usage(db, connector.id)
+    if used >= cap:
+        raise QuotaCapReached(
+            "Your monthly token cap is reached. Contact your admin to raise it."
+        )
+```
+
+In `Gateway.dispatch`, add the pre-flight check immediately after `primary = _resolve_connector(...)` / `actor_id = ...` and before "Attempt 1":
+
+```python
+        primary = _resolve_connector(db, actor)
+        actor_id = actor.id if actor else _system_actor_id(db, primary)
+
+        # Pre-flight: refuse if the resolved connector's monthly cap is reached
+        # (issue #339). Raised before any provider call — no tokens spent.
+        _enforce_monthly_cap(db, primary)
+```
+
+Also enforce the cap on the fallback connector before the fallback attempt. In the fallback branch, after `fallback = _resolve_org_default(db)` and the `if fallback is None or fallback.id == primary.id: raise` guard, before the `audit_event(...)` write, add:
+
+```python
+            # The fallback connector may itself be capped — refuse rather than
+            # silently spending another DJ's budget.
+            _enforce_monthly_cap(db, fallback)
+```
+
+`QuotaCapReached` is a subclass of `LlmError` but is NOT in `_FALLBACK_TRIGGERS`, so `_fallback_trigger()` returns `None` for it and the primary-connector cap refusal short-circuits to `raise` (no fallback) — which is correct: a cap is not a transient/credential error.
+
+- [ ] **Step 4: Run tests to verify they pass**
+
+Run: `.venv/bin/pytest tests/test_llm_quota_cap.py -v`
+Expected: PASS (all cap tests)
+
+Run the full gateway suite to confirm no regression:
+Run: `.venv/bin/pytest tests/test_llm_gateway.py -v`
+Expected: PASS
+
+- [ ] **Step 5: Commit**
+
+```bash
+git add server/app/services/llm/gateway.py server/tests/test_llm_quota_cap.py
+git commit -m "feat(llm): enforce monthly token cap pre-flight in gateway dispatch"
+```
+
+---
+
+## Task 5: Expose cap in schemas + admin connectors listing
+
+**Files:**
+- Modify: `server/app/schemas/llm.py`
+- Modify: `server/app/api/admin_llm.py`
+- Test: `server/tests/test_llm_api.py`
+
+- [ ] **Step 1: Write the failing test**
+
+Add to `server/tests/test_llm_api.py` (find the admin connectors-listing test area; add a new test). First inspect the file for an existing admin connector + admin_headers fixture pattern, then add:
+
+```python
+def test_admin_connectors_listing_includes_cap_and_usage(client, db, admin_headers, dj_user):
+    # Create a connector for a DJ with a cap, and log some usage this month.
+    import json as _json
+
+    from app.models.llm_connector import LlmCallLog, LlmConnector
+
+    connector = LlmConnector(
+        user_id=dj_user.id,
+        connector_type="openai_apikey",
+        display_name="Capped",
+        status="active",
+        credentials=_json.dumps({"api_key": "sk-fake-key"}),
+        monthly_token_cap=1000,
+    )
+    db.add(connector)
+    db.commit()
+    db.refresh(connector)
+    db.add(LlmCallLog(connector_id=connector.id, purpose="test", status="ok",
+                      latency_ms=5, tokens_in=120, tokens_out=80))
+    db.commit()
+
+    resp = client.get("/api/admin/llm/connectors", headers=admin_headers)
+    assert resp.status_code == 200
+    row = next(r for r in resp.json() if r["id"] == connector.id)
+    assert row["monthly_token_cap"] == 1000
+    assert row["current_month_tokens"] == 200
+```
+
+If `test_llm_api.py` has no `dj_user` fixture, create the DJ inline (mirror the local connector-creation helpers already used in that file).
+
+- [ ] **Step 2: Run test to verify it fails**
+
+Run: `.venv/bin/pytest tests/test_llm_api.py -k cap_and_usage -v`
+Expected: FAIL — `KeyError: 'monthly_token_cap'` or `'current_month_tokens'`
+
+- [ ] **Step 3: Update schemas**
+
+In `server/app/schemas/llm.py`:
+
+Add to `ConnectorOut` (after `last_health_check_status`):
+
+```python
+    # Admin-set monthly token cap (issue #339). None = unlimited.
+    monthly_token_cap: int | None = None
+```
+
+Add to `AdminConnectorOut` (after `dj_username`):
+
+```python
+    # Current calendar-month token usage (tokens_in + tokens_out), so the admin
+    # UI can render a usage-vs-cap progress bar without a second round-trip.
+    current_month_tokens: int = 0
+```
+
+Add a new request schema near `AdminPolicyPatch`:
+
+```python
+class AdminConnectorCapPatch(BaseModel):
+    """Admin set/clear a connector's monthly token cap (issue #339).
+
+    ``monthly_token_cap = null`` clears the cap (unlimited). A non-null value
+    must be a non-negative integer; ``0`` means "no further calls this month".
+    """
+
+    monthly_token_cap: int | None = Field(default=None, ge=0, le=1_000_000_000)
+```
+
+- [ ] **Step 4: Populate `current_month_tokens` in the listing**
+
+In `server/app/api/admin_llm.py`:
+
+Import the helper:
+
+```python
+from app.services.llm.connector_storage import (
+    AUDIT_POLICY_CHANGED,
+    AUDIT_REVOKED_BY_ADMIN,
+    audit_event,
+    current_month_token_usage,
+    get_connector,
+    get_usage_stats,
+    get_user_label,
+    list_all_connectors,
+    revoke_connector,
+)
+```
+
+Update `_connector_to_admin_out` to accept and inject `current_month_tokens`:
+
+```python
+def _connector_to_admin_out(
+    row: LlmConnector, dj_username: str, current_month_tokens: int = 0
+) -> AdminConnectorOut:
+    return AdminConnectorOut.model_validate(
+        {
+            **{c.name: getattr(row, c.name) for c in LlmConnector.__table__.columns},
+            "dj_username": dj_username,
+            "current_month_tokens": current_month_tokens,
+        }
+    )
+```
+
+In `list_connectors_admin`, compute usage per row:
+
+```python
+    return [
+        _connector_to_admin_out(
+            r,
+            usernames.get(r.user_id) or f"user#{r.user_id}",
+            current_month_token_usage(db, r.id),
+        )
+        for r in rows
+    ]
+```
+
+Update the two other `_connector_to_admin_out(...)` call sites in `revoke_connector_admin` (and the new cap endpoint in Task 6) to pass `current_month_token_usage(db, row.id)`.
+
+- [ ] **Step 5: Run test to verify it passes**
+
+Run: `.venv/bin/pytest tests/test_llm_api.py -k cap_and_usage -v`
+Expected: PASS
+
+- [ ] **Step 6: Commit**
+
+```bash
+git add server/app/schemas/llm.py server/app/api/admin_llm.py server/tests/test_llm_api.py
+git commit -m "feat(llm): expose monthly cap + current-month usage in admin listing"
+```
+
+---
+
+## Task 6: Admin PATCH endpoint to set/clear a connector cap
+
+**Files:**
+- Modify: `server/app/api/admin_llm.py`
+- Test: `server/tests/test_llm_api.py`
+
+- [ ] **Step 1: Write the failing test**
+
+Add to `server/tests/test_llm_api.py`:
+
+```python
+def test_admin_set_connector_cap(client, db, admin_headers, dj_user):
+    import json as _json
+
+    from app.models.llm_connector import LlmConnector
+
+    connector = LlmConnector(
+        user_id=dj_user.id, connector_type="openai_apikey", display_name="C",
+        status="active", credentials=_json.dumps({"api_key": "sk-fake-key"}),
+    )
+    db.add(connector)
+    db.commit()
+    db.refresh(connector)
+
+    resp = client.patch(
+        f"/api/admin/llm/connectors/{connector.id}/cap",
+        headers=admin_headers,
+        json={"monthly_token_cap": 50000},
+    )
+    assert resp.status_code == 200
+    assert resp.json()["monthly_token_cap"] == 50000
+
+    # Clear it.
+    resp = client.patch(
+        f"/api/admin/llm/connectors/{connector.id}/cap",
+        headers=admin_headers,
+        json={"monthly_token_cap": None},
+    )
+    assert resp.status_code == 200
+    assert resp.json()["monthly_token_cap"] is None
+
+
+def test_admin_set_cap_rejects_negative(client, db, admin_headers, dj_user):
+    import json as _json
+
+    from app.models.llm_connector import LlmConnector
+
+    connector = LlmConnector(
+        user_id=dj_user.id, connector_type="openai_apikey", display_name="C2",
+        status="active", credentials=_json.dumps({"api_key": "sk-fake-key"}),
+    )
+    db.add(connector)
+    db.commit()
+    db.refresh(connector)
+
+    resp = client.patch(
+        f"/api/admin/llm/connectors/{connector.id}/cap",
+        headers=admin_headers,
+        json={"monthly_token_cap": -5},
+    )
+    assert resp.status_code == 422  # Pydantic ge=0 rejection
+
+
+def test_admin_set_cap_404_for_missing_connector(client, admin_headers):
+    resp = client.patch(
+        "/api/admin/llm/connectors/999999/cap",
+        headers=admin_headers,
+        json={"monthly_token_cap": 100},
+    )
+    assert resp.status_code == 404
+
+
+def test_set_cap_requires_admin(client, db, auth_headers, test_user):
+    # A non-admin (plain DJ) must be rejected.
+    import json as _json
+
+    from app.models.llm_connector import LlmConnector
+
+    connector = LlmConnector(
+        user_id=test_user.id, connector_type="openai_apikey", display_name="C3",
+        status="active", credentials=_json.dumps({"api_key": "sk-fake-key"}),
+    )
+    db.add(connector)
+    db.commit()
+    db.refresh(connector)
+
+    resp = client.patch(
+        f"/api/admin/llm/connectors/{connector.id}/cap",
+        headers=auth_headers,
+        json={"monthly_token_cap": 100},
+    )
+    assert resp.status_code == 403
+```
+
+- [ ] **Step 2: Run test to verify it fails**
+
+Run: `.venv/bin/pytest tests/test_llm_api.py -k cap -v`
+Expected: FAIL — 404/405 (endpoint not yet defined)
+
+- [ ] **Step 3: Add the endpoint**
+
+In `server/app/api/admin_llm.py`:
+
+Add `AdminConnectorCapPatch` to the schema imports and `set_monthly_cap` + audit constant to the storage imports. Add a new audit constant usage — reuse `AUDIT_POLICY_CHANGED` for cap changes (it is the closest existing lifecycle event and avoids a model change), OR add a dedicated `AUDIT_CAP_CHANGED` if preferred. Use `AUDIT_POLICY_CHANGED` to avoid touching the model's audit constants and migrations.
+
+Imports:
+
+```python
+from app.schemas.llm import (
+    AdminAuditOut,
+    AdminConnectorCapPatch,
+    AdminConnectorOut,
+    AdminPolicyOut,
+    AdminPolicyPatch,
+    AdminUsageOut,
+    AuditEventRow,
+    UsageRow,
+)
+from app.services.llm.connector_storage import (
+    AUDIT_POLICY_CHANGED,
+    AUDIT_REVOKED_BY_ADMIN,
+    audit_event,
+    current_month_token_usage,
+    get_connector,
+    get_usage_stats,
+    get_user_label,
+    list_all_connectors,
+    revoke_connector,
+    set_monthly_cap,
+)
+```
+
+Add the endpoint (place it after `revoke_connector_admin`):
+
+```python
+@router.patch("/connectors/{connector_id}/cap", response_model=AdminConnectorOut)
+@limiter.limit("30/minute")
+def set_connector_cap_admin(
+    request: FastAPIRequest,
+    connector_id: int,
+    payload: AdminConnectorCapPatch,
+    admin: User = Depends(get_current_admin),
+    db: Session = Depends(get_db),
+) -> AdminConnectorOut:
+    """Set or clear a connector's monthly token cap (admin-only, issue #339).
+
+    ``monthly_token_cap = null`` clears the cap (unlimited). The change is
+    pre-flight only: an in-flight gateway call already past its cap check is
+    unaffected. Pydantic enforces the non-negative bound (``ge=0``).
+    """
+    row = get_connector(db, connector_id)
+    if row is None:
+        raise HTTPException(status_code=404, detail="Connector not found")
+
+    try:
+        set_monthly_cap(row, payload.monthly_token_cap)
+    except ValueError as exc:
+        raise HTTPException(status_code=400, detail=str(exc)) from exc
+
+    audit_event(
+        db,
+        actor_user_id=admin.id,
+        target_connector_id=row.id,
+        event_type=AUDIT_POLICY_CHANGED,
+    )
+    db.commit()
+    db.refresh(row)
+    return _connector_to_admin_out(
+        row, get_user_label(db, row.user_id), current_month_token_usage(db, row.id)
+    )
+```
+
+Also update `revoke_connector_admin`'s final return to pass usage:
+
+```python
+    return _connector_to_admin_out(
+        row, get_user_label(db, row.user_id), current_month_token_usage(db, row.id)
+    )
+```
+
+- [ ] **Step 4: Run tests to verify they pass**
+
+Run: `.venv/bin/pytest tests/test_llm_api.py -k cap -v`
+Expected: PASS
+
+- [ ] **Step 5: Commit**
+
+```bash
+git add server/app/api/admin_llm.py server/tests/test_llm_api.py
+git commit -m "feat(llm): admin endpoint to set/clear per-connector monthly cap"
+```
+
+---
+
+## Task 7: Surface `QuotaCapReached` as a clear DJ-facing error
+
+**Files:**
+- Modify: `server/app/api/events.py:923-988` (the `/recommendations/llm` endpoint)
+- Test: `server/tests/test_llm_recommendation_via_gateway.py` (or `test_llm_quota_cap.py`)
+
+- [ ] **Step 1: Write the failing test**
+
+Inspect `server/tests/test_llm_recommendation_via_gateway.py` for the existing event + DJ + connector fixture pattern and how `/recommendations/llm` is exercised. Add a test that pre-fills usage at/over a cap and asserts a 429 with the DJ-facing message:
+
+```python
+def test_llm_recommendation_returns_429_when_cap_reached(client, db, ...):
+    # ... set up event owned by a DJ with a capped, active connector and
+    # a connected music service (tidal/beatport token), then log usage >= cap.
+    # POST /api/events/{code}/recommendations/llm with a prompt.
+    assert resp.status_code == 429
+    assert "monthly token cap is reached" in resp.json()["detail"].lower()
+```
+
+Model this test on the existing setup in `test_llm_recommendation_via_gateway.py`. If that file's fixtures are too heavy to reuse cleanly, instead unit-test the mapping by patching `generate_recommendations_from_llm` to raise `QuotaCapReached` and asserting the endpoint returns 429 with the message.
+
+- [ ] **Step 2: Run test to verify it fails**
+
+Run: `.venv/bin/pytest tests/test_llm_recommendation_via_gateway.py -k cap -v`
+Expected: FAIL — endpoint returns 502 (generic) instead of 429 with the cap message.
+
+- [ ] **Step 3: Handle `QuotaCapReached` before the generic catch**
+
+In `server/app/api/events.py`, in `get_llm_recommendations`, change the try/except around `generate_recommendations_from_llm` to catch the cap error first:
+
+```python
+    from app.services.llm.exceptions import QuotaCapReached
+
+    try:
+        result = await generate_recommendations_from_llm(db, user, event, prompt_request.prompt)
+    except QuotaCapReached as exc:
+        # DJ-facing message only — no internal usage/cap details leaked.
+        raise HTTPException(status_code=429, detail=str(exc)) from exc
+    except Exception:
+        import logging
+
+        logging.getLogger(__name__).exception("LLM recommendation failed")
+        raise HTTPException(
+            status_code=502,
+            detail="LLM service error. Try again or use algorithmic recommendations.",
+        )
+```
+
+Place the `from app.services.llm.exceptions import QuotaCapReached` import with the other local imports at the top of the function (next to the existing `from app.services.recommendation...` imports).
+
+- [ ] **Step 4: Run test to verify it passes**
+
+Run: `.venv/bin/pytest tests/test_llm_recommendation_via_gateway.py -k cap -v`
+Expected: PASS
+
+- [ ] **Step 5: Commit**
+
+```bash
+git add server/app/api/events.py server/tests/test_llm_recommendation_via_gateway.py
+git commit -m "feat(llm): surface QuotaCapReached as 429 with DJ-facing message"
+```
+
+---
+
+## Task 8: Regenerate frontend types + add api.ts method
+
+**Files:**
+- Modify: `dashboard/lib/api-types.generated.ts` (regenerated)
+- Modify: `dashboard/lib/api-types.ts` (add `LlmAdminConnectorCapPatch` alias)
+- Modify: `dashboard/lib/api.ts`
+- Test: `dashboard/lib/__tests__/api.test.ts`
+
+- [ ] **Step 1: Regenerate types from backend OpenAPI**
+
+Run from `dashboard/`:
+```bash
+npm run types:export
+npm run types:generate
+```
+Verify `AdminConnectorCapPatch` and `current_month_tokens` / `monthly_token_cap` appear in `dashboard/lib/api-types.generated.ts`.
+
+- [ ] **Step 2: Add type alias**
+
+In `dashboard/lib/api-types.ts`, near the other LLM aliases:
+
+```typescript
+export type LlmAdminConnectorCapPatch = Schemas['AdminConnectorCapPatch'];
+```
+
+- [ ] **Step 3: Write the failing test**
+
+In `dashboard/lib/__tests__/api.test.ts`, add a test mirroring the existing admin-LLM method tests (find one like `revokeAdminLlmConnector`):
+
+```typescript
+it('setAdminLlmConnectorCap PATCHes the cap endpoint', async () => {
+  const connector = { id: 7, monthly_token_cap: 5000 };
+  mockFetchOnce(connector);
+  const result = await api.setAdminLlmConnectorCap(7, 5000);
+  expect(lastFetchUrl()).toContain('/api/admin/llm/connectors/7/cap');
+  expect(lastFetchInit().method).toBe('PATCH');
+  expect(JSON.parse(lastFetchInit().body as string)).toEqual({ monthly_token_cap: 5000 });
+  expect(result).toEqual(connector);
+});
+```
+
+Adjust `mockFetchOnce`/`lastFetchUrl`/`lastFetchInit` to match the helpers already used in that test file.
+
+- [ ] **Step 4: Run test to verify it fails**
+
+Run from `dashboard/`: `npm test -- --run api.test`
+Expected: FAIL — `api.setAdminLlmConnectorCap is not a function`
+
+- [ ] **Step 5: Add the method**
+
+In `dashboard/lib/api.ts`, in the "Admin LLM policy + oversight" section (after `getAdminLlmUsage`):
+
+```typescript
+  async setAdminLlmConnectorCap(
+    id: number,
+    monthlyTokenCap: number | null,
+  ): Promise<LlmAdminConnector> {
+    return this.fetch(`/api/admin/llm/connectors/${id}/cap`, {
+      method: 'PATCH',
+      body: JSON.stringify({ monthly_token_cap: monthlyTokenCap }),
+    });
+  }
+```
+
+Add `LlmAdminConnectorCapPatch` to the imports if you reference it; the method signature above uses primitives, so an import is optional.
+
+- [ ] **Step 6: Run test to verify it passes**
+
+Run from `dashboard/`: `npm test -- --run api.test`
+Expected: PASS
+
+- [ ] **Step 7: Commit**
+
+```bash
+git add dashboard/lib/api-types.generated.ts dashboard/lib/api-types.ts dashboard/lib/api.ts dashboard/lib/__tests__/api.test.ts
+git commit -m "feat(ai-ui): add setAdminLlmConnectorCap api client method + types"
+```
+
+---
+
+## Task 9: Admin UI — cap input + usage-vs-cap progress bar
+
+**Files:**
+- Modify: `dashboard/app/admin/ai/page.tsx`
+- Test: extend the page's test if one exists, otherwise a focused logic test for the percent helper.
+
+- [ ] **Step 1: Add a cap-percent helper + extract a small pure function (testable)**
+
+In `dashboard/app/admin/ai/page.tsx`, add near the top-level helpers (e.g. after `formatTimestamp`):
+
+```typescript
+// Percent of the monthly cap consumed. Returns null when there is no cap
+// (unlimited) so the UI can render "Unlimited" instead of a bar. Clamps to
+// 0–100 so an over-cap connector (possible: cap lowered mid-month) shows full.
+function capPercent(used: number, cap: number | null | undefined): number | null {
+  if (cap == null) return null;
+  if (cap === 0) return 100;
+  return Math.min(100, Math.max(0, Math.round((used / cap) * 100)));
+}
+```
+
+- [ ] **Step 2: Add a "Monthly cap" column to the connectors table**
+
+Add a `<PlainHeader label="Monthly cap" />` to the table head (after "Result", before "Actions").
+
+In each connector `<tr>`, add a cell that shows the current usage, an editable cap input, and a progress bar:
+
+```tsx
+                    <td style={{ padding: '0.5rem', minWidth: '180px' }}>
+                      <div style={{ display: 'flex', alignItems: 'center', gap: '0.5rem' }}>
+                        <input
+                          type="number"
+                          className="input"
+                          style={{ width: '110px' }}
+                          min={0}
+                          placeholder="∞"
+                          defaultValue={c.monthly_token_cap ?? ''}
+                          onBlur={(e) => handleCapBlur(c, e.target.value)}
+                          aria-label={`Monthly token cap for ${c.dj_username} ${c.display_name}`}
+                        />
+                      </div>
+                      <div style={{ marginTop: '0.35rem', fontSize: '0.75rem', color: 'var(--text-secondary)' }}>
+                        {c.monthly_token_cap == null
+                          ? `${c.current_month_tokens.toLocaleString()} this month · unlimited`
+                          : `${c.current_month_tokens.toLocaleString()} / ${c.monthly_token_cap.toLocaleString()}`}
+                      </div>
+                      {c.monthly_token_cap != null && (
+                        <div
+                          aria-hidden
+                          style={{
+                            marginTop: '0.25rem',
+                            height: '6px',
+                            borderRadius: '9999px',
+                            background: 'var(--border-color)',
+                            overflow: 'hidden',
+                          }}
+                        >
+                          <div
+                            style={{
+                              width: `${capPercent(c.current_month_tokens, c.monthly_token_cap) ?? 0}%`,
+                              height: '100%',
+                              background:
+                                (capPercent(c.current_month_tokens, c.monthly_token_cap) ?? 0) >= 100
+                                  ? 'var(--color-danger)'
+                                  : (capPercent(c.current_month_tokens, c.monthly_token_cap) ?? 0) >= 80
+                                    ? 'var(--color-warning, #c08418)'
+                                    : 'var(--color-success)',
+                            }}
+                          />
+                        </div>
+                      )}
+                    </td>
+```
+
+- [ ] **Step 3: Add the `handleCapBlur` handler**
+
+Add inside the component (near `handleRevoke`):
+
+```typescript
+  const handleCapBlur = async (connector: LlmAdminConnector, raw: string) => {
+    const trimmed = raw.trim();
+    // Empty input clears the cap (unlimited).
+    let next: number | null;
+    if (trimmed === '') {
+      next = null;
+    } else {
+      const parsed = parseInt(trimmed, 10);
+      if (Number.isNaN(parsed) || parsed < 0) {
+        setError('Monthly cap must be a non-negative whole number.');
+        return;
+      }
+      next = parsed;
+    }
+    // No-op when unchanged.
+    if (next === (connector.monthly_token_cap ?? null)) return;
+    try {
+      const updated = await api.setAdminLlmConnectorCap(connector.id, next);
+      setConnectors((prev) => prev.map((c) => (c.id === connector.id ? updated : c)));
+    } catch (err) {
+      setError(err instanceof Error ? err.message : 'Failed to update cap');
+    }
+  };
+```
+
+- [ ] **Step 4: Type check + lint + tests**
+
+Run from `dashboard/`:
+```bash
+npx tsc --noEmit
+npm run lint
+npm test -- --run
+git checkout next-env.d.ts 2>/dev/null || true
+```
+Expected: all green. Fix any type errors (e.g. `current_month_tokens` should be a `number` on `LlmAdminConnector` from the regenerated types).
+
+- [ ] **Step 5: Commit**
+
+```bash
+git add dashboard/app/admin/ai/page.tsx
+git commit -m "feat(ai-ui): admin cap input + usage-vs-cap progress bar per connector"
+```
+
+---
+
+## Task 10: Full local CI + finalize
+
+- [ ] **Step 1: Backend CI**
+
+From `server/`:
+```bash
+.venv/bin/ruff check .
+.venv/bin/ruff format --check .
+.venv/bin/bandit -r app -c pyproject.toml -q
+.venv/bin/pytest --tb=short -q
+```
+Fix anything red. Run `.venv/bin/ruff format .` then `.venv/bin/ruff check --fix .` if needed.
+
+- [ ] **Step 2: Alembic on isolated DB**
+
+```bash
+docker exec wrzdj-db-1 psql -U wrzdj -d postgres -c "DROP DATABASE IF EXISTS wrzdj_issue339;" -c "CREATE DATABASE wrzdj_issue339;"
+DATABASE_URL="postgresql+psycopg://wrzdj:wrzdj@localhost:5432/wrzdj_issue339" .venv/bin/alembic upgrade head
+DATABASE_URL="postgresql+psycopg://wrzdj:wrzdj@localhost:5432/wrzdj_issue339" .venv/bin/alembic check
+```
+Expected: `No new upgrade operations detected.`
+
+- [ ] **Step 3: Frontend CI**
+
+From `dashboard/`:
+```bash
+npm run lint
+npx tsc --noEmit
+npm test -- --run
+git checkout next-env.d.ts 2>/dev/null || true
+```
+
+- [ ] **Step 4: Push + PR**
+
+Use `superpowers:finishing-a-development-branch` option 2. Create the PR with `gh pr create --base epic/ai-engine`. PR body MUST include `Closes #339`, a `## Design decisions` section (direct-aggregation rationale, pre-flight-only enforcement, reuse of `AUDIT_POLICY_CHANGED`, 429 mapping), and a note that it targets `epic/ai-engine`.
+
+---
+
+## Self-Review Notes
+
+- **Spec coverage:** column (T2), aggregation (T3), pre-flight `QuotaCapReached` (T4), admin set/edit endpoint (T6), DJ-facing message (T4 msg + T7 mapping), admin UI cap input + progress bar (T9). Acceptance: cap enforced (T4), clear DJ error (T4/T7), admin edits without disrupting in-flight calls (pre-flight-only, documented T4/T6). ✓
+- **Type consistency:** `current_month_token_usage(db, connector_id)`, `set_monthly_cap(connector, cap)`, `monthly_token_cap`, `current_month_tokens`, `setAdminLlmConnectorCap(id, cap)`, `capPercent(used, cap)`, `handleCapBlur(connector, raw)` used consistently across tasks. ✓
+- **Security:** Pydantic `ge=0` + service `ValueError` guard; admin-only via `get_current_admin`; fixed DJ-facing message leaks no internals; parameterized SQLAlchemy queries only. ✓
diff --git a/docs/superpowers/plans/2026-05-28-llm-gateway-streaming.md b/docs/superpowers/plans/2026-05-28-llm-gateway-streaming.md
new file mode 100644
index 00000000..0b3b06b8
--- /dev/null
+++ b/docs/superpowers/plans/2026-05-28-llm-gateway-streaming.md
@@ -0,0 +1,1861 @@
+# LLM Gateway Streaming Support Implementation Plan
+
+> **For agentic workers:** REQUIRED SUB-SKILL: Use superpowers:subagent-driven-development (recommended) or superpowers:executing-plans to implement this plan task-by-task. Steps use checkbox (`- [ ]`) syntax for tracking.
+
+**Goal:** Add provider-agnostic streaming (`Gateway.stream`) to the LLM Gateway with native SSE for OpenAI, Anthropic, and OpenAI-compatible adapters, an authenticated SSE backend endpoint, and a minimal frontend consumer — closing GitHub issue #335.
+
+**Architecture:** A new `ChatResponseChunk` canonical model carries incremental text, partial tool-call fragments, and (on the final chunk) `stop_reason` + `usage`. The `LlmAdapter` ABC gains an `async def stream(self, request) -> AsyncIterator[ChatResponseChunk]` with a default that raises `StreamingUnsupported`. OpenAI-wire adapters (platform + compatible) parse SSE `data:` lines with incremental tool-call JSON assembly; the Anthropic adapter consumes the SDK's typed event stream (content_block_delta / input_json_delta). `Gateway.stream` mirrors `dispatch`'s connector resolution and writes a single counts-only `llm_call_log` row (plus auth/audit rows) when the stream completes or errors. A new authenticated `POST /api/llm/connectors/{id}/stream-test` endpoint emits `text/event-stream`; client disconnect cancels the upstream request via async generator cleanup. The frontend gets an `apiClient.streamConnectorTest()` consumer using `fetch` + `ReadableStream` (EventSource cannot send the Bearer header).
+
+**Tech Stack:** Python / FastAPI / `sse_starlette` (already a dep) / `httpx` async streaming / `anthropic` SDK `messages.stream()` / pytest-asyncio. Frontend: Next.js / TypeScript / `fetch` streaming.
+
+---
+
+## File Structure
+
+- **Create** `server/app/services/llm/streaming.py` — `ChatResponseChunk` model + `StreamingUnsupported` exception + shared SSE-line helpers (`iter_sse_data_lines`, OpenAI partial tool-call accumulator). One responsibility: streaming primitives shared by adapters.
+- **Modify** `server/app/services/llm/base.py` — add `stream()` to the `LlmAdapter` ABC with a non-abstract default that raises `StreamingUnsupported`; re-export `ChatResponseChunk`.
+- **Modify** `server/app/services/llm/exceptions.py` — add `StreamingUnsupported(LlmError)`.
+- **Modify** `server/app/services/llm/adapters/_httpx_openai.py` — add `stream_openai_chat(...)` async generator.
+- **Modify** `server/app/services/llm/adapters/openai_apikey.py` — implement `stream()`.
+- **Modify** `server/app/services/llm/adapters/openai_compatible.py` — implement `stream()`.
+- **Modify** `server/app/services/llm/adapters/anthropic_apikey.py` — implement `stream()`.
+- **Modify** `server/app/services/llm/gateway.py` — add `Gateway.stream(...)` + `_attempt_stream(...)` helper (additive, separate functions — no edits to existing `dispatch`/`_attempt` bodies, to minimize merge conflicts with siblings #337/#339).
+- **Modify** `server/app/api/llm.py` — add `POST /connectors/{id}/stream-test` SSE endpoint.
+- **Modify** `dashboard/lib/api.ts` — add `streamConnectorTest(id, onChunk)` consumer + a `StreamChunk` type.
+- **Modify** `dashboard/app/admin/ai/page.tsx` — wire a minimal "stream test" affordance OR document scope as plumbing-only (decision recorded in Task 11).
+- **Create** `server/tests/test_llm_streaming.py` — chunk model + adapter stream parsing (OpenAI text, OpenAI tool-call fragments, Anthropic deltas, compatible, unsupported default).
+- **Create** `server/tests/test_llm_gateway_stream.py` — gateway resolution + logging + cancellation propagation.
+- **Create** `server/tests/test_llm_stream_endpoint.py` — SSE endpoint auth + content-type + body shape.
+
+---
+
+## Task 1: `ChatResponseChunk` model + `StreamingUnsupported` exception
+
+**Files:**
+- Create: `server/app/services/llm/streaming.py`
+- Modify: `server/app/services/llm/exceptions.py`
+- Modify: `server/app/services/llm/base.py`
+- Test: `server/tests/test_llm_streaming.py`
+
+- [ ] **Step 1: Write the failing test**
+
+```python
+# server/tests/test_llm_streaming.py
+"""Tests for streaming primitives: ChatResponseChunk + SSE helpers."""
+
+from __future__ import annotations
+
+from app.services.llm.base import ChatResponseChunk, LlmAdapter
+from app.services.llm.exceptions import StreamingUnsupported
+
+
+def test_chunk_defaults_are_empty():
+    chunk = ChatResponseChunk()
+    assert chunk.text_delta == ""
+    assert chunk.tool_call_deltas == []
+    assert chunk.stop_reason is None
+    assert chunk.usage is None
+    assert chunk.done is False
+
+
+def test_chunk_final_carries_stop_reason_and_usage():
+    from app.services.llm.base import TokenUsage
+
+    chunk = ChatResponseChunk(
+        stop_reason="end_turn",
+        usage=TokenUsage(prompt=3, completion=5),
+        done=True,
+    )
+    assert chunk.done is True
+    assert chunk.stop_reason == "end_turn"
+    assert chunk.usage.completion == 5
+
+
+def test_tool_call_delta_fragment_shape():
+    from app.services.llm.base import ToolCallDelta
+
+    delta = ToolCallDelta(index=0, id="call_1", name="search", input_json_fragment='{"q":')
+    assert delta.index == 0
+    assert delta.id == "call_1"
+    assert delta.name == "search"
+    assert delta.input_json_fragment == '{"q":'
+```
+
+- [ ] **Step 2: Run test to verify it fails**
+
+Run: `cd server && .venv/bin/pytest tests/test_llm_streaming.py -q`
+Expected: FAIL with `ImportError: cannot import name 'ChatResponseChunk'`
+
+- [ ] **Step 3: Add `StreamingUnsupported` to exceptions**
+
+In `server/app/services/llm/exceptions.py`, append:
+
+```python
+
+
+class StreamingUnsupported(LlmError):
+    """The resolved adapter does not implement provider-native streaming."""
+```
+
+- [ ] **Step 4: Create `streaming.py` with chunk-side helpers (model lives in base.py)**
+
+The chunk + delta models live in `base.py` (Task adds them there) so they sit alongside `ChatResponse`. `streaming.py` holds the SSE-line helpers only — created in Task 4. For this task, only add the models to `base.py`.
+
+In `server/app/services/llm/base.py`, after `ChatResponse`, add:
+
+```python
+class ToolCallDelta(BaseModel):
+    """A fragment of a streamed tool call.
+
+    Providers emit tool-call arguments incrementally. ``index`` groups fragments
+    belonging to the same call (OpenAI sends an array index; Anthropic uses the
+    content-block index). ``id`` / ``name`` arrive once at the start of a call;
+    ``input_json_fragment`` carries the raw, possibly-partial argument JSON text.
+    Consumers concatenate fragments per ``index`` and JSON-parse the result when
+    the stream completes.
+    """
+
+    index: int
+    id: str | None = None
+    name: str | None = None
+    input_json_fragment: str = ""
+
+
+class ChatResponseChunk(BaseModel):
+    """One incremental chunk of a streamed chat response.
+
+    Non-final chunks carry ``text_delta`` and/or ``tool_call_deltas``. The final
+    chunk sets ``done=True`` and carries the canonical ``stop_reason`` plus
+    ``usage`` (when the provider reports it). ``stop_reason``/``usage`` may be
+    ``None`` on every non-final chunk.
+    """
+
+    text_delta: str = ""
+    tool_call_deltas: list[ToolCallDelta] = Field(default_factory=list)
+    stop_reason: Literal["end_turn", "tool_use", "max_tokens", "error"] | None = None
+    usage: TokenUsage | None = None
+    done: bool = False
+```
+
+- [ ] **Step 5: Add `stream()` default to the `LlmAdapter` ABC**
+
+In `server/app/services/llm/base.py`, add these imports at the top (merge with existing):
+
+```python
+from collections.abc import AsyncIterator
+```
+
+Then inside `class LlmAdapter`, after `health_check`, add:
+
+```python
+    async def stream(self, request: ChatRequest) -> AsyncIterator[ChatResponseChunk]:
+        """Stream a chat response as incremental chunks.
+
+        Default raises :class:`StreamingUnsupported`. Adapters that support
+        provider-native streaming override this. The body is unreachable but
+        present so the method is an async generator for type-checkers.
+        """
+        from app.services.llm.exceptions import StreamingUnsupported
+
+        raise StreamingUnsupported(
+            f"connector_type={self.connector_type!r} does not support streaming"
+        )
+        yield  # pragma: no cover  (makes this an async generator)
+```
+
+- [ ] **Step 6: Run test to verify it passes**
+
+Run: `cd server && .venv/bin/pytest tests/test_llm_streaming.py -q`
+Expected: PASS (3 tests)
+
+- [ ] **Step 7: Commit**
+
+```bash
+git add server/app/services/llm/base.py server/app/services/llm/exceptions.py server/tests/test_llm_streaming.py
+git commit -m "feat(llm): add ChatResponseChunk + streaming ABC default"
+```
+
+---
+
+## Task 2: Default `stream()` raises `StreamingUnsupported`
+
+**Files:**
+- Test: `server/tests/test_llm_streaming.py`
+
+- [ ] **Step 1: Write the failing test**
+
+Append to `server/tests/test_llm_streaming.py`:
+
+```python
+import pytest
+
+from app.services.llm.base import ChatRequest, Message
+
+
+class _BareAdapter(LlmAdapter):
+    connector_type = "bare"
+
+    async def chat(self, request):  # pragma: no cover
+        raise NotImplementedError
+
+    async def health_check(self):  # pragma: no cover
+        raise NotImplementedError
+
+
+@pytest.mark.asyncio
+async def test_default_stream_raises_streaming_unsupported():
+    adapter = _BareAdapter(connector=None)
+    req = ChatRequest(messages=[Message(role="user", content="hi")])
+    with pytest.raises(StreamingUnsupported):
+        async for _ in adapter.stream(req):
+            pass
+```
+
+- [ ] **Step 2: Run test to verify it passes (default already implemented in Task 1)**
+
+Run: `cd server && .venv/bin/pytest tests/test_llm_streaming.py::test_default_stream_raises_streaming_unsupported -q`
+Expected: PASS
+
+- [ ] **Step 3: Commit**
+
+```bash
+git add server/tests/test_llm_streaming.py
+git commit -m "test(llm): default adapter stream raises StreamingUnsupported"
+```
+
+---
+
+## Task 3: OpenAI partial tool-call accumulator helper
+
+**Files:**
+- Create: `server/app/services/llm/streaming.py`
+- Test: `server/tests/test_llm_streaming.py`
+
+- [ ] **Step 1: Write the failing test**
+
+Append to `server/tests/test_llm_streaming.py`:
+
+```python
+def test_parse_openai_stream_line_text():
+    from app.services.llm.streaming import parse_openai_stream_event
+
+    chunk = parse_openai_stream_event(
+        {"choices": [{"delta": {"content": "Hello"}, "finish_reason": None}]}
+    )
+    assert chunk is not None
+    assert chunk.text_delta == "Hello"
+    assert chunk.tool_call_deltas == []
+    assert chunk.done is False
+
+
+def test_parse_openai_stream_line_tool_call_fragment():
+    from app.services.llm.streaming import parse_openai_stream_event
+
+    chunk = parse_openai_stream_event(
+        {
+            "choices": [
+                {
+                    "delta": {
+                        "tool_calls": [
+                            {
+                                "index": 0,
+                                "id": "call_1",
+                                "function": {"name": "search", "arguments": '{"q":'},
+                            }
+                        ]
+                    },
+                    "finish_reason": None,
+                }
+            ]
+        }
+    )
+    assert chunk is not None
+    assert chunk.text_delta == ""
+    assert len(chunk.tool_call_deltas) == 1
+    d = chunk.tool_call_deltas[0]
+    assert d.index == 0 and d.id == "call_1" and d.name == "search"
+    assert d.input_json_fragment == '{"q":'
+
+
+def test_parse_openai_stream_line_finish():
+    from app.services.llm.streaming import parse_openai_stream_event
+
+    chunk = parse_openai_stream_event(
+        {
+            "choices": [{"delta": {}, "finish_reason": "tool_calls"}],
+            "usage": {"prompt_tokens": 7, "completion_tokens": 11},
+        }
+    )
+    assert chunk is not None
+    assert chunk.done is True
+    assert chunk.stop_reason == "tool_use"
+    assert chunk.usage is not None and chunk.usage.prompt == 7
+```
+
+- [ ] **Step 2: Run test to verify it fails**
+
+Run: `cd server && .venv/bin/pytest tests/test_llm_streaming.py -k parse_openai_stream -q`
+Expected: FAIL with `ModuleNotFoundError`/`ImportError` for `streaming.parse_openai_stream_event`
+
+- [ ] **Step 3: Create `streaming.py` helpers**
+
+```python
+# server/app/services/llm/streaming.py
+"""Shared streaming primitives for LLM adapters.
+
+Holds SSE-line parsing helpers reused by the OpenAI-wire adapters. The chunk /
+delta models themselves live in ``base.py`` alongside ``ChatResponse``.
+"""
+
+from __future__ import annotations
+
+from app.services.llm.base import ChatResponseChunk, ToolCallDelta, TokenUsage
+from app.services.llm.tool_translation import _normalise_finish_reason  # noqa: PLC2701
+
+# OpenAI streaming finish_reason → canonical, reusing the non-stream mapping.
+_FINISH_REASON_OPENAI = {
+    "stop": "end_turn",
+    "tool_calls": "tool_use",
+    "function_call": "tool_use",
+    "length": "max_tokens",
+}
+
+
+def parse_openai_stream_event(payload: dict) -> ChatResponseChunk | None:
+    """Translate one parsed OpenAI streaming JSON object into a chunk.
+
+    Returns ``None`` for payloads carrying no usable signal (e.g. the initial
+    role-only delta). The final event sets ``done=True`` with the mapped
+    ``stop_reason`` and (when present) token usage.
+    """
+    choices = payload.get("choices") or []
+    choice = choices[0] if choices else {}
+    delta = choice.get("delta") or {}
+
+    text_delta = delta.get("content") or ""
+
+    tool_call_deltas: list[ToolCallDelta] = []
+    for tc in delta.get("tool_calls") or []:
+        if not isinstance(tc, dict):
+            continue
+        fn = tc.get("function") or {}
+        tool_call_deltas.append(
+            ToolCallDelta(
+                index=int(tc.get("index", 0)),
+                id=tc.get("id"),
+                name=(fn.get("name") if isinstance(fn, dict) else None),
+                input_json_fragment=(
+                    (fn.get("arguments") or "") if isinstance(fn, dict) else ""
+                ),
+            )
+        )
+
+    finish_reason = choice.get("finish_reason")
+    usage_payload = payload.get("usage") or {}
+
+    done = finish_reason is not None
+    stop_reason = None
+    usage = None
+    if done:
+        stop_reason = _normalise_finish_reason(finish_reason, _FINISH_REASON_OPENAI)
+        if usage_payload:
+            usage = TokenUsage(
+                prompt=int(usage_payload.get("prompt_tokens", 0)),
+                completion=int(usage_payload.get("completion_tokens", 0)),
+            )
+
+    if not text_delta and not tool_call_deltas and not done:
+        return None
+
+    return ChatResponseChunk(
+        text_delta=text_delta,
+        tool_call_deltas=tool_call_deltas,
+        stop_reason=stop_reason,
+        usage=usage,
+        done=done,
+    )
+```
+
+- [ ] **Step 4: Run test to verify it passes**
+
+Run: `cd server && .venv/bin/pytest tests/test_llm_streaming.py -k parse_openai_stream -q`
+Expected: PASS (3 tests)
+
+- [ ] **Step 5: Commit**
+
+```bash
+git add server/app/services/llm/streaming.py server/tests/test_llm_streaming.py
+git commit -m "feat(llm): OpenAI streaming event → ChatResponseChunk parser"
+```
+
+---
+
+## Task 4: `stream_openai_chat` async generator (httpx)
+
+**Files:**
+- Modify: `server/app/services/llm/adapters/_httpx_openai.py`
+- Test: `server/tests/test_llm_streaming.py`
+
+- [ ] **Step 1: Write the failing test (mock httpx streaming response)**
+
+Append to `server/tests/test_llm_streaming.py`:
+
+```python
+class _FakeStreamResponse:
+    """Minimal stand-in for httpx streaming response."""
+
+    def __init__(self, lines: list[str], status_code: int = 200):
+        self._lines = lines
+        self.status_code = status_code
+        self.headers = {}
+
+    async def aiter_lines(self):
+        for line in self._lines:
+            yield line
+
+    async def aread(self):
+        return b""
+
+
+class _FakeStreamClient:
+    def __init__(self, response):
+        self._response = response
+
+    async def __aenter__(self):
+        return self
+
+    async def __aexit__(self, *exc):
+        return False
+
+    def stream(self, method, url, **kwargs):
+        client = self
+
+        class _Ctx:
+            async def __aenter__(self_inner):
+                return client._response
+
+            async def __aexit__(self_inner, *exc):
+                return False
+
+        return _Ctx()
+
+
+@pytest.mark.asyncio
+async def test_stream_openai_chat_yields_text_then_final(monkeypatch):
+    from app.services.llm.adapters import _httpx_openai
+
+    sse_lines = [
+        'data: {"choices":[{"delta":{"role":"assistant"},"finish_reason":null}]}',
+        'data: {"choices":[{"delta":{"content":"Hi"},"finish_reason":null}]}',
+        'data: {"choices":[{"delta":{"content":" there"},"finish_reason":null}]}',
+        'data: {"choices":[{"delta":{},"finish_reason":"stop"}],'
+        '"usage":{"prompt_tokens":4,"completion_tokens":2}}',
+        "data: [DONE]",
+    ]
+    fake_resp = _FakeStreamResponse(sse_lines)
+    monkeypatch.setattr(
+        _httpx_openai.httpx, "AsyncClient", lambda *a, **k: _FakeStreamClient(fake_resp)
+    )
+
+    req = ChatRequest(messages=[Message(role="user", content="hi")], model="gpt-x")
+    chunks = []
+    async for c in _httpx_openai.stream_openai_chat(
+        base_url="https://api.openai.com/v1",
+        api_key="sk-test",
+        request=req,
+        fallback_model="gpt-x",
+    ):
+        chunks.append(c)
+
+    text = "".join(c.text_delta for c in chunks)
+    assert text == "Hi there"
+    assert chunks[-1].done is True
+    assert chunks[-1].stop_reason == "end_turn"
+    assert chunks[-1].usage.prompt == 4
+```
+
+- [ ] **Step 2: Run test to verify it fails**
+
+Run: `cd server && .venv/bin/pytest tests/test_llm_streaming.py::test_stream_openai_chat_yields_text_then_final -q`
+Expected: FAIL — `stream_openai_chat` not defined
+
+- [ ] **Step 3: Implement `stream_openai_chat` in `_httpx_openai.py`**
+
+Add imports near the top of `server/app/services/llm/adapters/_httpx_openai.py`:
+
+```python
+from collections.abc import AsyncIterator
+
+from app.services.llm.base import ChatResponseChunk
+from app.services.llm.exceptions import AuthInvalid, QuotaExceeded, RateLimited
+from app.services.llm.streaming import parse_openai_stream_event
+```
+
+(Merge with the existing import block; `ProviderUnavailable` / `ToolTranslationError` are already imported.)
+
+Add this function after `call_openai_chat`:
+
+```python
+def _map_stream_status(status_code: int) -> None:
+    """Raise the canonical typed error for a non-2xx streaming status."""
+    if status_code in (401, 403):
+        raise AuthInvalid(f"Auth failed (HTTP {status_code})")
+    if status_code == 402:
+        raise QuotaExceeded("Quota or billing failure (HTTP 402)")
+    if status_code == 429:
+        raise RateLimited("Rate limited (HTTP 429)")
+    if 500 <= status_code < 600:
+        raise ProviderUnavailable(f"Upstream error (HTTP {status_code})")
+    raise ToolTranslationError(f"Upstream rejected request (HTTP {status_code})")
+
+
+async def stream_openai_chat(
+    *,
+    base_url: str,
+    api_key: str | None,
+    request: ChatRequest,
+    fallback_model: str | None,
+    extra_headers: dict | None = None,
+    max_tokens_field: str = "max_tokens",
+) -> AsyncIterator[ChatResponseChunk]:
+    """Issue a streaming Chat Completions request, yielding canonical chunks.
+
+    Cancellation: if the consumer stops iterating (e.g. SSE client disconnect),
+    the ``async with client.stream(...)`` context exits and httpx closes the
+    upstream connection, cancelling the provider request. Errors are mapped to
+    canonical typed exceptions before the first chunk; mid-stream network drops
+    surface as ``ProviderUnavailable``.
+    """
+    model = request.model or fallback_model
+    if not model:
+        raise ToolTranslationError(
+            "model is required (set ChatRequest.model or LlmConnector.model_hint)"
+        )
+
+    endpoint = _build_chat_endpoint(base_url)
+    headers: dict[str, str] = {
+        "Content-Type": "application/json",
+        "Accept": "text/event-stream",
+    }
+    if api_key:
+        headers["Authorization"] = f"Bearer {api_key}"  # nosec B106
+    if extra_headers:
+        headers.update(extra_headers)
+
+    timeout = request.timeout_seconds or DEFAULT_TIMEOUT_SECONDS
+    timeout = min(max(timeout, 1.0), MAX_TIMEOUT_SECONDS)
+
+    payload = _build_payload(request, model, max_tokens_field=max_tokens_field)
+    payload["stream"] = True
+    # Ask OpenAI to include usage in the terminal stream event.
+    payload["stream_options"] = {"include_usage": True}
+
+    try:
+        async with httpx.AsyncClient(timeout=timeout) as client:
+            async with client.stream(
+                "POST", endpoint, json=payload, headers=headers
+            ) as resp:
+                if resp.status_code >= 300:
+                    # Drain the (small) error body so the connection releases.
+                    await resp.aread()
+                    _map_stream_status(resp.status_code)
+                async for line in resp.aiter_lines():
+                    if not line or not line.startswith("data:"):
+                        continue
+                    data = line[len("data:") :].strip()
+                    if data == "[DONE]":
+                        break
+                    try:
+                        obj = json.loads(data)
+                    except json.JSONDecodeError:
+                        # Tolerate keepalive/comment lines.
+                        continue
+                    chunk = parse_openai_stream_event(obj)
+                    if chunk is not None:
+                        yield chunk
+    except httpx.TimeoutException as exc:
+        raise ProviderUnavailable("Upstream timeout") from exc
+    except httpx.HTTPError as exc:
+        raise ProviderUnavailable("Upstream network error") from exc
+```
+
+- [ ] **Step 4: Run test to verify it passes**
+
+Run: `cd server && .venv/bin/pytest tests/test_llm_streaming.py::test_stream_openai_chat_yields_text_then_final -q`
+Expected: PASS
+
+- [ ] **Step 5: Commit**
+
+```bash
+git add server/app/services/llm/adapters/_httpx_openai.py server/tests/test_llm_streaming.py
+git commit -m "feat(llm): httpx OpenAI-wire streaming generator"
+```
+
+---
+
+## Task 5: OpenAI Platform + OpenAI-compatible adapter `stream()`
+
+**Files:**
+- Modify: `server/app/services/llm/adapters/openai_apikey.py`
+- Modify: `server/app/services/llm/adapters/openai_compatible.py`
+- Test: `server/tests/test_llm_streaming.py`
+
+- [ ] **Step 1: Write the failing test**
+
+Append to `server/tests/test_llm_streaming.py`:
+
+```python
+@pytest.mark.asyncio
+async def test_openai_apikey_adapter_stream(monkeypatch):
+    import json as _json
+
+    from app.models.llm_connector import LlmConnector
+    from app.services.llm.adapters import openai_apikey
+    from app.services.llm.base import ChatResponseChunk
+
+    captured = {}
+
+    async def fake_stream(**kwargs):
+        captured.update(kwargs)
+        yield ChatResponseChunk(text_delta="ok", done=False)
+        yield ChatResponseChunk(stop_reason="end_turn", done=True)
+
+    monkeypatch.setattr(openai_apikey, "stream_openai_chat", fake_stream)
+
+    connector = LlmConnector(
+        user_id=1,
+        connector_type="openai_apikey",
+        display_name="x",
+        status="active",
+        credentials=_json.dumps({"api_key": "sk-test"}),
+        model_hint="gpt-x",
+    )
+    adapter = openai_apikey.OpenAIApiKeyAdapter(connector)
+    req = ChatRequest(messages=[Message(role="user", content="hi")])
+    chunks = [c async for c in adapter.stream(req)]
+    assert [c.text_delta for c in chunks] == ["ok", ""]
+    assert chunks[-1].done is True
+    assert captured["max_tokens_field"] == "max_completion_tokens"
+    assert captured["api_key"] == "sk-test"
+```
+
+- [ ] **Step 2: Run test to verify it fails**
+
+Run: `cd server && .venv/bin/pytest tests/test_llm_streaming.py::test_openai_apikey_adapter_stream -q`
+Expected: FAIL — adapter `stream` falls through to default `StreamingUnsupported`
+
+- [ ] **Step 3: Implement `stream()` in `openai_apikey.py`**
+
+Add to imports:
+
+```python
+from collections.abc import AsyncIterator
+
+from app.services.llm.adapters._httpx_openai import (
+    build_healthcheck_request,
+    call_openai_chat,
+    stream_openai_chat,
+)
+from app.services.llm.base import ChatResponseChunk
+```
+
+(Merge with the existing `_httpx_openai` import — add `stream_openai_chat`.)
+
+Add the method to `OpenAIApiKeyAdapter` (after `health_check`):
+
+```python
+    async def stream(self, request: ChatRequest) -> AsyncIterator[ChatResponseChunk]:
+        api_key = self._extract_api_key()
+        async for chunk in stream_openai_chat(
+            base_url=OPENAI_BASE_URL,
+            api_key=api_key,
+            request=request,
+            fallback_model=self.connector.model_hint or DEFAULT_MODEL,
+            max_tokens_field=_MAX_TOKENS_FIELD,
+        ):
+            yield chunk
+```
+
+- [ ] **Step 4: Implement `stream()` in `openai_compatible.py`**
+
+Add to imports:
+
+```python
+from collections.abc import AsyncIterator
+
+from app.services.llm.adapters._httpx_openai import (
+    build_healthcheck_request,
+    call_openai_chat,
+    stream_openai_chat,
+)
+from app.services.llm.base import ChatResponseChunk
+```
+
+Add the method to `OpenAICompatibleAdapter` (after `health_check`):
+
+```python
+    async def stream(self, request: ChatRequest) -> AsyncIterator[ChatResponseChunk]:
+        base_url, bearer = self._extract_credentials()
+        async for chunk in stream_openai_chat(
+            base_url=base_url,
+            api_key=bearer,
+            request=request,
+            fallback_model=self.connector.model_hint or DEFAULT_MODEL,
+        ):
+            yield chunk
+```
+
+- [ ] **Step 5: Add a compatible-adapter stream test**
+
+Append to `server/tests/test_llm_streaming.py`:
+
+```python
+@pytest.mark.asyncio
+async def test_openai_compatible_adapter_stream(monkeypatch):
+    import json as _json
+
+    from app.models.llm_connector import LlmConnector
+    from app.services.llm.adapters import openai_compatible
+    from app.services.llm.base import ChatResponseChunk
+
+    async def fake_stream(**kwargs):
+        assert kwargs["base_url"] == "http://127.0.0.1:1234/v1"
+        yield ChatResponseChunk(text_delta="hey", done=False)
+        yield ChatResponseChunk(stop_reason="end_turn", done=True)
+
+    monkeypatch.setattr(openai_compatible, "stream_openai_chat", fake_stream)
+
+    connector = LlmConnector(
+        user_id=1,
+        connector_type="openai_compatible",
+        display_name="local",
+        status="active",
+        credentials=_json.dumps({"base_url": "http://127.0.0.1:1234/v1"}),
+        model_hint="local-model",
+    )
+    adapter = openai_compatible.OpenAICompatibleAdapter(connector)
+    req = ChatRequest(messages=[Message(role="user", content="hi")])
+    chunks = [c async for c in adapter.stream(req)]
+    assert "".join(c.text_delta for c in chunks) == "hey"
+    assert chunks[-1].done is True
+```
+
+- [ ] **Step 6: Run tests to verify they pass**
+
+Run: `cd server && .venv/bin/pytest tests/test_llm_streaming.py -k "openai_apikey_adapter_stream or openai_compatible_adapter_stream" -q`
+Expected: PASS (2 tests)
+
+- [ ] **Step 7: Commit**
+
+```bash
+git add server/app/services/llm/adapters/openai_apikey.py server/app/services/llm/adapters/openai_compatible.py server/tests/test_llm_streaming.py
+git commit -m "feat(llm): streaming for OpenAI platform + compatible adapters"
+```
+
+---
+
+## Task 6: Anthropic adapter `stream()`
+
+**Files:**
+- Modify: `server/app/services/llm/adapters/anthropic_apikey.py`
+- Test: `server/tests/test_llm_streaming.py`
+
+- [ ] **Step 1: Write the failing test (fake SDK event stream)**
+
+Append to `server/tests/test_llm_streaming.py`:
+
+```python
+class _FakeEvent:
+    """Stand-in for an anthropic SDK stream event (attribute access)."""
+
+    def __init__(self, **kw):
+        for k, v in kw.items():
+            setattr(self, k, v)
+
+
+class _FakeAnthropicStream:
+    def __init__(self, events):
+        self._events = events
+
+    async def __aenter__(self):
+        return self
+
+    async def __aexit__(self, *exc):
+        return False
+
+    async def __aiter__(self):
+        for e in self._events:
+            yield e
+
+
+def _anthropic_text_events():
+    return [
+        _FakeEvent(type="message_start"),
+        _FakeEvent(
+            type="content_block_start",
+            index=0,
+            content_block=_FakeEvent(type="text", text=""),
+        ),
+        _FakeEvent(
+            type="content_block_delta",
+            index=0,
+            delta=_FakeEvent(type="text_delta", text="Hel"),
+        ),
+        _FakeEvent(
+            type="content_block_delta",
+            index=0,
+            delta=_FakeEvent(type="text_delta", text="lo"),
+        ),
+        _FakeEvent(type="content_block_stop", index=0),
+        _FakeEvent(
+            type="message_delta",
+            delta=_FakeEvent(stop_reason="end_turn"),
+            usage=_FakeEvent(output_tokens=5),
+        ),
+        _FakeEvent(type="message_stop"),
+    ]
+
+
+@pytest.mark.asyncio
+async def test_anthropic_adapter_stream_text(monkeypatch):
+    import json as _json
+
+    from app.models.llm_connector import LlmConnector
+    from app.services.llm.adapters import anthropic_apikey
+
+    class _FakeMessages:
+        def stream(self, **kwargs):
+            return _FakeAnthropicStream(_anthropic_text_events())
+
+    class _FakeClient:
+        def __init__(self, *a, **k):
+            self.messages = _FakeMessages()
+
+        async def __aenter__(self):
+            return self
+
+        async def __aexit__(self, *exc):
+            return False
+
+    monkeypatch.setattr(anthropic_apikey, "AsyncAnthropic", _FakeClient)
+
+    connector = LlmConnector(
+        user_id=1,
+        connector_type="anthropic_apikey",
+        display_name="claude",
+        status="active",
+        credentials=_json.dumps({"api_key": "sk-ant-test"}),
+        model_hint="claude-x",
+    )
+    adapter = anthropic_apikey.AnthropicApiKeyAdapter(connector)
+    req = ChatRequest(messages=[Message(role="user", content="hi")])
+    chunks = [c async for c in adapter.stream(req)]
+    assert "".join(c.text_delta for c in chunks) == "Hello"
+    assert chunks[-1].done is True
+    assert chunks[-1].stop_reason == "end_turn"
+    assert chunks[-1].usage.completion == 5
+
+
+def _anthropic_tool_events():
+    return [
+        _FakeEvent(type="message_start"),
+        _FakeEvent(
+            type="content_block_start",
+            index=0,
+            content_block=_FakeEvent(type="tool_use", id="toolu_1", name="search"),
+        ),
+        _FakeEvent(
+            type="content_block_delta",
+            index=0,
+            delta=_FakeEvent(type="input_json_delta", partial_json='{"q":'),
+        ),
+        _FakeEvent(
+            type="content_block_delta",
+            index=0,
+            delta=_FakeEvent(type="input_json_delta", partial_json='"house"}'),
+        ),
+        _FakeEvent(type="content_block_stop", index=0),
+        _FakeEvent(
+            type="message_delta",
+            delta=_FakeEvent(stop_reason="tool_use"),
+            usage=_FakeEvent(output_tokens=9),
+        ),
+        _FakeEvent(type="message_stop"),
+    ]
+
+
+@pytest.mark.asyncio
+async def test_anthropic_adapter_stream_tool_use(monkeypatch):
+    import json as _json
+
+    from app.models.llm_connector import LlmConnector
+    from app.services.llm.adapters import anthropic_apikey
+
+    class _FakeMessages:
+        def stream(self, **kwargs):
+            return _FakeAnthropicStream(_anthropic_tool_events())
+
+    class _FakeClient:
+        def __init__(self, *a, **k):
+            self.messages = _FakeMessages()
+
+        async def __aenter__(self):
+            return self
+
+        async def __aexit__(self, *exc):
+            return False
+
+    monkeypatch.setattr(anthropic_apikey, "AsyncAnthropic", _FakeClient)
+
+    connector = LlmConnector(
+        user_id=1,
+        connector_type="anthropic_apikey",
+        display_name="claude",
+        status="active",
+        credentials=_json.dumps({"api_key": "sk-ant-test"}),
+        model_hint="claude-x",
+    )
+    adapter = anthropic_apikey.AnthropicApiKeyAdapter(connector)
+    req = ChatRequest(messages=[Message(role="user", content="hi")])
+    chunks = [c async for c in adapter.stream(req)]
+
+    # Reassemble tool-call fragments by index.
+    frags = [d for c in chunks for d in c.tool_call_deltas]
+    assert frags[0].id == "toolu_1" and frags[0].name == "search"
+    joined = "".join(d.input_json_fragment for d in frags)
+    assert _json.loads(joined) == {"q": "house"}
+    assert chunks[-1].done is True
+    assert chunks[-1].stop_reason == "tool_use"
+```
+
+- [ ] **Step 2: Run test to verify it fails**
+
+Run: `cd server && .venv/bin/pytest tests/test_llm_streaming.py -k anthropic_adapter_stream -q`
+Expected: FAIL — `StreamingUnsupported`
+
+- [ ] **Step 3: Implement `stream()` in `anthropic_apikey.py`**
+
+Add to imports (merge with existing):
+
+```python
+from collections.abc import AsyncIterator
+
+from app.services.llm.base import (
+    ChatRequest,
+    ChatResponse,
+    ChatResponseChunk,
+    LlmAdapter,
+    Message,
+    TokenUsage,
+    ToolCallDelta,
+)
+from app.services.llm.exceptions import (
+    AuthInvalid,
+    ProviderUnavailable,
+    QuotaExceeded,
+    RateLimited,
+    ToolTranslationError,
+)
+```
+
+Add a module-level finish-reason map near `DEFAULT_MODEL`:
+
+```python
+_STREAM_FINISH_REASON = {
+    "end_turn": "end_turn",
+    "stop_sequence": "end_turn",
+    "tool_use": "tool_use",
+    "max_tokens": "max_tokens",
+}
+```
+
+Add the method (after `health_check`):
+
+```python
+    async def stream(self, request: ChatRequest) -> AsyncIterator[ChatResponseChunk]:
+        model = request.model or self.connector.model_hint or DEFAULT_MODEL
+        max_tokens = request.max_tokens or DEFAULT_MAX_TOKENS
+        timeout = min(
+            max(request.timeout_seconds or DEFAULT_TIMEOUT_SECONDS, 1.0),
+            MAX_TIMEOUT_SECONDS,
+        )
+
+        anthropic_messages = to_anthropic_messages(request.messages)
+        tools, choice = to_anthropic_tools(request.tools, request.force_tool)
+
+        kwargs: dict[str, Any] = {
+            "model": model,
+            "max_tokens": max_tokens,
+            "messages": anthropic_messages,
+        }
+        if request.system:
+            kwargs["system"] = request.system
+        if request.temperature is not None:
+            kwargs["temperature"] = request.temperature
+        if tools:
+            kwargs["tools"] = tools
+        if choice is not None:
+            kwargs["tool_choice"] = choice
+
+        # Per-content-block index → tool id/name (sent once at block start).
+        block_index_to_tool: dict[int, str] = {}
+        stop_reason: str | None = None
+        output_tokens: int | None = None
+
+        try:
+            async with self._client(timeout=timeout) as client:
+                async with client.messages.stream(**kwargs) as stream:
+                    async for event in stream:
+                        etype = getattr(event, "type", None)
+                        if etype == "content_block_start":
+                            block = getattr(event, "content_block", None)
+                            if getattr(block, "type", None) == "tool_use":
+                                idx = int(getattr(event, "index", 0))
+                                tool_id = getattr(block, "id", None)
+                                name = getattr(block, "name", None)
+                                block_index_to_tool[idx] = name or ""
+                                yield ChatResponseChunk(
+                                    tool_call_deltas=[
+                                        ToolCallDelta(index=idx, id=tool_id, name=name)
+                                    ]
+                                )
+                        elif etype == "content_block_delta":
+                            delta = getattr(event, "delta", None)
+                            dtype = getattr(delta, "type", None)
+                            if dtype == "text_delta":
+                                yield ChatResponseChunk(
+                                    text_delta=getattr(delta, "text", "") or ""
+                                )
+                            elif dtype == "input_json_delta":
+                                idx = int(getattr(event, "index", 0))
+                                yield ChatResponseChunk(
+                                    tool_call_deltas=[
+                                        ToolCallDelta(
+                                            index=idx,
+                                            input_json_fragment=getattr(
+                                                delta, "partial_json", ""
+                                            )
+                                            or "",
+                                        )
+                                    ]
+                                )
+                        elif etype == "message_delta":
+                            delta = getattr(event, "delta", None)
+                            sr = getattr(delta, "stop_reason", None)
+                            if sr is not None:
+                                stop_reason = sr
+                            usage = getattr(event, "usage", None)
+                            if usage is not None:
+                                ot = getattr(usage, "output_tokens", None)
+                                if ot is not None:
+                                    output_tokens = int(ot)
+        except APITimeoutError as exc:
+            raise ProviderUnavailable("Upstream timeout") from exc
+        except APIConnectionError as exc:
+            raise ProviderUnavailable("Upstream network error") from exc
+        except APIStatusError as exc:
+            self._raise_for_status(exc)
+        except APIError as exc:
+            raise ProviderUnavailable(
+                f"Anthropic API error: {type(exc).__name__}"
+            ) from exc
+
+        canonical_stop = _STREAM_FINISH_REASON.get(stop_reason or "", "end_turn")
+        if block_index_to_tool and canonical_stop != "tool_use":
+            canonical_stop = "tool_use"
+        final_usage = (
+            TokenUsage(prompt=0, completion=output_tokens)
+            if output_tokens is not None
+            else None
+        )
+        yield ChatResponseChunk(
+            stop_reason=canonical_stop,
+            usage=final_usage,
+            done=True,
+        )
+```
+
+Note: Anthropic streams `output_tokens` in `message_delta` but `input_tokens` only in `message_start.usage`. For the counts-only call log this completion count is sufficient; prompt is recorded as 0 when unavailable. (Documented as a design decision.)
+
+- [ ] **Step 4: Run tests to verify they pass**
+
+Run: `cd server && .venv/bin/pytest tests/test_llm_streaming.py -k anthropic_adapter_stream -q`
+Expected: PASS (2 tests)
+
+- [ ] **Step 5: Commit**
+
+```bash
+git add server/app/services/llm/adapters/anthropic_apikey.py server/tests/test_llm_streaming.py
+git commit -m "feat(llm): Anthropic provider-native streaming (text + tool_use deltas)"
+```
+
+---
+
+## Task 7: `Gateway.stream` + `_attempt_stream` with counts-only logging
+
+**Files:**
+- Modify: `server/app/services/llm/gateway.py`
+- Test: `server/tests/test_llm_gateway_stream.py`
+
+- [ ] **Step 1: Write the failing test**
+
+```python
+# server/tests/test_llm_gateway_stream.py
+"""Tests for Gateway.stream — resolution mirrors dispatch, counts-only logging."""
+
+from __future__ import annotations
+
+import json
+
+import pytest
+
+from app.models.llm_connector import LlmCallLog, LlmConnector
+from app.models.user import User
+from app.services.auth import get_password_hash
+from app.services.llm.adapters.openai_apikey import OpenAIApiKeyAdapter
+from app.services.llm.base import ChatRequest, ChatResponseChunk, Message, TokenUsage
+from app.services.llm.exceptions import NoLlmConfigured, ProviderUnavailable
+from app.services.llm.gateway import Gateway
+
+
+@pytest.fixture
+def dj_user(db) -> User:
+    user = User(
+        username="streamdj",
+        password_hash=get_password_hash("password123"),
+        role="dj",
+    )
+    db.add(user)
+    db.commit()
+    db.refresh(user)
+    return user
+
+
+def _make_connector(db, user, **kw) -> LlmConnector:
+    row = LlmConnector(
+        user_id=user.id,
+        connector_type=kw.get("connector_type", "openai_apikey"),
+        display_name=kw.get("display_name", "Test"),
+        status=kw.get("status", "active"),
+        credentials=json.dumps({"api_key": "sk-fake"}),
+        model_hint="gpt-5-mini",
+    )
+    db.add(row)
+    db.commit()
+    db.refresh(row)
+    return row
+
+
+def _fake_stream(chunks):
+    async def _gen(self, request):
+        for c in chunks:
+            yield c
+
+    return _gen
+
+
+@pytest.mark.asyncio
+async def test_stream_no_actor_no_default_raises(db):
+    req = ChatRequest(messages=[Message(role="user", content="hi")])
+    with pytest.raises(NoLlmConfigured):
+        async for _ in Gateway.stream(db, None, req, purpose="test"):
+            pass
+
+
+@pytest.mark.asyncio
+async def test_stream_dispatches_and_logs_counts_only(db, dj_user, monkeypatch):
+    connector = _make_connector(db, dj_user)
+    chunks = [
+        ChatResponseChunk(text_delta="Hel"),
+        ChatResponseChunk(text_delta="lo"),
+        ChatResponseChunk(
+            stop_reason="end_turn",
+            usage=TokenUsage(prompt=4, completion=2),
+            done=True,
+        ),
+    ]
+    monkeypatch.setattr(OpenAIApiKeyAdapter, "stream", _fake_stream(chunks))
+
+    req = ChatRequest(messages=[Message(role="user", content="hi")])
+    out = [c async for c in Gateway.stream(db, dj_user, req, purpose="recommendation")]
+    assert "".join(c.text_delta for c in out) == "Hello"
+
+    log = db.query(LlmCallLog).filter(LlmCallLog.connector_id == connector.id).one()
+    assert log.status == "ok"
+    assert log.purpose == "recommendation"
+    assert log.tokens_in == 4
+    assert log.tokens_out == 2
+    db.refresh(connector)
+    assert connector.last_used_at is not None
+
+
+@pytest.mark.asyncio
+async def test_stream_error_logs_provider_unavailable(db, dj_user, monkeypatch):
+    connector = _make_connector(db, dj_user)
+
+    async def _boom(self, request):
+        raise ProviderUnavailable("down")
+        yield  # pragma: no cover
+
+    monkeypatch.setattr(OpenAIApiKeyAdapter, "stream", _boom)
+
+    req = ChatRequest(messages=[Message(role="user", content="hi")])
+    with pytest.raises(ProviderUnavailable):
+        async for _ in Gateway.stream(db, dj_user, req, purpose="test"):
+            pass
+
+    log = db.query(LlmCallLog).filter(LlmCallLog.connector_id == connector.id).one()
+    assert log.status == "provider_unavailable"
+
+
+@pytest.mark.asyncio
+async def test_stream_consumer_cancel_logs_and_propagates(db, dj_user, monkeypatch):
+    """Consumer stops early (client disconnect) → GeneratorExit, log written once."""
+    connector = _make_connector(db, dj_user)
+
+    async def _infinite(self, request):
+        i = 0
+        while True:
+            yield ChatResponseChunk(text_delta=str(i))
+            i += 1
+
+    monkeypatch.setattr(OpenAIApiKeyAdapter, "stream", _infinite)
+
+    req = ChatRequest(messages=[Message(role="user", content="hi")])
+    agen = Gateway.stream(db, dj_user, req, purpose="test")
+    first = await agen.__anext__()
+    assert first.text_delta == "0"
+    await agen.aclose()  # simulate client disconnect
+
+    log = db.query(LlmCallLog).filter(LlmCallLog.connector_id == connector.id).one()
+    assert log.status in ("ok", "cancelled")
+```
+
+- [ ] **Step 2: Run test to verify it fails**
+
+Run: `cd server && .venv/bin/pytest tests/test_llm_gateway_stream.py -q`
+Expected: FAIL — `Gateway.stream` not defined
+
+- [ ] **Step 3: Implement `Gateway.stream` + `_attempt_stream`**
+
+Add imports at the top of `server/app/services/llm/gateway.py` (merge):
+
+```python
+from collections.abc import AsyncIterator
+
+from app.services.llm.base import ChatRequest, ChatResponse, ChatResponseChunk
+```
+
+Add a `stream` staticmethod inside `class Gateway` (after `dispatch`):
+
+```python
+    @staticmethod
+    async def stream(
+        db: Session,
+        actor: User | None,
+        request: ChatRequest,
+        *,
+        purpose: str,
+    ) -> AsyncIterator[ChatResponseChunk]:
+        """Stream a chat response, mirroring ``dispatch`` resolution + logging.
+
+        Resolution is identical to ``dispatch`` (per-DJ default → MRU → org
+        default). Logging differs only in timing: a single counts-only
+        ``llm_call_log`` row is written when the stream finishes (success),
+        errors, or is cancelled by the consumer (client disconnect → the async
+        generator is closed and ``GeneratorExit`` fires the ``finally``).
+
+        Auto-fallback (``fallback_policy``) is intentionally NOT applied to
+        streaming: chunks have already been delivered to the consumer by the
+        time a mid-stream error surfaces, so transparently restarting on another
+        connector would corrupt the output. Streaming always fails fast.
+        """
+        primary = _resolve_connector(db, actor)
+        actor_id = actor.id if actor else _system_actor_id(db, primary)
+        async for chunk in _attempt_stream(
+            db, primary, request, purpose=purpose, actor_id=actor_id
+        ):
+            yield chunk
+```
+
+Add the module-level `_attempt_stream` async generator (after `_attempt`):
+
+```python
+async def _attempt_stream(
+    db: Session,
+    connector: LlmConnector,
+    request: ChatRequest,
+    *,
+    purpose: str,
+    actor_id: int,
+) -> AsyncIterator[ChatResponseChunk]:
+    """Run a single adapter stream, logging exactly one outcome row.
+
+    The call log is written in a ``finally`` so it fires on success, on a typed
+    error, AND on consumer cancellation (``GeneratorExit`` raised into the
+    generator when the SSE client disconnects). The status reflects which path
+    fired; counts come only from a terminal chunk's ``usage`` (never content).
+    """
+    adapter_cls = get_adapter_class(connector.connector_type)
+    adapter = adapter_cls(connector)
+
+    started = monotonic()
+    status = "ok"
+    error_code: str | None = None
+    tokens_in: int | None = None
+    tokens_out: int | None = None
+    auth_failed = False
+
+    try:
+        async for chunk in adapter.stream(request):
+            if chunk.usage is not None:
+                tokens_in = chunk.usage.prompt
+                tokens_out = chunk.usage.completion
+            yield chunk
+    except GeneratorExit:
+        # Consumer disconnected — record as cancelled and re-raise so the
+        # adapter's own finally/cleanup closes the upstream connection.
+        status = "cancelled"
+        error_code = "client_disconnect"
+        raise
+    except AuthInvalid:
+        status = "auth_invalid"
+        error_code = "401"
+        auth_failed = True
+        raise
+    except RateLimited as exc:
+        status = "rate_limited"
+        error_code = str(exc.retry_after_seconds or "")
+        raise
+    except QuotaExceeded:
+        status = "quota_exceeded"
+        error_code = "402"
+        raise
+    except ProviderUnavailable as exc:
+        status = "provider_unavailable"
+        error_code = type(exc).__name__
+        raise
+    except ToolTranslationError:
+        status = "tool_translation_error"
+        error_code = "translation"
+        raise
+    except LlmError:
+        status = "error"
+        error_code = "llm_error"
+        raise
+    finally:
+        latency_ms = int((monotonic() - started) * 1000)
+        if status == "ok":
+            connector.last_used_at = utcnow()
+            connector.last_error = None
+        if auth_failed:
+            connector.status = STATUS_AUTH_INVALID
+            connector.last_error = "auth_invalid"
+        log_call(
+            db,
+            connector_id=connector.id,
+            purpose=purpose,
+            status=status,
+            latency_ms=latency_ms,
+            tokens_in=tokens_in if status == "ok" else None,
+            tokens_out=tokens_out if status == "ok" else None,
+            error_code=error_code,
+        )
+        if auth_failed:
+            audit_event(
+                db,
+                actor_user_id=actor_id,
+                target_connector_id=connector.id,
+                event_type=AUDIT_AUTH_INVALID_OBSERVED,
+            )
+        db.commit()
+```
+
+- [ ] **Step 4: Run tests to verify they pass**
+
+Run: `cd server && .venv/bin/pytest tests/test_llm_gateway_stream.py -q`
+Expected: PASS (4 tests)
+
+- [ ] **Step 5: Commit**
+
+```bash
+git add server/app/services/llm/gateway.py server/tests/test_llm_gateway_stream.py
+git commit -m "feat(llm): Gateway.stream with counts-only logging + cancellation"
+```
+
+---
+
+## Task 8: SSE backend endpoint `POST /api/llm/connectors/{id}/stream-test`
+
+**Files:**
+- Modify: `server/app/api/llm.py`
+- Test: `server/tests/test_llm_stream_endpoint.py`
+
+- [ ] **Step 1: Write the failing test**
+
+```python
+# server/tests/test_llm_stream_endpoint.py
+"""SSE stream-test endpoint: auth, content-type, body shape, ownership."""
+
+from __future__ import annotations
+
+import json
+
+import pytest
+
+from app.models.llm_connector import LlmConnector
+from app.services.llm.adapters.openai_apikey import OpenAIApiKeyAdapter
+from app.services.llm.base import ChatResponseChunk, TokenUsage
+
+
+def _make_connector(db, user) -> LlmConnector:
+    row = LlmConnector(
+        user_id=user.id,
+        connector_type="openai_apikey",
+        display_name="Test",
+        status="active",
+        credentials=json.dumps({"api_key": "sk-fake"}),
+        model_hint="gpt-5-mini",
+    )
+    db.add(row)
+    db.commit()
+    db.refresh(row)
+    return row
+
+
+def test_stream_test_requires_auth(client, db, test_user):
+    connector = _make_connector(db, test_user)
+    resp = client.post(f"/api/llm/connectors/{connector.id}/stream-test")
+    assert resp.status_code == 401
+
+
+def test_stream_test_404_for_unowned(client, db, test_user, auth_headers):
+    # Connector owned by a different user.
+    from app.models.user import User
+    from app.services.auth import get_password_hash
+
+    other = User(username="other", password_hash=get_password_hash("x123456789"), role="dj")
+    db.add(other)
+    db.commit()
+    db.refresh(other)
+    connector = _make_connector(db, other)
+    resp = client.post(
+        f"/api/llm/connectors/{connector.id}/stream-test", headers=auth_headers
+    )
+    assert resp.status_code == 404
+
+
+def test_stream_test_streams_chunks(client, db, test_user, auth_headers, monkeypatch):
+    connector = _make_connector(db, test_user)
+
+    async def _fake_stream(self, request):
+        yield ChatResponseChunk(text_delta="Hi")
+        yield ChatResponseChunk(text_delta=" there")
+        yield ChatResponseChunk(
+            stop_reason="end_turn", usage=TokenUsage(prompt=2, completion=2), done=True
+        )
+
+    monkeypatch.setattr(OpenAIApiKeyAdapter, "stream", _fake_stream)
+
+    resp = client.post(
+        f"/api/llm/connectors/{connector.id}/stream-test", headers=auth_headers
+    )
+    assert resp.status_code == 200
+    assert resp.headers["content-type"].startswith("text/event-stream")
+    body = resp.text
+    # Each SSE event line starts with "data:". Reconstruct the JSON payloads.
+    payloads = [
+        json.loads(line[len("data:") :].strip())
+        for line in body.splitlines()
+        if line.startswith("data:")
+    ]
+    text = "".join(p.get("text_delta", "") for p in payloads)
+    assert "Hi there" in text
+    assert any(p.get("done") for p in payloads)
+```
+
+- [ ] **Step 2: Run test to verify it fails**
+
+Run: `cd server && .venv/bin/pytest tests/test_llm_stream_endpoint.py -q`
+Expected: FAIL — 404/405 (endpoint missing)
+
+- [ ] **Step 3: Implement the SSE endpoint in `llm.py`**
+
+Add imports (merge with existing):
+
+```python
+import json as _json
+
+from sse_starlette.sse import EventSourceResponse
+
+from app.models.user import User
+from app.services.llm.base import ChatRequest, Message
+from app.services.llm.exceptions import LlmError, NoLlmConfigured
+from app.services.llm.gateway import Gateway
+```
+
+Add the endpoint (place after `test_connector`):
+
+```python
+# A short, fixed prompt for the streaming health probe. Streams a single
+# sentence so the DJ sees tokens arrive in real time, exercising the full
+# resolve → adapter.stream → SSE path end-to-end.
+_STREAM_TEST_PROMPT = "Reply with one short friendly sentence confirming you are online."
+
+
+@router.post("/connectors/{connector_id}/stream-test")
+@limiter.limit("10/minute")
+async def stream_test_connector(
+    request: FastAPIRequest,
+    connector_id: int,
+    user: User = Depends(get_current_active_user),
+    db: Session = Depends(get_db),
+) -> EventSourceResponse:
+    """Stream a short sentence through the connector as ``text/event-stream``.
+
+    Validates ownership up front (404 for connectors the DJ doesn't own — never
+    leaks existence). Each SSE ``data:`` frame is a JSON ``ChatResponseChunk``.
+    On a typed gateway error, a terminal ``event: error`` frame is emitted with a
+    sanitised code (never the upstream payload), then the stream ends. Client
+    disconnect cancels the upstream provider request (the gateway generator's
+    ``finally`` writes the counts-only call log + closes the adapter).
+    """
+    row = _get_owned_connector_or_404(db, connector_id, user.id)
+
+    chat_request = ChatRequest(
+        messages=[Message(role="user", content=_STREAM_TEST_PROMPT)],
+        max_tokens=64,
+        temperature=0.0,
+        model=row.model_hint or None,
+    )
+
+    async def _publisher():
+        try:
+            async for chunk in Gateway.stream(
+                db, user, chat_request, purpose="stream_test"
+            ):
+                yield {"data": _json.dumps(chunk.model_dump())}
+        except NoLlmConfigured:
+            yield {"event": "error", "data": _json.dumps({"code": "no_connector"})}
+        except LlmError as exc:
+            # Map to a sanitised, stable code — never echo the provider message.
+            code = type(exc).__name__
+            logger.info("stream-test failed for connector %s: %s", connector_id, code)
+            yield {"event": "error", "data": _json.dumps({"code": code})}
+
+    return EventSourceResponse(
+        _publisher(),
+        media_type="text/event-stream",
+        headers={"X-Accel-Buffering": "no"},
+    )
+```
+
+- [ ] **Step 4: Run tests to verify they pass**
+
+Run: `cd server && .venv/bin/pytest tests/test_llm_stream_endpoint.py -q`
+Expected: PASS (3 tests)
+
+- [ ] **Step 5: Commit**
+
+```bash
+git add server/app/api/llm.py server/tests/test_llm_stream_endpoint.py
+git commit -m "feat(api): authenticated SSE stream-test endpoint for connectors"
+```
+
+---
+
+## Task 9: Backend CI green (ruff / format / bandit / full pytest)
+
+**Files:** none new — fix-ups only.
+
+- [ ] **Step 1: Auto-format + lint-fix**
+
+Run: `cd server && .venv/bin/ruff format . && .venv/bin/ruff check --fix .`
+
+- [ ] **Step 2: Lint check**
+
+Run: `cd server && .venv/bin/ruff check . && .venv/bin/ruff format --check .`
+Expected: no errors. If `_normalise_finish_reason` import triggers a private-import lint (PLC2701), keep the `# noqa` already added in Task 3, or inline a local copy of the 4-line mapping function into `streaming.py` to avoid importing a private name.
+
+- [ ] **Step 3: Bandit**
+
+Run: `cd server && .venv/bin/bandit -r app -c pyproject.toml -q`
+Expected: no new findings (the `# nosec B106` on the Authorization header is preserved).
+
+- [ ] **Step 4: Full backend test suite + coverage gate**
+
+Run: `cd server && .venv/bin/pytest --tb=short -q`
+Expected: PASS, coverage ≥ gate. If new streaming files drag coverage, the dedicated stream tests above should cover them; add targeted tests for any uncovered branch the report flags.
+
+- [ ] **Step 5: Commit any fix-ups**
+
+```bash
+git add -A
+git commit -m "chore(llm): backend lint/format/coverage fix-ups for streaming"
+```
+
+---
+
+## Task 10: Frontend SSE consumer `streamConnectorTest`
+
+**Files:**
+- Modify: `dashboard/lib/api.ts`
+- Test: `dashboard/lib/__tests__/api.test.ts` (append)
+
+- [ ] **Step 1: Write the failing test**
+
+Append to `dashboard/lib/__tests__/api.test.ts` (match the file's existing import + setup style):
+
+```typescript
+describe('streamConnectorTest', () => {
+  it('parses SSE data frames and invokes onChunk per frame', async () => {
+    const sse =
+      'data: {"text_delta":"Hi","done":false}\n\n' +
+      'data: {"text_delta":" there","done":false}\n\n' +
+      'data: {"text_delta":"","stop_reason":"end_turn","done":true}\n\n';
+    const encoder = new TextEncoder();
+    const stream = new ReadableStream<Uint8Array>({
+      start(controller) {
+        controller.enqueue(encoder.encode(sse));
+        controller.close();
+      },
+    });
+    const fetchMock = vi.fn().mockResolvedValue(
+      new Response(stream, {
+        status: 200,
+        headers: { 'Content-Type': 'text/event-stream' },
+      }),
+    );
+    vi.stubGlobal('fetch', fetchMock);
+
+    apiClient.setToken('jwt-token');
+    const chunks: Array<{ text_delta?: string; done?: boolean }> = [];
+    await apiClient.streamConnectorTest(7, (c) => chunks.push(c));
+
+    expect(chunks.map((c) => c.text_delta).join('')).toBe('Hi there');
+    expect(chunks.at(-1)?.done).toBe(true);
+    // Auth header present.
+    const init = fetchMock.mock.calls[0][1] as RequestInit;
+    const headers = new Headers(init.headers);
+    expect(headers.get('Authorization')).toBe('Bearer jwt-token');
+    vi.unstubAllGlobals();
+  });
+});
+```
+
+- [ ] **Step 2: Run test to verify it fails**
+
+Run: `cd dashboard && npm test -- --run lib/__tests__/api.test.ts`
+Expected: FAIL — `apiClient.streamConnectorTest is not a function`
+
+- [ ] **Step 3: Add the type + method to `api.ts`**
+
+Add near the other LLM types (search for `LlmConnectorTestResult`):
+
+```typescript
+export interface LlmStreamChunk {
+  text_delta?: string;
+  tool_call_deltas?: Array<{
+    index: number;
+    id?: string | null;
+    name?: string | null;
+    input_json_fragment?: string;
+  }>;
+  stop_reason?: 'end_turn' | 'tool_use' | 'max_tokens' | 'error' | null;
+  usage?: { prompt: number; completion: number } | null;
+  done?: boolean;
+}
+```
+
+Add the method to the `ApiClient` class (near `testLlmConnector`):
+
+```typescript
+  /**
+   * Stream a short health-check sentence through a connector via SSE.
+   *
+   * Uses fetch + ReadableStream rather than EventSource because EventSource
+   * cannot send the Authorization header this authenticated endpoint requires.
+   * Pass an AbortSignal to cancel — aborting closes the connection, which the
+   * backend treats as a client disconnect and cancels the upstream provider
+   * request. ``onChunk`` is invoked for every parsed SSE data frame.
+   */
+  async streamConnectorTest(
+    id: number,
+    onChunk: (chunk: LlmStreamChunk) => void,
+    signal?: AbortSignal,
+  ): Promise<void> {
+    const headers = new Headers({ Accept: 'text/event-stream' });
+    if (this.token) headers.set('Authorization', `Bearer ${this.token}`);
+
+    const response = await fetch(
+      `${getApiUrl()}/api/llm/connectors/${id}/stream-test`,
+      { method: 'POST', headers, signal },
+    );
+    if (!response.ok || !response.body) {
+      if (response.status === 401 && this.onUnauthorized) this.onUnauthorized();
+      throw new ApiError('Stream test failed', response.status);
+    }
+
+    const reader = response.body.getReader();
+    const decoder = new TextDecoder();
+    let buffer = '';
+    try {
+      while (true) {
+        const { done, value } = await reader.read();
+        if (done) break;
+        buffer += decoder.decode(value, { stream: true });
+        // SSE frames are separated by a blank line.
+        let sep: number;
+        while ((sep = buffer.indexOf('\n\n')) !== -1) {
+          const frame = buffer.slice(0, sep);
+          buffer = buffer.slice(sep + 2);
+          for (const line of frame.split('\n')) {
+            if (!line.startsWith('data:')) continue;
+            const data = line.slice('data:'.length).trim();
+            if (!data || data === '[DONE]') continue;
+            try {
+              onChunk(JSON.parse(data) as LlmStreamChunk);
+            } catch {
+              // Ignore unparseable keepalive frames.
+            }
+          }
+        }
+      }
+    } finally {
+      reader.releaseLock();
+    }
+  }
+```
+
+- [ ] **Step 4: Run test to verify it passes**
+
+Run: `cd dashboard && npm test -- --run lib/__tests__/api.test.ts`
+Expected: PASS
+
+- [ ] **Step 5: Commit**
+
+```bash
+git add dashboard/lib/api.ts dashboard/lib/__tests__/api.test.ts
+git commit -m "feat(ai-ui): SSE stream consumer for connector stream-test"
+```
+
+---
+
+## Task 11: Minimal UI consumer wiring (admin/ai stream test) + scope note
+
+**Files:**
+- Modify: `dashboard/app/admin/ai/page.tsx`
+
+**Decision:** The recommendation flow is a backend background pipeline that returns a final JSON payload to the UI (not a live token feed), so retrofitting it to SSE would be a large, risky change outside this issue's intent. Per the issue's "use reasonable judgment on scope and document it", the frontend consumer is the reusable `apiClient.streamConnectorTest` plumbing (Task 10) plus a minimal live "Stream test" affordance on the existing AI settings surface. The recommendation UI migration to SSE is explicitly deferred (future set-builder UI, §11.6) and noted in the PR body.
+
+- [ ] **Step 1: Read the admin/ai page to find the connector row / actions area**
+
+Run: `cd dashboard && grep -n "testLlmConnector\|Test\|connector" app/admin/ai/page.tsx | head -30`
+
+- [ ] **Step 2: Add a "Stream test" button that appends streamed text into local state**
+
+Add (adapt names to the file's existing component structure — this is the behavior to wire, not a verbatim drop-in):
+
+```tsx
+// Local state near the component's other useState hooks:
+const [streamText, setStreamText] = useState<string>('');
+const [streaming, setStreaming] = useState<number | null>(null);
+
+async function handleStreamTest(connectorId: number) {
+  setStreamText('');
+  setStreaming(connectorId);
+  try {
+    await apiClient.streamConnectorTest(connectorId, (chunk) => {
+      if (chunk.text_delta) setStreamText((prev) => prev + chunk.text_delta);
+    });
+  } catch {
+    setStreamText('(stream test failed)');
+  } finally {
+    setStreaming(null);
+  }
+}
+```
+
+And in the per-connector action area, next to the existing test button:
+
+```tsx
+<button
+  type="button"
+  onClick={() => handleStreamTest(connector.id)}
+  disabled={streaming !== null}
+>
+  {streaming === connector.id ? 'Streaming…' : 'Stream test'}
+</button>
+{streaming === connector.id && streamText && (
+  <p style={{ marginTop: 8, opacity: 0.8 }}>{streamText}</p>
+)}
+```
+
+- [ ] **Step 3: Type-check + existing page tests**
+
+Run: `cd dashboard && npx tsc --noEmit`
+Run: `cd dashboard && npm test -- --run app/admin/ai`
+Expected: PASS. If the admin/ai page has snapshot/DOM tests that assert exact button sets, update those fixtures to include the new button.
+
+- [ ] **Step 4: Commit**
+
+```bash
+git checkout dashboard/next-env.d.ts 2>/dev/null || true
+git add dashboard/app/admin/ai/page.tsx
+git commit -m "feat(ai-ui): minimal live stream-test affordance on AI settings"
+```
+
+---
+
+## Task 12: Full local CI sweep + finishing the branch
+
+**Files:** none new.
+
+- [ ] **Step 1: Backend CI**
+
+Run from `server/`:
+```bash
+.venv/bin/ruff check .
+.venv/bin/ruff format --check .
+.venv/bin/bandit -r app -c pyproject.toml -q
+.venv/bin/pytest --tb=short -q
+```
+Expected: all green, coverage gate satisfied.
+
+- [ ] **Step 2: Frontend CI**
+
+Run from `dashboard/`:
+```bash
+npm run lint
+npx tsc --noEmit
+npm test -- --run
+```
+Expected: all green. Then `git checkout dashboard/next-env.d.ts` if auto-modified.
+
+- [ ] **Step 3: Confirm no Alembic migration was introduced**
+
+Run: `cd server && git diff --name-only origin/epic/ai-engine...HEAD | grep alembic || echo "no migrations — correct"`
+Expected: `no migrations — correct` (streaming requires no schema change).
+
+- [ ] **Step 4: Use superpowers:finishing-a-development-branch (option 2: Push + PR)**
+
+Create the PR with `gh pr create --base epic/ai-engine`. PR body must include `Closes #335`, a `## Design decisions` section, and a note that the PR targets `epic/ai-engine`.
+
+---
+
+## Self-Review
+
+**Spec coverage (issue #335 acceptance criteria):**
+- `Gateway.stream(...) -> AsyncIterator[ChatResponseChunk]` → Task 7. ✅
+- `ChatResponseChunk` carries incremental text + partial tool_calls + final stop_reason + usage → Task 1 (model), Tasks 3/4/6 (population). ✅
+- Each adapter implements provider-native streaming (OpenAI, Anthropic, OpenAI-compatible) → Tasks 5, 6. ✅
+- Non-streaming adapters degrade gracefully (`StreamingUnsupported`) → Tasks 1, 2. ✅
+- SSE backend endpoint (text/event-stream) → Task 8. ✅
+- Tool-use mid-stream parses across providers (OpenAI partial JSON, Anthropic delta blocks) → Task 3 (OpenAI tool frags), Task 6 (`input_json_delta`). ✅
+- Cancellation propagates upstream (frontend disconnect → adapter cancels upstream) → Task 7 (`GeneratorExit` → adapter `async with` cleanup closes httpx/SDK stream), Task 10 (`AbortSignal`). ✅
+- Counts-only call log + audit consistency with non-stream path → Task 7 `_attempt_stream`. ✅
+- Frontend consumer → Tasks 10 (plumbing) + 11 (minimal UI, recommendation-migration deferral documented). ✅
+
+**Placeholder scan:** No TBD/TODO. Frontend Task 11 step 2 is explicitly behavior-to-wire (adapt to existing component) because the exact JSX scaffold depends on the live file — the implementer reads it in step 1.
+
+**Type consistency:** `ChatResponseChunk` fields (`text_delta`, `tool_call_deltas`, `stop_reason`, `usage`, `done`) and `ToolCallDelta` fields (`index`, `id`, `name`, `input_json_fragment`) are used identically in base.py, streaming.py, adapters, gateway, endpoint, and frontend type. `stream_openai_chat` signature matches its callers in both OpenAI adapters. `Gateway.stream` / `_attempt_stream` signatures match `dispatch` / `_attempt`.
diff --git a/docs/superpowers/plans/2026-05-28-per-feature-connector-preference.md b/docs/superpowers/plans/2026-05-28-per-feature-connector-preference.md
new file mode 100644
index 00000000..58fc2f36
--- /dev/null
+++ b/docs/superpowers/plans/2026-05-28-per-feature-connector-preference.md
@@ -0,0 +1,1314 @@
+# Per-Feature Connector Preference Implementation Plan
+
+> **For agentic workers:** REQUIRED SUB-SKILL: Use superpowers:subagent-driven-development (recommended) or superpowers:executing-plans to implement this plan task-by-task. Steps use checkbox (`- [ ]`) syntax for tracking.
+
+**Goal:** Let each DJ pin a specific LLM connector to a specific agentic feature (e.g. recommendation → connector A, set_builder → connector B), with graceful fallback when the pinned connector is gone or auth-invalid.
+
+**Architecture:** A new `LlmFeaturePreference` table maps `(user_id, feature) → connector_id` with a UNIQUE constraint. `Gateway.dispatch` already receives `purpose` (the feature key), so resolution gains a new first step: look up the DJ's pinned connector for `purpose`, use it if active, else fall through to the existing chain (per-DJ default → MRU → org default → `NoLlmConfigured`). New `/api/llm/feature-preferences` endpoints (set/clear/list) are scoped to the current DJ and validate connector ownership + feature against an allowlist. The DJ AI settings UI gains a "Per-feature defaults" section.
+
+**Tech Stack:** FastAPI, SQLAlchemy 2.0, Alembic, slowapi, Pydantic v2, Next.js/React 19/TypeScript, vitest.
+
+---
+
+## File Structure
+
+**Backend (create):**
+- `server/app/models/llm_feature_preference.py` — the new model + feature allowlist constants.
+- `server/alembic/versions/050_llm_feature_preference.py` — migration (down_revision = `049`).
+- `server/tests/test_llm_feature_preference.py` — model + gateway resolution + endpoint tests.
+
+**Backend (modify):**
+- `server/app/models/__init__.py` — register `LlmFeaturePreference`.
+- `server/app/services/llm/connector_storage.py` — feature-preference CRUD helpers.
+- `server/app/services/llm/gateway.py` — add feature-preference as the first resolution step.
+- `server/app/api/llm.py` — set/clear/list feature-preference endpoints.
+- `server/app/schemas/llm.py` — request/response schemas + known-feature constant.
+
+**Frontend (modify):**
+- `dashboard/lib/api.ts` — `listFeaturePreferences`, `setFeaturePreference`, `clearFeaturePreference`.
+- `dashboard/components/AiProvidersSection.tsx` — "Per-feature defaults" section.
+- `dashboard/lib/api-types.ts` — re-export the new generated schema types.
+- `dashboard/lib/api-types.generated.ts` — regenerated from OpenAPI (via `npm run types:export && npm run types:generate`).
+
+**Design decisions (locked in):**
+- Feature key reuses the gateway `purpose` string. Known features allowlist: `{"recommendation", "set_builder"}`. `recommendation` is the only `purpose` in use today; `set_builder` is named in the issue spec for an upcoming feature. The allowlist lives in one place (`schemas/llm.py`) and is imported by both the API validation and the model docstring reference.
+- The endpoint surface is `POST /api/llm/feature-preferences` (upsert set), `DELETE /api/llm/feature-preferences/{feature}` (clear), `GET /api/llm/feature-preferences` (list). Upsert semantics keep "set" and "change" as one operation (the UNIQUE constraint makes change == replace).
+- Ownership: setting a preference validates the connector belongs to the current DJ (404 if not, mirroring the existing connector-ownership 404 convention so another DJ's connector existence is never leaked).
+- Graceful fallback: gateway resolution skips a pinned preference whose connector is deleted (FK row gone) or whose status != `active`. No exception — falls through to the next resolution step.
+- We do NOT add a frontend "set inactive connector" guard beyond what the picker offers; the gateway already skips inactive pins, and the API rejects pinning a non-active connector with 400 (mirrors the per-DJ default endpoint), so a DJ can't silently break their own routing.
+
+---
+
+## Task 1: LlmFeaturePreference model + feature allowlist
+
+**Files:**
+- Create: `server/app/models/llm_feature_preference.py`
+- Modify: `server/app/models/__init__.py`
+- Test: `server/tests/test_llm_feature_preference.py`
+
+- [ ] **Step 1: Write the failing test**
+
+Create `server/tests/test_llm_feature_preference.py`:
+
+```python
+"""Tests for per-feature connector preference (issue #337)."""
+
+from __future__ import annotations
+
+import json
+
+import pytest
+from sqlalchemy.exc import IntegrityError
+
+from app.models.llm_connector import LlmConnector
+from app.models.llm_feature_preference import KNOWN_FEATURES, LlmFeaturePreference
+from app.models.user import User
+from app.services.auth import get_password_hash
+
+
+@pytest.fixture
+def dj_user(db) -> User:
+    user = User(
+        username="prefdj",
+        password_hash=get_password_hash("password123"),
+        role="dj",
+    )
+    db.add(user)
+    db.commit()
+    db.refresh(user)
+    return user
+
+
+def _make_connector(db, user, *, display_name="Pref connector", status="active"):
+    row = LlmConnector(
+        user_id=user.id,
+        connector_type="openai_apikey",
+        display_name=display_name,
+        status=status,
+        credentials=json.dumps({"api_key": "sk-fake-key"}),
+        model_hint="gpt-5-mini",
+    )
+    db.add(row)
+    db.commit()
+    db.refresh(row)
+    return row
+
+
+def test_known_features_contains_recommendation_and_set_builder():
+    assert "recommendation" in KNOWN_FEATURES
+    assert "set_builder" in KNOWN_FEATURES
+
+
+def test_unique_constraint_one_pref_per_user_feature(db, dj_user):
+    c1 = _make_connector(db, dj_user, display_name="A")
+    c2 = _make_connector(db, dj_user, display_name="B")
+    db.add(
+        LlmFeaturePreference(user_id=dj_user.id, feature="recommendation", connector_id=c1.id)
+    )
+    db.commit()
+    db.add(
+        LlmFeaturePreference(user_id=dj_user.id, feature="recommendation", connector_id=c2.id)
+    )
+    with pytest.raises(IntegrityError):
+        db.commit()
+    db.rollback()
+```
+
+- [ ] **Step 2: Run test to verify it fails**
+
+Run: `cd server && .venv/bin/pytest tests/test_llm_feature_preference.py -x -q`
+Expected: FAIL with `ModuleNotFoundError: No module named 'app.models.llm_feature_preference'`
+
+- [ ] **Step 3: Write the model**
+
+Create `server/app/models/llm_feature_preference.py`:
+
+```python
+"""Per-feature connector preference — pins a DJ's connector to a feature.
+
+A DJ can pin the recommendation engine to one connector and the set-builder
+to another. The gateway consults this table first (keyed by ``purpose``)
+before falling back to the per-DJ default / MRU / org-default chain.
+
+See issue #337, spec §11.8.
+"""
+
+from datetime import datetime
+
+from sqlalchemy import DateTime, ForeignKey, Integer, String, UniqueConstraint, func
+from sqlalchemy.orm import Mapped, mapped_column
+
+from app.models.base import Base
+
+# Allowlist of feature keys a DJ may pin. These mirror the gateway ``purpose``
+# strings. ``recommendation`` is the only purpose dispatched today;
+# ``set_builder`` is reserved for the upcoming set-builder feature (issue spec
+# §11.8). Validation of API input against this set lives in ``schemas/llm.py``
+# (KNOWN_FEATURES is re-exported there to keep a single source of truth).
+KNOWN_FEATURES = frozenset({"recommendation", "set_builder"})
+
+
+class LlmFeaturePreference(Base):
+    """Maps ``(user_id, feature)`` to a pinned ``connector_id``.
+
+    At most one row per ``(user_id, feature)`` — enforced by a UNIQUE
+    constraint. Deleting the connector cascades (ON DELETE CASCADE) so a stale
+    preference never points at a missing connector.
+    """
+
+    __tablename__ = "llm_feature_preferences"
+
+    id: Mapped[int] = mapped_column(Integer, primary_key=True)
+    user_id: Mapped[int] = mapped_column(
+        ForeignKey("users.id", ondelete="CASCADE"), index=True, nullable=False
+    )
+    feature: Mapped[str] = mapped_column(String(40), nullable=False)
+    connector_id: Mapped[int] = mapped_column(
+        ForeignKey("llm_connectors.id", ondelete="CASCADE"), index=True, nullable=False
+    )
+    created_at: Mapped[datetime] = mapped_column(
+        DateTime, nullable=False, server_default=func.now()
+    )
+
+    __table_args__ = (
+        UniqueConstraint("user_id", "feature", name="uq_llm_feature_pref_user_feature"),
+    )
+```
+
+- [ ] **Step 4: Register the model**
+
+Modify `server/app/models/__init__.py` — add the import after the `llm_connector` import line and the name to `__all__` (alphabetical-ish, keep grouped with other Llm names):
+
+```python
+from app.models.llm_connector import LlmAuditEvent, LlmCallLog, LlmConnector
+from app.models.llm_feature_preference import LlmFeaturePreference
+```
+
+And add `"LlmFeaturePreference",` to the `__all__` list (right after `"LlmConnector",`).
+
+- [ ] **Step 5: Run test to verify it passes**
+
+Run: `cd server && .venv/bin/pytest tests/test_llm_feature_preference.py -x -q`
+Expected: PASS (3 tests)
+
+- [ ] **Step 6: Commit**
+
+```bash
+git add server/app/models/llm_feature_preference.py server/app/models/__init__.py server/tests/test_llm_feature_preference.py
+git commit -m "feat(llm): add LlmFeaturePreference model + feature allowlist"
+```
+
+---
+
+## Task 2: Alembic migration
+
+**Files:**
+- Create: `server/alembic/versions/050_llm_feature_preference.py`
+
+- [ ] **Step 1: Write the migration**
+
+Create `server/alembic/versions/050_llm_feature_preference.py`:
+
+```python
+"""Add llm_feature_preferences table.
+
+Revision ID: 050
+Revises: 049
+Create Date: 2026-05-28
+
+Per-feature connector preference (issue #337). Maps ``(user_id, feature)`` to a
+pinned ``connector_id`` with a UNIQUE constraint so a DJ has at most one pinned
+connector per feature. Both FKs cascade on delete so a deleted user or
+connector never leaves a dangling preference.
+"""
+
+import sqlalchemy as sa
+
+from alembic import op
+
+revision: str = "050"
+down_revision: str | None = "049"
+branch_labels = None
+depends_on = None
+
+
+def upgrade() -> None:
+    op.create_table(
+        "llm_feature_preferences",
+        sa.Column("id", sa.Integer(), nullable=False),
+        sa.Column("user_id", sa.Integer(), nullable=False),
+        sa.Column("feature", sa.String(length=40), nullable=False),
+        sa.Column("connector_id", sa.Integer(), nullable=False),
+        sa.Column(
+            "created_at",
+            sa.DateTime(),
+            server_default=sa.func.now(),
+            nullable=False,
+        ),
+        sa.ForeignKeyConstraint(["user_id"], ["users.id"], ondelete="CASCADE"),
+        sa.ForeignKeyConstraint(["connector_id"], ["llm_connectors.id"], ondelete="CASCADE"),
+        sa.PrimaryKeyConstraint("id"),
+        sa.UniqueConstraint("user_id", "feature", name="uq_llm_feature_pref_user_feature"),
+    )
+    op.create_index(
+        "ix_llm_feature_preferences_user_id",
+        "llm_feature_preferences",
+        ["user_id"],
+    )
+    op.create_index(
+        "ix_llm_feature_preferences_connector_id",
+        "llm_feature_preferences",
+        ["connector_id"],
+    )
+
+
+def downgrade() -> None:
+    op.drop_index("ix_llm_feature_preferences_connector_id", table_name="llm_feature_preferences")
+    op.drop_index("ix_llm_feature_preferences_user_id", table_name="llm_feature_preferences")
+    op.drop_table("llm_feature_preferences")
+```
+
+- [ ] **Step 2: Run migration + drift check**
+
+Run: `cd server && .venv/bin/alembic upgrade head && .venv/bin/alembic check`
+Expected: `upgrade` runs cleanly to revision `050`, and `alembic check` prints `No new upgrade operations detected.`
+
+If `alembic check` reports drift, reconcile the migration columns/indexes with the model (`index=True` on `user_id` and `connector_id` matches the two `create_index` calls).
+
+- [ ] **Step 3: Commit**
+
+```bash
+git add server/alembic/versions/050_llm_feature_preference.py
+git commit -m "feat(llm): migration 050 for llm_feature_preferences"
+```
+
+---
+
+## Task 3: connector_storage CRUD helpers
+
+**Files:**
+- Modify: `server/app/services/llm/connector_storage.py`
+- Test: `server/tests/test_llm_feature_preference.py`
+
+- [ ] **Step 1: Write the failing test**
+
+Append to `server/tests/test_llm_feature_preference.py`:
+
+```python
+def test_set_feature_preference_upserts(db, dj_user):
+    from app.services.llm.connector_storage import (
+        get_feature_preferences_for_user,
+        set_feature_preference,
+    )
+
+    c1 = _make_connector(db, dj_user, display_name="A")
+    c2 = _make_connector(db, dj_user, display_name="B")
+
+    set_feature_preference(db, user_id=dj_user.id, feature="recommendation", connector_id=c1.id)
+    db.commit()
+    prefs = get_feature_preferences_for_user(db, dj_user.id)
+    assert {p.feature: p.connector_id for p in prefs} == {"recommendation": c1.id}
+
+    # Re-set the same feature → replace, not duplicate.
+    set_feature_preference(db, user_id=dj_user.id, feature="recommendation", connector_id=c2.id)
+    db.commit()
+    prefs = get_feature_preferences_for_user(db, dj_user.id)
+    assert {p.feature: p.connector_id for p in prefs} == {"recommendation": c2.id}
+
+
+def test_clear_feature_preference_removes_row(db, dj_user):
+    from app.services.llm.connector_storage import (
+        clear_feature_preference,
+        get_feature_preferences_for_user,
+        set_feature_preference,
+    )
+
+    c1 = _make_connector(db, dj_user, display_name="A")
+    set_feature_preference(db, user_id=dj_user.id, feature="recommendation", connector_id=c1.id)
+    db.commit()
+
+    removed = clear_feature_preference(db, user_id=dj_user.id, feature="recommendation")
+    db.commit()
+    assert removed is True
+    assert get_feature_preferences_for_user(db, dj_user.id) == []
+
+    # Clearing a non-existent preference is a no-op (returns False).
+    assert clear_feature_preference(db, user_id=dj_user.id, feature="recommendation") is False
+```
+
+- [ ] **Step 2: Run test to verify it fails**
+
+Run: `cd server && .venv/bin/pytest tests/test_llm_feature_preference.py -x -q`
+Expected: FAIL with `ImportError: cannot import name 'set_feature_preference'`
+
+- [ ] **Step 3: Add the helpers**
+
+In `server/app/services/llm/connector_storage.py`, add the model import to the existing `from app.models.llm_connector import (...)` block is NOT possible (different module). Add a new import near the top imports:
+
+```python
+from app.models.llm_feature_preference import LlmFeaturePreference
+```
+
+Then add these functions (place them after `unset_default_for_user`):
+
+```python
+def get_feature_preferences_for_user(db: Session, user_id: int) -> list[LlmFeaturePreference]:
+    """Return all of a DJ's per-feature connector pins."""
+    return (
+        db.query(LlmFeaturePreference)
+        .filter(LlmFeaturePreference.user_id == user_id)
+        .order_by(LlmFeaturePreference.feature.asc())
+        .all()
+    )
+
+
+def get_feature_preference(
+    db: Session, *, user_id: int, feature: str
+) -> LlmFeaturePreference | None:
+    """Return the DJ's pin for ``feature``, or ``None`` if unset."""
+    return (
+        db.query(LlmFeaturePreference)
+        .filter(
+            LlmFeaturePreference.user_id == user_id,
+            LlmFeaturePreference.feature == feature,
+        )
+        .one_or_none()
+    )
+
+
+def set_feature_preference(
+    db: Session, *, user_id: int, feature: str, connector_id: int
+) -> LlmFeaturePreference:
+    """Upsert the DJ's pin for ``feature`` → ``connector_id``. Caller commits.
+
+    Replace-in-place when a row already exists so the UNIQUE constraint on
+    ``(user_id, feature)`` is never violated.
+    """
+    existing = get_feature_preference(db, user_id=user_id, feature=feature)
+    if existing is not None:
+        existing.connector_id = connector_id
+        db.flush()
+        return existing
+    row = LlmFeaturePreference(user_id=user_id, feature=feature, connector_id=connector_id)
+    db.add(row)
+    db.flush()
+    return row
+
+
+def clear_feature_preference(db: Session, *, user_id: int, feature: str) -> bool:
+    """Delete the DJ's pin for ``feature``. Returns True iff a row was removed.
+
+    Caller commits.
+    """
+    existing = get_feature_preference(db, user_id=user_id, feature=feature)
+    if existing is None:
+        return False
+    db.delete(existing)
+    db.flush()
+    return True
+```
+
+Add the four function names to the `__all__` list alphabetically:
+`"clear_feature_preference",`, `"get_feature_preference",`, `"get_feature_preferences_for_user",`, `"set_feature_preference",`.
+
+- [ ] **Step 4: Run test to verify it passes**
+
+Run: `cd server && .venv/bin/pytest tests/test_llm_feature_preference.py -x -q`
+Expected: PASS
+
+- [ ] **Step 5: Commit**
+
+```bash
+git add server/app/services/llm/connector_storage.py server/tests/test_llm_feature_preference.py
+git commit -m "feat(llm): feature-preference CRUD helpers in connector_storage"
+```
+
+---
+
+## Task 4: Gateway resolution — feature preference first
+
+**Files:**
+- Modify: `server/app/services/llm/gateway.py`
+- Test: `server/tests/test_llm_feature_preference.py`
+
+- [ ] **Step 1: Write the failing test**
+
+Append to `server/tests/test_llm_feature_preference.py`:
+
+```python
+from unittest.mock import AsyncMock, patch  # noqa: E402  (grouped with gateway tests)
+
+from app.services.llm.adapters.openai_apikey import OpenAIApiKeyAdapter  # noqa: E402
+from app.services.llm.base import ChatRequest, ChatResponse, Message, TokenUsage  # noqa: E402
+from app.services.llm.gateway import Gateway  # noqa: E402
+
+
+def _ok_response() -> ChatResponse:
+    return ChatResponse(
+        text="ok", tool_calls=[], stop_reason="end_turn", usage=TokenUsage(prompt=1, completion=1)
+    )
+
+
+@pytest.mark.asyncio
+async def test_gateway_prefers_feature_pin_over_default(db, dj_user):
+    from app.services.llm.connector_storage import set_default_for_user, set_feature_preference
+
+    pinned = _make_connector(db, dj_user, display_name="pinned")
+    other = _make_connector(db, dj_user, display_name="default")
+    set_default_for_user(db, connector=other)  # per-DJ default points elsewhere
+    set_feature_preference(
+        db, user_id=dj_user.id, feature="recommendation", connector_id=pinned.id
+    )
+    db.commit()
+
+    captured = {}
+
+    async def fake_chat(self, request):  # noqa: ANN001
+        captured["connector_id"] = self.connector.id
+        return _ok_response()
+
+    with patch.object(OpenAIApiKeyAdapter, "chat", new=fake_chat):
+        await Gateway.dispatch(
+            db,
+            dj_user,
+            ChatRequest(messages=[Message(role="user", content="hi")]),
+            purpose="recommendation",
+        )
+    assert captured["connector_id"] == pinned.id
+
+
+@pytest.mark.asyncio
+async def test_gateway_falls_back_when_pinned_connector_auth_invalid(db, dj_user):
+    from app.services.llm.connector_storage import set_default_for_user, set_feature_preference
+
+    pinned = _make_connector(db, dj_user, display_name="pinned", status="auth_invalid")
+    fallback = _make_connector(db, dj_user, display_name="fallback")
+    set_default_for_user(db, connector=fallback)
+    set_feature_preference(
+        db, user_id=dj_user.id, feature="recommendation", connector_id=pinned.id
+    )
+    db.commit()
+
+    captured = {}
+
+    async def fake_chat(self, request):  # noqa: ANN001
+        captured["connector_id"] = self.connector.id
+        return _ok_response()
+
+    with patch.object(OpenAIApiKeyAdapter, "chat", new=fake_chat):
+        await Gateway.dispatch(
+            db,
+            dj_user,
+            ChatRequest(messages=[Message(role="user", content="hi")]),
+            purpose="recommendation",
+        )
+    # Skips the auth_invalid pin, falls through to the per-DJ default.
+    assert captured["connector_id"] == fallback.id
+
+
+@pytest.mark.asyncio
+async def test_gateway_ignores_pin_for_unknown_feature(db, dj_user):
+    """A pin set for one feature must not leak into another purpose."""
+    from app.services.llm.connector_storage import set_feature_preference
+
+    pinned = _make_connector(db, dj_user, display_name="pinned")
+    mru = _make_connector(db, dj_user, display_name="mru")
+    set_feature_preference(
+        db, user_id=dj_user.id, feature="recommendation", connector_id=pinned.id
+    )
+    db.commit()
+
+    captured = {}
+
+    async def fake_chat(self, request):  # noqa: ANN001
+        captured["connector_id"] = self.connector.id
+        return _ok_response()
+
+    with patch.object(OpenAIApiKeyAdapter, "chat", new=fake_chat):
+        await Gateway.dispatch(
+            db,
+            dj_user,
+            ChatRequest(messages=[Message(role="user", content="hi")]),
+            purpose="set_builder",
+        )
+    # No pin for set_builder → MRU resolution (most recently created here is `mru`).
+    assert captured["connector_id"] == mru.id
+```
+
+- [ ] **Step 2: Run test to verify it fails**
+
+Run: `cd server && .venv/bin/pytest tests/test_llm_feature_preference.py -x -q -k gateway`
+Expected: FAIL — the pin is ignored because `_resolve_connector` doesn't know about `purpose`.
+
+- [ ] **Step 3: Thread purpose into resolution**
+
+In `server/app/services/llm/gateway.py`:
+
+Add the storage import near the existing imports:
+
+```python
+from app.services.llm.connector_storage import audit_event, get_feature_preference, log_call
+```
+
+(modify the existing `from app.services.llm.connector_storage import audit_event, log_call` line)
+
+In `Gateway.dispatch`, change the resolve call to pass `purpose`:
+
+```python
+        primary = _resolve_connector(db, actor, purpose=purpose)
+```
+
+Update `_resolve_connector`'s signature and add the feature-preference step as the FIRST check inside the `if actor is not None:` block:
+
+```python
+def _resolve_connector(db: Session, actor: User | None, *, purpose: str) -> LlmConnector:
+    if actor is not None:
+        # 0. Per-feature pin (issue #337) takes precedence over the per-DJ
+        #    default and MRU. Skipped gracefully when the pinned connector was
+        #    deleted (FK row gone) or is no longer active, so a stale/broken
+        #    pin never silently breaks the DJ — resolution falls through.
+        pref = get_feature_preference(db, user_id=actor.id, feature=purpose)
+        if pref is not None:
+            pinned = db.get(LlmConnector, pref.connector_id)
+            if (
+                pinned is not None
+                and pinned.user_id == actor.id
+                and pinned.status == STATUS_ACTIVE
+            ):
+                return pinned
+
+        # Per-DJ explicit default takes precedence over MRU (issue #336).
+        ...
+```
+
+(Leave the rest of `_resolve_connector` unchanged — the `pinned` default block, the MRU block, the org-default fallback.)
+
+- [ ] **Step 4: Run test to verify it passes**
+
+Run: `cd server && .venv/bin/pytest tests/test_llm_feature_preference.py -x -q -k gateway`
+Expected: PASS
+
+Then run the full gateway suite to confirm no regression:
+Run: `cd server && .venv/bin/pytest tests/test_llm_gateway.py tests/test_llm_default_connector.py -q`
+Expected: PASS
+
+- [ ] **Step 5: Update gateway module docstring**
+
+In `server/app/services/llm/gateway.py`, update the "Resolution order" docstring at the top to list the feature-preference step first:
+
+```
+Resolution order:
+1. If ``actor`` is not ``None``:
+   a. The DJ's per-feature pin for ``purpose`` if set and the pinned connector
+      is active (``LlmFeaturePreference`` — issue #337).
+   b. Else: the DJ's explicit default active connector if one is pinned
+      (``LlmConnector.is_default = True``) — issue #336.
+   c. Else: most-recently-used active connector for the DJ.
+2. Else: ``SystemSettings.llm_default_connector_id`` if set and active.
+3. Else: raise :class:`NoLlmConfigured`.
+```
+
+- [ ] **Step 6: Commit**
+
+```bash
+git add server/app/services/llm/gateway.py server/tests/test_llm_feature_preference.py
+git commit -m "feat(llm): gateway resolves per-feature pin first, falls back gracefully"
+```
+
+---
+
+## Task 5: API schemas
+
+**Files:**
+- Modify: `server/app/schemas/llm.py`
+
+- [ ] **Step 1: Add the schemas + feature literal**
+
+In `server/app/schemas/llm.py`, after the existing imports add the known-feature import + a `Literal`-derived alias. Near the top (after `from typing import Literal`):
+
+```python
+from app.models.llm_feature_preference import KNOWN_FEATURES
+
+# Sorted tuple so the OpenAPI enum + frontend list are deterministic.
+KNOWN_FEATURE_VALUES: tuple[str, ...] = tuple(sorted(KNOWN_FEATURES))
+FeatureKey = Literal["recommendation", "set_builder"]
+```
+
+At the end of the file add:
+
+```python
+class FeaturePreferenceOut(BaseModel):
+    """A single per-feature connector pin."""
+
+    model_config = ConfigDict(from_attributes=True)
+
+    feature: FeatureKey
+    connector_id: int
+
+
+class FeaturePreferencesListOut(BaseModel):
+    """All of a DJ's per-feature pins + the catalogue of pinnable features."""
+
+    preferences: list[FeaturePreferenceOut]
+    known_features: list[FeatureKey]
+
+
+class FeaturePreferenceSet(BaseModel):
+    """Set/change a per-feature pin. Upsert — replaces any existing pin."""
+
+    feature: FeatureKey
+    connector_id: int = Field(..., ge=1)
+```
+
+> Note: `FeatureKey` is hand-maintained to match `KNOWN_FEATURES` (Pydantic `Literal` can't be built from a runtime frozenset and still emit a static OpenAPI enum). The model docstring in `llm_feature_preference.py` flags that both must stay in sync; a test in Task 7 asserts they match.
+
+- [ ] **Step 2: Verify it imports**
+
+Run: `cd server && .venv/bin/python -c "from app.schemas.llm import FeaturePreferenceSet, FeaturePreferencesListOut, KNOWN_FEATURE_VALUES; print(KNOWN_FEATURE_VALUES)"`
+Expected: prints `('recommendation', 'set_builder')`
+
+- [ ] **Step 3: Commit**
+
+```bash
+git add server/app/schemas/llm.py
+git commit -m "feat(llm): feature-preference API schemas"
+```
+
+---
+
+## Task 6: API endpoints
+
+**Files:**
+- Modify: `server/app/api/llm.py`
+- Test: `server/tests/test_llm_feature_preference.py`
+
+- [ ] **Step 1: Write the failing test**
+
+Append to `server/tests/test_llm_feature_preference.py`:
+
+```python
+from fastapi.testclient import TestClient  # noqa: E402
+
+
+def _login(client: TestClient, username: str, password: str) -> dict[str, str]:
+    resp = client.post("/api/auth/login", data={"username": username, "password": password})
+    assert resp.status_code == 200, resp.json()
+    return {"Authorization": f"Bearer {resp.json()['access_token']}"}
+
+
+def test_set_list_clear_feature_preference_endpoints(client, db, test_user, auth_headers):
+    c = _make_connector(db, test_user, display_name="Endpoint connector")
+
+    # Set
+    resp = client.post(
+        "/api/llm/feature-preferences",
+        json={"feature": "recommendation", "connector_id": c.id},
+        headers=auth_headers,
+    )
+    assert resp.status_code == 200, resp.json()
+    body = resp.json()
+    assert {p["feature"]: p["connector_id"] for p in body["preferences"]} == {
+        "recommendation": c.id
+    }
+    assert "set_builder" in body["known_features"]
+
+    # List
+    resp = client.get("/api/llm/feature-preferences", headers=auth_headers)
+    assert resp.status_code == 200
+    assert resp.json()["preferences"][0]["connector_id"] == c.id
+
+    # Clear
+    resp = client.delete("/api/llm/feature-preferences/recommendation", headers=auth_headers)
+    assert resp.status_code == 200
+    assert resp.json()["preferences"] == []
+
+
+def test_set_feature_preference_rejects_unknown_feature(client, db, test_user, auth_headers):
+    c = _make_connector(db, test_user, display_name="X")
+    resp = client.post(
+        "/api/llm/feature-preferences",
+        json={"feature": "totally_made_up", "connector_id": c.id},
+        headers=auth_headers,
+    )
+    assert resp.status_code == 422  # Pydantic Literal rejects it
+
+
+def test_set_feature_preference_rejects_other_djs_connector(
+    client, db, test_user, auth_headers
+):
+    # Another DJ owns this connector.
+    other = User(
+        username="otherdj", password_hash=get_password_hash("password123"), role="dj"
+    )
+    db.add(other)
+    db.commit()
+    db.refresh(other)
+    foreign = _make_connector(db, other, display_name="Not yours")
+
+    resp = client.post(
+        "/api/llm/feature-preferences",
+        json={"feature": "recommendation", "connector_id": foreign.id},
+        headers=auth_headers,
+    )
+    assert resp.status_code == 404  # ownership not leaked
+
+
+def test_set_feature_preference_rejects_inactive_connector(
+    client, db, test_user, auth_headers
+):
+    c = _make_connector(db, test_user, display_name="Broken", status="auth_invalid")
+    resp = client.post(
+        "/api/llm/feature-preferences",
+        json={"feature": "recommendation", "connector_id": c.id},
+        headers=auth_headers,
+    )
+    assert resp.status_code == 400
+
+
+def test_clear_unknown_feature_returns_422(client, auth_headers):
+    resp = client.delete("/api/llm/feature-preferences/bogus", headers=auth_headers)
+    assert resp.status_code == 422
+```
+
+- [ ] **Step 2: Run test to verify it fails**
+
+Run: `cd server && .venv/bin/pytest tests/test_llm_feature_preference.py -x -q -k endpoint`
+Expected: FAIL with 404 (route not found) on the first POST.
+
+- [ ] **Step 3: Add the endpoints**
+
+In `server/app/api/llm.py`:
+
+Add to the schema import block:
+
+```python
+from app.schemas.llm import (
+    ConnectorCreate,
+    ConnectorCredentialsRotate,
+    ConnectorOut,
+    ConnectorPatch,
+    ConnectorTestResult,
+    DjPolicyOut,
+    FeatureKey,
+    FeaturePreferenceSet,
+    FeaturePreferencesListOut,
+)
+```
+
+Add to the connector_storage import block:
+
+```python
+from app.services.llm.connector_storage import (
+    ...existing names...,
+    clear_feature_preference,
+    get_feature_preferences_for_user,
+    set_feature_preference,
+)
+```
+
+Add a small helper near `_get_owned_connector_or_404`:
+
+```python
+def _feature_prefs_response(db: Session, user_id: int) -> FeaturePreferencesListOut:
+    """Build the list response: the DJ's current pins + the pinnable catalogue."""
+    from app.schemas.llm import KNOWN_FEATURE_VALUES, FeaturePreferenceOut
+
+    rows = get_feature_preferences_for_user(db, user_id)
+    return FeaturePreferencesListOut(
+        preferences=[FeaturePreferenceOut.model_validate(r) for r in rows],
+        known_features=list(KNOWN_FEATURE_VALUES),  # type: ignore[arg-type]
+    )
+```
+
+Add the three endpoints (place after the unset-default endpoint, before the delete-connector endpoint):
+
+```python
+@router.get("/feature-preferences", response_model=FeaturePreferencesListOut)
+@limiter.limit("60/minute")
+def list_feature_preferences(
+    request: FastAPIRequest,
+    user: User = Depends(get_current_active_user),
+    db: Session = Depends(get_db),
+) -> FeaturePreferencesListOut:
+    """List the DJ's per-feature connector pins (issue #337)."""
+    return _feature_prefs_response(db, user.id)
+
+
+@router.post(
+    "/feature-preferences",
+    response_model=FeaturePreferencesListOut,
+    responses={
+        400: {"description": "Connector is not active and cannot be pinned."},
+        404: {"description": "Connector not found for current user."},
+    },
+)
+@limiter.limit("30/minute")
+def set_feature_preference_endpoint(
+    request: FastAPIRequest,
+    payload: FeaturePreferenceSet,
+    user: User = Depends(get_current_active_user),
+    db: Session = Depends(get_db),
+) -> FeaturePreferencesListOut:
+    """Pin (or re-pin) a connector to a feature for the current DJ.
+
+    Validates connector ownership server-side (404 for IDs the DJ doesn't own,
+    so another DJ's connector existence is never leaked) and rejects pinning a
+    non-active connector (400) — the gateway would skip it anyway, so silently
+    accepting it is a footgun.
+    """
+    row = _get_owned_connector_or_404(db, payload.connector_id, user.id)
+    if row.status != "active":
+        raise HTTPException(
+            status_code=400,
+            detail="Only an active connector can be pinned to a feature",
+        )
+    set_feature_preference(
+        db, user_id=user.id, feature=payload.feature, connector_id=row.id
+    )
+    db.commit()
+    return _feature_prefs_response(db, user.id)
+
+
+@router.delete("/feature-preferences/{feature}", response_model=FeaturePreferencesListOut)
+@limiter.limit("30/minute")
+def clear_feature_preference_endpoint(
+    request: FastAPIRequest,
+    feature: FeatureKey,
+    user: User = Depends(get_current_active_user),
+    db: Session = Depends(get_db),
+) -> FeaturePreferencesListOut:
+    """Clear the DJ's pin for ``feature`` (no-op if unset). Returns the new list."""
+    clear_feature_preference(db, user_id=user.id, feature=feature)
+    db.commit()
+    return _feature_prefs_response(db, user.id)
+```
+
+> Path-param `feature: FeatureKey` makes FastAPI return 422 for unknown features automatically.
+
+- [ ] **Step 4: Run test to verify it passes**
+
+Run: `cd server && .venv/bin/pytest tests/test_llm_feature_preference.py -x -q -k "endpoint or feature"`
+Expected: PASS
+
+- [ ] **Step 5: Commit**
+
+```bash
+git add server/app/api/llm.py server/tests/test_llm_feature_preference.py
+git commit -m "feat(llm): set/clear/list feature-preference endpoints"
+```
+
+---
+
+## Task 7: Consistency guard + full backend CI
+
+**Files:**
+- Test: `server/tests/test_llm_feature_preference.py`
+
+- [ ] **Step 1: Add a guard test that FeatureKey == KNOWN_FEATURES**
+
+Append to `server/tests/test_llm_feature_preference.py`:
+
+```python
+def test_feature_key_literal_matches_known_features():
+    """FeatureKey (the OpenAPI enum) must stay in sync with KNOWN_FEATURES."""
+    import typing
+
+    from app.schemas.llm import FeatureKey
+
+    literal_values = set(typing.get_args(FeatureKey))
+    assert literal_values == set(KNOWN_FEATURES)
+```
+
+- [ ] **Step 2: Run the full new test file**
+
+Run: `cd server && .venv/bin/pytest tests/test_llm_feature_preference.py -q`
+Expected: PASS (all tests)
+
+- [ ] **Step 3: Run full backend CI**
+
+```bash
+cd server
+.venv/bin/ruff check .
+.venv/bin/ruff format --check .
+.venv/bin/bandit -r app -c pyproject.toml -q
+.venv/bin/alembic upgrade head && .venv/bin/alembic check
+.venv/bin/pytest --tb=short -q
+```
+
+Expected: ruff clean, bandit clean, alembic check clean, pytest passes with coverage ≥ gate. Fix any failures before committing.
+
+- [ ] **Step 4: Commit**
+
+```bash
+git add server/tests/test_llm_feature_preference.py
+git commit -m "test(llm): guard FeatureKey/KNOWN_FEATURES sync"
+```
+
+---
+
+## Task 8: Frontend — regenerate types + api.ts methods
+
+**Files:**
+- Modify: `dashboard/lib/api-types.generated.ts` (regenerated), `dashboard/lib/api-types.ts`, `dashboard/lib/api.ts`
+
+- [ ] **Step 1: Regenerate OpenAPI types**
+
+```bash
+cd dashboard
+npm run types:export
+npm run types:generate
+git checkout ../dashboard/next-env.d.ts 2>/dev/null || true
+```
+
+Expected: `lib/api-types.generated.ts` now contains `FeaturePreferenceOut`, `FeaturePreferencesListOut`, `FeaturePreferenceSet` schemas.
+
+- [ ] **Step 2: Re-export the new types**
+
+In `dashboard/lib/api-types.ts`, in the LLM gateway block, add:
+
+```typescript
+export type LlmFeaturePreference = Schemas['FeaturePreferenceOut'];
+export type LlmFeaturePreferences = Schemas['FeaturePreferencesListOut'];
+export type LlmFeaturePreferenceSet = Schemas['FeaturePreferenceSet'];
+export type LlmFeatureKey = Schemas['FeaturePreferenceOut']['feature'];
+```
+
+- [ ] **Step 3: Add api.ts methods**
+
+In `dashboard/lib/api.ts`, add the type imports to the existing LLM import + re-export blocks:
+`LlmFeaturePreferences`, `LlmFeaturePreferenceSet`, `LlmFeatureKey`.
+
+Then add methods after `unsetLlmConnectorDefault`:
+
+```typescript
+  async listLlmFeaturePreferences(): Promise<LlmFeaturePreferences> {
+    return this.fetch('/api/llm/feature-preferences');
+  }
+
+  async setLlmFeaturePreference(
+    data: LlmFeaturePreferenceSet,
+  ): Promise<LlmFeaturePreferences> {
+    return this.fetch('/api/llm/feature-preferences', {
+      method: 'POST',
+      body: JSON.stringify(data),
+    });
+  }
+
+  async clearLlmFeaturePreference(
+    feature: LlmFeatureKey,
+  ): Promise<LlmFeaturePreferences> {
+    return this.fetch(`/api/llm/feature-preferences/${feature}`, {
+      method: 'DELETE',
+    });
+  }
+```
+
+- [ ] **Step 4: Type-check**
+
+Run: `cd dashboard && npx tsc --noEmit`
+Expected: no errors.
+
+- [ ] **Step 5: Commit**
+
+```bash
+git add dashboard/lib/api-types.generated.ts dashboard/lib/api-types.ts dashboard/lib/api.ts server/openapi.json
+git commit -m "feat(ai-ui): api client methods + types for feature preferences"
+```
+
+---
+
+## Task 9: Frontend — "Per-feature defaults" section
+
+**Files:**
+- Modify: `dashboard/components/AiProvidersSection.tsx`
+- Test: `dashboard/components/__tests__/AiProvidersSection.featurePrefs.test.tsx` (create)
+
+- [ ] **Step 1: Write the failing test**
+
+Check first whether a test file already exists for this component:
+Run: `ls dashboard/components/__tests__/ 2>/dev/null | grep -i aiprovider || ls dashboard/**/__tests__/ 2>/dev/null`
+
+Create `dashboard/components/__tests__/AiProvidersSection.featurePrefs.test.tsx`:
+
+```tsx
+import { render, screen, waitFor, fireEvent } from '@testing-library/react';
+import { describe, it, expect, vi, beforeEach } from 'vitest';
+
+import AiProvidersSection from '../AiProvidersSection';
+import { api } from '@/lib/api';
+
+vi.mock('@/lib/api', () => ({
+  api: {
+    listLlmConnectors: vi.fn(),
+    getLlmPolicy: vi.fn(),
+    listOpenRouterModels: vi.fn(),
+    listLlmFeaturePreferences: vi.fn(),
+    setLlmFeaturePreference: vi.fn(),
+    clearLlmFeaturePreference: vi.fn(),
+  },
+}));
+
+const connector = {
+  id: 1,
+  user_id: 1,
+  connector_type: 'openai_apikey',
+  display_name: 'My OpenAI',
+  status: 'active',
+  base_url_plain: null,
+  model_hint: null,
+  created_at: '2026-01-01T00:00:00Z',
+  updated_at: '2026-01-01T00:00:00Z',
+  last_used_at: null,
+  last_error: null,
+  is_default: false,
+  last_health_check_at: null,
+  last_health_check_status: null,
+};
+
+beforeEach(() => {
+  vi.clearAllMocks();
+  (api.listLlmConnectors as any).mockResolvedValue([connector]);
+  (api.getLlmPolicy as any).mockResolvedValue({
+    llm_apikey_connectors_enabled: true,
+    llm_compatible_connector_enabled: true,
+    allowed_connector_types: ['openai_apikey'],
+  });
+  (api.listLlmFeaturePreferences as any).mockResolvedValue({
+    preferences: [],
+    known_features: ['recommendation', 'set_builder'],
+  });
+});
+
+describe('AiProvidersSection per-feature defaults', () => {
+  it('renders a picker per known feature and sets a pin', async () => {
+    (api.setLlmFeaturePreference as any).mockResolvedValue({
+      preferences: [{ feature: 'recommendation', connector_id: 1 }],
+      known_features: ['recommendation', 'set_builder'],
+    });
+
+    render(<AiProvidersSection />);
+
+    await waitFor(() => expect(screen.getByText(/Per-feature defaults/i)).toBeInTheDocument());
+
+    const select = screen.getByLabelText(/recommendation/i) as HTMLSelectElement;
+    fireEvent.change(select, { target: { value: '1' } });
+
+    await waitFor(() =>
+      expect(api.setLlmFeaturePreference).toHaveBeenCalledWith({
+        feature: 'recommendation',
+        connector_id: 1,
+      }),
+    );
+  });
+
+  it('clears a pin when "Use account default" is selected', async () => {
+    (api.listLlmFeaturePreferences as any).mockResolvedValue({
+      preferences: [{ feature: 'recommendation', connector_id: 1 }],
+      known_features: ['recommendation', 'set_builder'],
+    });
+    (api.clearLlmFeaturePreference as any).mockResolvedValue({
+      preferences: [],
+      known_features: ['recommendation', 'set_builder'],
+    });
+
+    render(<AiProvidersSection />);
+    await waitFor(() => expect(screen.getByText(/Per-feature defaults/i)).toBeInTheDocument());
+
+    const select = screen.getByLabelText(/recommendation/i) as HTMLSelectElement;
+    fireEvent.change(select, { target: { value: '' } });
+
+    await waitFor(() =>
+      expect(api.clearLlmFeaturePreference).toHaveBeenCalledWith('recommendation'),
+    );
+  });
+});
+```
+
+- [ ] **Step 2: Run test to verify it fails**
+
+Run: `cd dashboard && npm test -- --run AiProvidersSection.featurePrefs`
+Expected: FAIL — no "Per-feature defaults" section yet.
+
+- [ ] **Step 3: Implement the section**
+
+In `dashboard/components/AiProvidersSection.tsx`:
+
+Add to the type import block:
+
+```typescript
+import type {
+  AIModelInfo,
+  LlmConnector,
+  LlmConnectorCreate,
+  LlmConnectorType,
+  LlmDjPolicy,
+  LlmFeaturePreferences,
+  LlmFeatureKey,
+} from '@/lib/api-types';
+```
+
+Add a human-readable feature label map near `CONNECTOR_TYPE_LABELS`:
+
+```typescript
+const FEATURE_LABELS: Record<string, string> = {
+  recommendation: 'Recommendations',
+  set_builder: 'Set builder',
+};
+```
+
+Add state inside the component (next to the other `useState` hooks):
+
+```typescript
+  const [featurePrefs, setFeaturePrefs] = useState<LlmFeaturePreferences | null>(null);
+```
+
+Add `api.listLlmFeaturePreferences()` to the initial `Promise.all`:
+
+```typescript
+    Promise.all([api.listLlmConnectors(), fetchPolicySoft(), fetchFeaturePrefsSoft()])
+      .then(([rows, p, prefs]) => {
+        if (!active) return;
+        setConnectors(rows);
+        setPolicy(p);
+        setFeaturePrefs(prefs);
+      })
+```
+
+Add handlers near `handleUnsetDefault`:
+
+```typescript
+  const handleFeaturePrefChange = async (feature: LlmFeatureKey, value: string) => {
+    try {
+      const updated =
+        value === ''
+          ? await api.clearLlmFeaturePreference(feature)
+          : await api.setLlmFeaturePreference({
+              feature,
+              connector_id: Number(value),
+            });
+      setFeaturePrefs(updated);
+      setError('');
+    } catch (err) {
+      setError(err instanceof Error ? err.message : 'Failed to update feature default');
+    }
+  };
+```
+
+Add the section JSX after the "Connected providers" `</section>` (before the "Add provider" section). Only render it when there is at least one active connector to pin:
+
+```tsx
+      {featurePrefs && featurePrefs.known_features.length > 0 && (
+        <section style={{ marginTop: '2rem' }}>
+          <h3 style={{ marginTop: 0 }}>Per-feature defaults</h3>
+          <p style={{ color: 'var(--text-secondary)' }}>
+            Pin a specific provider to each AI feature. Unpinned features use your account
+            default (or most-recently-used) connector. Inactive connectors are skipped
+            automatically.
+          </p>
+          {featurePrefs.known_features.map((feature) => {
+            const current =
+              featurePrefs.preferences.find((p) => p.feature === feature)?.connector_id ?? '';
+            const selectId = `feature-pref-${feature}`;
+            const activeConnectors = connectors.filter((c) => c.status === 'active');
+            return (
+              <div className="form-group" key={feature}>
+                <label htmlFor={selectId}>{FEATURE_LABELS[feature] ?? feature}</label>
+                <select
+                  id={selectId}
+                  className="input"
+                  value={current === '' ? '' : String(current)}
+                  onChange={(e) =>
+                    handleFeaturePrefChange(feature as LlmFeatureKey, e.target.value)
+                  }
+                >
+                  <option value="">Use account default</option>
+                  {activeConnectors.map((c) => (
+                    <option key={c.id} value={String(c.id)}>
+                      {c.display_name}
+                    </option>
+                  ))}
+                </select>
+              </div>
+            );
+          })}
+        </section>
+      )}
+```
+
+Add the soft-fetch helper near `fetchPolicySoft` at the bottom:
+
+```typescript
+async function fetchFeaturePrefsSoft(): Promise<LlmFeaturePreferences | null> {
+  try {
+    return await api.listLlmFeaturePreferences();
+  } catch {
+    return null;
+  }
+}
+```
+
+> Design note: the `<label htmlFor>` text is the feature label ("Recommendations") so `getByLabelText(/recommendation/i)` in the test matches. The picker uses connector_id values as strings; empty string = "Use account default" → clears the pin.
+
+- [ ] **Step 4: Run test to verify it passes**
+
+Run: `cd dashboard && npm test -- --run AiProvidersSection.featurePrefs`
+Expected: PASS
+
+- [ ] **Step 5: Run full frontend CI**
+
+```bash
+cd dashboard
+npm run lint
+npx tsc --noEmit
+npm test -- --run
+git checkout lib/../next-env.d.ts 2>/dev/null || git checkout next-env.d.ts 2>/dev/null || true
+```
+
+Expected: lint clean, tsc clean, all vitest pass. (Coverage thresholds enforced — if the new component branch drops coverage, the existing tests + the two new tests should cover the added code paths.)
+
+- [ ] **Step 6: Commit**
+
+```bash
+git add dashboard/components/AiProvidersSection.tsx dashboard/components/__tests__/AiProvidersSection.featurePrefs.test.tsx
+git commit -m "feat(ai-ui): per-feature defaults section on DJ AI settings"
+```
+
+---
+
+## Task 10: Final verification + PR
+
+- [ ] **Step 1: Full backend + frontend CI once more (all green)**
+
+```bash
+cd server && .venv/bin/ruff check . && .venv/bin/ruff format --check . && .venv/bin/bandit -r app -c pyproject.toml -q && .venv/bin/alembic upgrade head && .venv/bin/alembic check && .venv/bin/pytest --tb=short -q
+cd ../dashboard && npm run lint && npx tsc --noEmit && npm test -- --run
+git -C .. checkout dashboard/next-env.d.ts 2>/dev/null || true
+```
+
+- [ ] **Step 2: Push + open PR (use superpowers:finishing-a-development-branch, option 2)**
+
+```bash
+git push -u origin feat/issue-337
+gh pr create --base epic/ai-engine --title "feat(llm): per-feature connector preference (#337)" --body "..."
+```
+
+PR body MUST include `Closes #337`, a `## Design decisions` section, and a note that it targets `epic/ai-engine`.
+
+---
+
+## Self-Review
+
+**Spec coverage:**
+- New `LlmFeaturePreference` model (id, user_id, feature, connector_id, created_at) — Task 1. ✓
+- UNIQUE (user_id, feature) — Task 1 (`__table_args__`) + Task 2 (migration). ✓
+- Migration off rev 049, named `050_*` — Task 2. ✓
+- Resolution order feature → per-DJ default → MRU → org default → NoLlmConfigured — Task 4. ✓
+- Graceful fallback when pinned connector deleted or auth_invalid — Task 4 (tests + skip logic). ✓
+- Endpoints set/change/clear scoped to current user, rate-limited, feature allowlist — Tasks 5+6. ✓
+- Connector ownership validation (no cross-DJ pin) — Task 6 (404 test). ✓
+- Frontend "Per-feature defaults" section + api.ts methods + api-types — Tasks 8+9. ✓
+- DJ can set, change, clear a pin (acceptance) — Tasks 6 (set=upsert covers change) + 9. ✓
+
+**Placeholder scan:** No TBD/TODO; every code step shows full content. PR body content deferred to Task 10 (acceptable — it's prose, drafted at PR time from commit history).
+
+**Type consistency:** `set_feature_preference`, `clear_feature_preference`, `get_feature_preferences_for_user`, `get_feature_preference` used consistently across Tasks 3/4/6. `FeatureKey` / `FeaturePreferenceSet` / `FeaturePreferencesListOut` / `FeaturePreferenceOut` consistent across Tasks 5/6/8. `LlmFeaturePreferences` / `LlmFeatureKey` / `LlmFeaturePreferenceSet` consistent across Tasks 8/9.
diff --git a/docs/superpowers/plans/2026-06-07-wrzdjset-phase0.md b/docs/superpowers/plans/2026-06-07-wrzdjset-phase0.md
deleted file mode 100644
index 3a4509e3..00000000
--- a/docs/superpowers/plans/2026-06-07-wrzdjset-phase0.md
+++ /dev/null
@@ -1,2061 +0,0 @@
-# WrzDJSet Phase 0: Foundation Implementation Plan
-
-> **For agentic workers:** REQUIRED SUB-SKILL: Use superpowers:subagent-driven-development (recommended) or superpowers:executing-plans to implement this plan task-by-task. Steps use checkbox (`- [ ]`) syntax for tracking.
-
-**Goal:** Lay the foundational scaffold for WrzDJSet — SQLAlchemy models, one Alembic migration, a `/api/setbuilder/*` router with set CRUD, an LLM gateway interface stub, and a dashboard builder shell (set list + 4-panel workspace).
-
-**Architecture:** Backend follows the existing WrzDJ FastAPI/SQLAlchemy 2.0 pattern: models in `app/models/`, Pydantic schemas in `app/schemas/`, business logic in `app/services/`, thin routers in `app/api/`. Auth uses the existing `get_current_active_user` dependency (rejects pending users). Sets are owner-scoped; ownership checks return 404 (not 403) to avoid leaking existence, matching `get_owned_event_by_id`. The LLM gateway is a provider-agnostic interface (`services/llm/gateway.py`) whose temporary implementation delegates to the existing `services/recommendation/llm_client.py` — no setbuilder code imports a provider SDK directly. Frontend lives under the `(dj)` route group (shares auth-gated layout) at `dashboard/app/setbuilder/`, matching the existing dashboard page conventions (vanilla CSS + inline styles, dark theme, `api` client singleton).
-
-**Tech Stack:** Python 3.11+ / FastAPI / SQLAlchemy 2.0 / Alembic / Pydantic v2 / pytest (SQLite in-memory) on the backend; Next.js 16 / React 19 / TypeScript / vitest on the frontend.
-
----
-
-## File Structure
-
-**Backend (create):**
-- `server/app/models/set.py` — `Set`, `SetSlot`, `SetCurvePoint`, `SetCollaborator` ORM models
-- `server/app/models/track_vibe.py` — `TrackVibe`, `TrackVibeOverride` ORM models (incl. the 5-col UNIQUE on TrackVibe)
-- `server/app/schemas/setbuilder.py` — Pydantic request/response models for set CRUD
-- `server/app/services/setbuilder/__init__.py` — package marker
-- `server/app/services/setbuilder/set_service.py` — set CRUD business logic (owner-scoped)
-- `server/app/services/llm/__init__.py` — package marker
-- `server/app/services/llm/gateway.py` — provider-agnostic gateway interface + temporary delegating impl
-- `server/app/api/setbuilder.py` — FastAPI router, `/api/setbuilder/*`, set CRUD only
-- `server/alembic/versions/046_add_setbuilder_tables.py` — one migration creating all 6 tables
-- `server/tests/test_setbuilder_models.py` — model + constraint tests
-- `server/tests/test_setbuilder_api.py` — CRUD endpoint + auth-gating tests
-- `server/tests/test_llm_gateway.py` — gateway interface/stub tests
-
-**Backend (modify):**
-- `server/app/models/__init__.py` — register the 6 new models
-- `server/app/api/__init__.py` — include the setbuilder router
-
-**Frontend (create):**
-- `dashboard/app/setbuilder/page.tsx` — set list (create/list/rename/delete)
-- `dashboard/app/setbuilder/[setId]/page.tsx` — builder workspace, 4-panel grid
-- `dashboard/app/setbuilder/setbuilder.module.css` — scoped styles for the 4-panel grid
-- `dashboard/app/setbuilder/__tests__/page.test.tsx` — set list render/CRUD test
-
-**Frontend (modify):**
-- `dashboard/lib/api-types.ts` — add `SetSummary`, `SetDetail`, `SetCreate`, `SetRename` types
-- `dashboard/lib/api.ts` — add `listSets`/`createSet`/`getSet`/`renameSet`/`deleteSet` methods
-
----
-
-## Design decisions (locked for this phase)
-
-These resolve ambiguities in the issue/exec-summary. Document them in the PR body too.
-
-1. **Set must move under the `(dj)` route group?** The issue says `dashboard/app/setbuilder/page.tsx`. But the existing auth-gated DJ pages live under `dashboard/app/(dj)/`. Route groups `(dj)` do **not** change the URL — `app/(dj)/dashboard` serves `/dashboard`. Putting setbuilder at `app/setbuilder/` (outside the group) serves `/setbuilder` but does NOT inherit the `(dj)` layout (ThemeToggle). **Decision:** Follow the issue literally — create at `dashboard/app/setbuilder/` (URL `/setbuilder`). Each page does its own auth guard via `useAuth` (same pattern the dashboard page uses internally), so no functionality is lost. This honors the issue's explicit path.
-2. **`track_id` is a free-form string, not an FK.** The exec-summary models `TrackVibe.track_id`/`SetSlot.track_id` against a global track identity that does not yet exist in WrzDJ (requests use Spotify/Tidal/Beatport source URLs, not a unified track table). **Decision:** model `track_id` as an indexed `String(255)` (a service-namespaced external ID like `tidal:12345`), nullable on `SetSlot` (a slot can be empty pre-fill). No FK in Phase 0.
-3. **TrackVibe nullability:** energy/mood/era/transitional_role/confidence are LLM-derived and absent until enrichment runs (Phase 1). **Decision:** all vibe-signal columns nullable except the 5 identity columns in the UNIQUE constraint (`track_id`, `llm_provider`, `llm_model`, `prompt_version`, `schema_version`), which are `nullable=False`.
-4. **Enums as `String(N)` columns, not DB enums** — matches every existing WrzDJ model (`User.role`, `Event.collection_phase_override`, request status). Pydantic `Literal[...]` enforces values at the API boundary.
-5. **Ownership errors return 404, not 403** — matches `get_owned_event_by_id`; avoids leaking set existence to non-owners.
-6. **Gateway stub surface:** a single async `dispatch(messages, tool, *, model_hint, ...)` entrypoint returning a normalized `GatewayResponse{tool_calls, text}`. The temporary impl maps `dispatch` onto the existing `call_llm`-style Anthropic path **inside `gateway.py` only** by importing the existing `llm_client` module — setbuilder code imports `gateway`, never `anthropic` or `llm_client`. Provider/model identifiers are passed as data (strings), never imported.
-
----
-
-## Task 1: TrackVibe + TrackVibeOverride models
-
-**Files:**
-- Create: `server/app/models/track_vibe.py`
-- Modify: `server/app/models/__init__.py`
-- Test: `server/tests/test_setbuilder_models.py`
-
-- [ ] **Step 1: Write the failing test**
-
-Create `server/tests/test_setbuilder_models.py`:
-
-```python
-"""Model + constraint tests for WrzDJSet Phase 0 tables."""
-
-import pytest
-from sqlalchemy.exc import IntegrityError
-
-from app.models.track_vibe import TrackVibe, TrackVibeOverride
-
-
-def test_track_vibe_persists_with_identity_columns(db):
-    vibe = TrackVibe(
-        track_id="tidal:12345",
-        llm_provider="anthropic",
-        llm_model="claude-haiku-4-5",
-        prompt_version="v1",
-        schema_version="v1",
-        energy=7,
-        mood="euphoric",
-        era="2010s",
-        sing_along=True,
-        dance_floor=True,
-        transitional_role="peak",
-        confidence=0.8,
-    )
-    db.add(vibe)
-    db.commit()
-    db.refresh(vibe)
-    assert vibe.id is not None
-    assert vibe.energy == 7
-    assert vibe.created_at is not None
-
-
-def test_track_vibe_unique_constraint(db):
-    """UNIQUE(track_id, llm_provider, llm_model, prompt_version, schema_version)."""
-    kwargs = dict(
-        track_id="tidal:12345",
-        llm_provider="anthropic",
-        llm_model="claude-haiku-4-5",
-        prompt_version="v1",
-        schema_version="v1",
-    )
-    db.add(TrackVibe(**kwargs))
-    db.commit()
-    db.add(TrackVibe(**kwargs))
-    with pytest.raises(IntegrityError):
-        db.commit()
-    db.rollback()
-
-
-def test_track_vibe_same_track_different_model_allowed(db):
-    """Same track under a different model is a distinct cache row."""
-    db.add(
-        TrackVibe(
-            track_id="tidal:12345",
-            llm_provider="anthropic",
-            llm_model="claude-haiku-4-5",
-            prompt_version="v1",
-            schema_version="v1",
-        )
-    )
-    db.add(
-        TrackVibe(
-            track_id="tidal:12345",
-            llm_provider="openai",
-            llm_model="gpt-5-mini",
-            prompt_version="v1",
-            schema_version="v1",
-        )
-    )
-    db.commit()
-    assert db.query(TrackVibe).count() == 2
-
-
-def test_track_vibe_override_persists(db):
-    override = TrackVibeOverride(
-        track_id="tidal:12345",
-        user_id=1,
-        energy_override=9,
-        mood_override="dark",
-        energy_was=7,
-        mood_was="euphoric",
-        source="explicit_edit",
-    )
-    db.add(override)
-    db.commit()
-    db.refresh(override)
-    assert override.id is not None
-    assert override.source == "explicit_edit"
-    assert override.created_at is not None
-```
-
-- [ ] **Step 2: Run the tests to verify they fail**
-
-Run: `cd server && .venv/bin/pytest tests/test_setbuilder_models.py -v`
-Expected: FAIL with `ModuleNotFoundError: No module named 'app.models.track_vibe'`
-
-- [ ] **Step 3: Write the model implementation**
-
-Create `server/app/models/track_vibe.py`:
-
-```python
-"""WrzDJSet vibe-signal models (Phase 0 scaffold).
-
-TrackVibe is a GLOBAL LLM cache — one row per (track, provider, model,
-prompt_version, schema_version). TrackVibeOverride is a per-DJ taste signal
-that aggregates upward into a community consensus (read-time precedence:
-DJ override -> community consensus -> LLM cached). Vibe-signal columns are
-nullable: they are filled by the enrichment pipeline in a later phase.
-"""
-
-from datetime import datetime
-
-from sqlalchemy import (
-    Boolean,
-    DateTime,
-    Float,
-    Integer,
-    String,
-    Text,
-    UniqueConstraint,
-)
-from sqlalchemy.orm import Mapped, mapped_column
-
-from app.core.time import utcnow
-from app.models.base import Base
-
-
-class TrackVibe(Base):
-    """Global LLM vibe cache. One row per track+provider+model+prompt+schema."""
-
-    __tablename__ = "track_vibes"
-    __table_args__ = (
-        UniqueConstraint(
-            "track_id",
-            "llm_provider",
-            "llm_model",
-            "prompt_version",
-            "schema_version",
-            name="uq_track_vibe_identity",
-        ),
-    )
-
-    id: Mapped[int] = mapped_column(primary_key=True)
-    track_id: Mapped[str] = mapped_column(String(255), nullable=False, index=True)
-
-    # Vibe signal (LLM-derived, filled by enrichment in a later phase)
-    energy: Mapped[int | None] = mapped_column(Integer, nullable=True)  # 0-10
-    mood: Mapped[str | None] = mapped_column(String(50), nullable=True)
-    era: Mapped[str | None] = mapped_column(String(50), nullable=True)
-    sing_along: Mapped[bool | None] = mapped_column(Boolean, nullable=True)
-    dance_floor: Mapped[bool | None] = mapped_column(Boolean, nullable=True)
-    # "intro" | "build" | "peak" | "cool" | "any"
-    transitional_role: Mapped[str | None] = mapped_column(String(20), nullable=True)
-    confidence: Mapped[float | None] = mapped_column(Float, nullable=True)  # 0-1
-
-    # Provenance / granular invalidation (identity columns — part of UNIQUE)
-    llm_provider: Mapped[str] = mapped_column(String(50), nullable=False)
-    llm_model: Mapped[str] = mapped_column(String(100), nullable=False)
-    prompt_version: Mapped[str] = mapped_column(String(20), nullable=False)
-    schema_version: Mapped[str] = mapped_column(String(20), nullable=False)
-
-    created_at: Mapped[datetime] = mapped_column(DateTime, default=utcnow)
-
-
-class TrackVibeOverride(Base):
-    """Per-DJ taste override. Aggregated upward into community consensus."""
-
-    __tablename__ = "track_vibe_overrides"
-
-    id: Mapped[int] = mapped_column(primary_key=True)
-    track_id: Mapped[str] = mapped_column(String(255), nullable=False, index=True)
-    user_id: Mapped[int] = mapped_column(Integer, nullable=False, index=True)
-
-    energy_override: Mapped[int | None] = mapped_column(Integer, nullable=True)
-    mood_override: Mapped[str | None] = mapped_column(String(50), nullable=True)
-
-    # Good-citizen provenance for future taste training
-    overridden_from_vibe_id: Mapped[int | None] = mapped_column(Integer, nullable=True)
-    energy_was: Mapped[int | None] = mapped_column(Integer, nullable=True)
-    mood_was: Mapped[str | None] = mapped_column(String(50), nullable=True)
-    # "explicit_edit" | "upvote" | "downvote_implicit"
-    source: Mapped[str] = mapped_column(String(30), nullable=False)
-    notes: Mapped[str | None] = mapped_column(Text, nullable=True)
-
-    created_at: Mapped[datetime] = mapped_column(DateTime, default=utcnow)
-```
-
-- [ ] **Step 4: Register models in the package `__init__`**
-
-In `server/app/models/__init__.py`, add the import after the `system_settings` import line and the names to `__all__`. The file currently imports alphabetically and lists names in `__all__`. Add:
-
-```python
-from app.models.track_vibe import TrackVibe, TrackVibeOverride
-```
-
-(place it after the `from app.models.system_settings import SystemSettings` line)
-
-And add `"TrackVibe"` and `"TrackVibeOverride"` to the `__all__` list (keep it alphabetical — they go after `"SystemSettings"`).
-
-- [ ] **Step 5: Run the tests to verify they pass**
-
-Run: `cd server && .venv/bin/pytest tests/test_setbuilder_models.py -v`
-Expected: 4 PASS (the TrackVibe tests). (Set/SetSlot tests are added in Task 2.)
-
-- [ ] **Step 6: Commit**
-
-```bash
-git add server/app/models/track_vibe.py server/app/models/__init__.py server/tests/test_setbuilder_models.py
-git commit -m "feat(setbuilder): add TrackVibe + TrackVibeOverride models"
-```
-
----
-
-## Task 2: Set, SetSlot, SetCurvePoint, SetCollaborator models
-
-**Files:**
-- Create: `server/app/models/set.py`
-- Modify: `server/app/models/__init__.py`
-- Test: `server/tests/test_setbuilder_models.py` (append)
-
-- [ ] **Step 1: Write the failing tests (append to the existing test file)**
-
-Append to `server/tests/test_setbuilder_models.py`:
-
-```python
-from app.models.set import Set, SetCollaborator, SetCurvePoint, SetSlot
-
-
-def _make_user(db):
-    from app.models.user import User
-    from app.services.auth import get_password_hash
-
-    user = User(username="setowner", password_hash=get_password_hash("x" * 12), role="dj")
-    db.add(user)
-    db.commit()
-    db.refresh(user)
-    return user
-
-
-def test_set_persists_with_defaults(db):
-    user = _make_user(db)
-    s = Set(owner_id=user.id, name="Friday Wedding")
-    db.add(s)
-    db.commit()
-    db.refresh(s)
-    assert s.id is not None
-    assert s.status == "draft"
-    assert s.sharing_mode == "private"
-    assert s.key_strictness == 0.2
-    assert s.event_id is None
-    assert s.created_at is not None
-    assert s.updated_at is not None
-
-
-def test_set_slot_cascade_delete(db):
-    user = _make_user(db)
-    s = Set(owner_id=user.id, name="Set")
-    db.add(s)
-    db.commit()
-    db.add(SetSlot(set_id=s.id, position=0, track_id="tidal:1"))
-    db.add(SetCurvePoint(set_id=s.id, position_sec=0, energy=3))
-    db.add(SetCollaborator(set_id=s.id, user_id=user.id, role="editor", invited_by=user.id))
-    db.commit()
-    assert db.query(SetSlot).count() == 1
-    assert db.query(SetCurvePoint).count() == 1
-    assert db.query(SetCollaborator).count() == 1
-
-    db.delete(s)
-    db.commit()
-    assert db.query(SetSlot).count() == 0
-    assert db.query(SetCurvePoint).count() == 0
-    assert db.query(SetCollaborator).count() == 0
-
-
-def test_set_slot_locked_defaults_false(db):
-    user = _make_user(db)
-    s = Set(owner_id=user.id, name="Set")
-    db.add(s)
-    db.commit()
-    slot = SetSlot(set_id=s.id, position=0, track_id="tidal:1")
-    db.add(slot)
-    db.commit()
-    db.refresh(slot)
-    assert slot.locked is False
-    assert slot.transition_score is None
-
-
-def test_set_slot_empty_track_allowed(db):
-    user = _make_user(db)
-    s = Set(owner_id=user.id, name="Set")
-    db.add(s)
-    db.commit()
-    slot = SetSlot(set_id=s.id, position=0)
-    db.add(slot)
-    db.commit()
-    db.refresh(slot)
-    assert slot.track_id is None
-```
-
-- [ ] **Step 2: Run the tests to verify they fail**
-
-Run: `cd server && .venv/bin/pytest tests/test_setbuilder_models.py -v -k "set"`
-Expected: FAIL with `ModuleNotFoundError: No module named 'app.models.set'`
-
-- [ ] **Step 3: Write the model implementation**
-
-Create `server/app/models/set.py`:
-
-```python
-"""WrzDJSet core models (Phase 0 scaffold).
-
-A Set is a standalone, owner-private DJ set with an optional event link.
-SetSlot rows are the ordered timeline; SetCurvePoint rows are the energy
-curve; SetCollaborator is modeled now (per exec-summary) but invite/enforce
-flows ship in v3. Child rows cascade-delete with their parent Set.
-
-Enum-like columns are String(N) (matching every other WrzDJ model);
-allowed values are enforced at the API boundary via Pydantic Literals.
-"""
-
-from datetime import datetime
-
-from sqlalchemy import (
-    Boolean,
-    DateTime,
-    Float,
-    ForeignKey,
-    Integer,
-    String,
-    Text,
-)
-from sqlalchemy.orm import Mapped, mapped_column, relationship
-
-from app.core.time import utcnow
-from app.models.base import Base
-
-
-class Set(Base):
-    __tablename__ = "sets"
-
-    id: Mapped[int] = mapped_column(primary_key=True)
-    owner_id: Mapped[int] = mapped_column(
-        ForeignKey("users.id", ondelete="CASCADE"), nullable=False, index=True
-    )
-    event_id: Mapped[int | None] = mapped_column(
-        ForeignKey("events.id", ondelete="SET NULL"), nullable=True, index=True
-    )
-    name: Mapped[str] = mapped_column(String(120), nullable=False)
-    vibe_theme: Mapped[str | None] = mapped_column(String(50), nullable=True)
-
-    target_duration_sec: Mapped[int | None] = mapped_column(Integer, nullable=True)
-    bpm_floor: Mapped[int | None] = mapped_column(Integer, nullable=True)
-    bpm_ceiling: Mapped[int | None] = mapped_column(Integer, nullable=True)
-    # 0.0 ignore Camelot ... 1.0 strict +/-1
-    key_strictness: Mapped[float] = mapped_column(
-        Float, nullable=False, default=0.2, server_default="0.2"
-    )
-
-    # "draft" | "locked" | "exported"
-    status: Mapped[str] = mapped_column(
-        String(20), nullable=False, default="draft", server_default="draft"
-    )
-    # "private" | "invite_only"  (v3 enforced)
-    sharing_mode: Mapped[str] = mapped_column(
-        String(20), nullable=False, default="private", server_default="private"
-    )
-
-    tidal_playlist_id: Mapped[str | None] = mapped_column(String(100), nullable=True)
-    exported_at: Mapped[datetime | None] = mapped_column(DateTime, nullable=True)
-
-    created_at: Mapped[datetime] = mapped_column(DateTime, default=utcnow)
-    updated_at: Mapped[datetime] = mapped_column(DateTime, default=utcnow, onupdate=utcnow)
-
-    slots: Mapped[list["SetSlot"]] = relationship(
-        "SetSlot",
-        back_populates="set",
-        cascade="all, delete-orphan",
-        passive_deletes=True,
-    )
-    curve_points: Mapped[list["SetCurvePoint"]] = relationship(
-        "SetCurvePoint",
-        back_populates="set",
-        cascade="all, delete-orphan",
-        passive_deletes=True,
-    )
-    collaborators: Mapped[list["SetCollaborator"]] = relationship(
-        "SetCollaborator",
-        back_populates="set",
-        cascade="all, delete-orphan",
-        passive_deletes=True,
-    )
-
-
-class SetSlot(Base):
-    __tablename__ = "set_slots"
-
-    id: Mapped[int] = mapped_column(primary_key=True)
-    set_id: Mapped[int] = mapped_column(
-        ForeignKey("sets.id", ondelete="CASCADE"), nullable=False, index=True
-    )
-    position: Mapped[int] = mapped_column(Integer, nullable=False)
-    track_id: Mapped[str | None] = mapped_column(String(255), nullable=True, index=True)
-    locked: Mapped[bool] = mapped_column(
-        Boolean, nullable=False, default=False, server_default="0"
-    )
-    notes: Mapped[str | None] = mapped_column(Text, nullable=True)
-    transition_score: Mapped[float | None] = mapped_column(Float, nullable=True)
-    transition_warnings: Mapped[str | None] = mapped_column(Text, nullable=True)  # JSON
-
-    set: Mapped["Set"] = relationship("Set", back_populates="slots")
-
-
-class SetCurvePoint(Base):
-    __tablename__ = "set_curve_points"
-
-    id: Mapped[int] = mapped_column(primary_key=True)
-    set_id: Mapped[int] = mapped_column(
-        ForeignKey("sets.id", ondelete="CASCADE"), nullable=False, index=True
-    )
-    position_sec: Mapped[int] = mapped_column(Integer, nullable=False)
-    energy: Mapped[int] = mapped_column(Integer, nullable=False)  # 0-10
-    label: Mapped[str | None] = mapped_column(String(50), nullable=True)
-    is_slow_window_start: Mapped[bool] = mapped_column(
-        Boolean, nullable=False, default=False, server_default="0"
-    )
-    is_slow_window_end: Mapped[bool] = mapped_column(
-        Boolean, nullable=False, default=False, server_default="0"
-    )
-
-    set: Mapped["Set"] = relationship("Set", back_populates="curve_points")
-
-
-class SetCollaborator(Base):
-    """Modeled v1, enforced v3."""
-
-    __tablename__ = "set_collaborators"
-
-    id: Mapped[int] = mapped_column(primary_key=True)
-    set_id: Mapped[int] = mapped_column(
-        ForeignKey("sets.id", ondelete="CASCADE"), nullable=False, index=True
-    )
-    user_id: Mapped[int] = mapped_column(
-        ForeignKey("users.id", ondelete="CASCADE"), nullable=False, index=True
-    )
-    role: Mapped[str] = mapped_column(String(20), nullable=False)  # "editor" | "viewer"
-    invited_by: Mapped[int | None] = mapped_column(
-        ForeignKey("users.id", ondelete="SET NULL"), nullable=True
-    )
-    invited_at: Mapped[datetime] = mapped_column(DateTime, default=utcnow)
-
-    set: Mapped["Set"] = relationship("Set", back_populates="collaborators")
-```
-
-- [ ] **Step 4: Register models in the package `__init__`**
-
-In `server/app/models/__init__.py`, add (after the `from app.models.search_cache import SearchCache` line, keeping rough alpha order — `set` sorts after `search_cache`):
-
-```python
-from app.models.set import Set, SetCollaborator, SetCurvePoint, SetSlot
-```
-
-Add `"Set"`, `"SetCollaborator"`, `"SetCurvePoint"`, `"SetSlot"` to `__all__` (after `"SearchCache"`).
-
-- [ ] **Step 5: Run the tests to verify they pass**
-
-Run: `cd server && .venv/bin/pytest tests/test_setbuilder_models.py -v`
-Expected: all PASS (8 tests total: 4 from Task 1, 4 here).
-
-- [ ] **Step 6: Commit**
-
-```bash
-git add server/app/models/set.py server/app/models/__init__.py server/tests/test_setbuilder_models.py
-git commit -m "feat(setbuilder): add Set/SetSlot/SetCurvePoint/SetCollaborator models"
-```
-
----
-
-## Task 3: Alembic migration for all 6 tables
-
-**Files:**
-- Create: `server/alembic/versions/046_add_setbuilder_tables.py`
-
-The current single head is `a11334c031bb`. The new migration goes ON TOP of it (`down_revision = "a11334c031bb"`). The migration must EXACTLY match the models (CI runs `alembic check`).
-
-- [ ] **Step 1: Write the migration**
-
-Create `server/alembic/versions/046_add_setbuilder_tables.py`:
-
-```python
-"""Add WrzDJSet Phase 0 tables (sets, slots, curve points, collaborators, vibes)
-
-Revision ID: 046
-Revises: a11334c031bb
-Create Date: 2026-06-07 00:00:00.000000
-
-"""
-
-from collections.abc import Sequence
-
-import sqlalchemy as sa
-
-from alembic import op
-
-# revision identifiers, used by Alembic.
-revision: str = "046"
-down_revision: str | None = "a11334c031bb"
-branch_labels: str | Sequence[str] | None = None
-depends_on: str | Sequence[str] | None = None
-
-
-def upgrade() -> None:
-    op.create_table(
-        "sets",
-        sa.Column("id", sa.Integer(), primary_key=True),
-        sa.Column(
-            "owner_id",
-            sa.Integer(),
-            sa.ForeignKey("users.id", ondelete="CASCADE"),
-            nullable=False,
-        ),
-        sa.Column(
-            "event_id",
-            sa.Integer(),
-            sa.ForeignKey("events.id", ondelete="SET NULL"),
-            nullable=True,
-        ),
-        sa.Column("name", sa.String(120), nullable=False),
-        sa.Column("vibe_theme", sa.String(50), nullable=True),
-        sa.Column("target_duration_sec", sa.Integer(), nullable=True),
-        sa.Column("bpm_floor", sa.Integer(), nullable=True),
-        sa.Column("bpm_ceiling", sa.Integer(), nullable=True),
-        sa.Column("key_strictness", sa.Float(), nullable=False, server_default="0.2"),
-        sa.Column("status", sa.String(20), nullable=False, server_default="draft"),
-        sa.Column("sharing_mode", sa.String(20), nullable=False, server_default="private"),
-        sa.Column("tidal_playlist_id", sa.String(100), nullable=True),
-        sa.Column("exported_at", sa.DateTime(), nullable=True),
-        sa.Column("created_at", sa.DateTime(), nullable=True),
-        sa.Column("updated_at", sa.DateTime(), nullable=True),
-    )
-    op.create_index("ix_sets_owner_id", "sets", ["owner_id"])
-    op.create_index("ix_sets_event_id", "sets", ["event_id"])
-
-    op.create_table(
-        "set_slots",
-        sa.Column("id", sa.Integer(), primary_key=True),
-        sa.Column(
-            "set_id",
-            sa.Integer(),
-            sa.ForeignKey("sets.id", ondelete="CASCADE"),
-            nullable=False,
-        ),
-        sa.Column("position", sa.Integer(), nullable=False),
-        sa.Column("track_id", sa.String(255), nullable=True),
-        sa.Column("locked", sa.Boolean(), nullable=False, server_default="0"),
-        sa.Column("notes", sa.Text(), nullable=True),
-        sa.Column("transition_score", sa.Float(), nullable=True),
-        sa.Column("transition_warnings", sa.Text(), nullable=True),
-    )
-    op.create_index("ix_set_slots_set_id", "set_slots", ["set_id"])
-    op.create_index("ix_set_slots_track_id", "set_slots", ["track_id"])
-
-    op.create_table(
-        "set_curve_points",
-        sa.Column("id", sa.Integer(), primary_key=True),
-        sa.Column(
-            "set_id",
-            sa.Integer(),
-            sa.ForeignKey("sets.id", ondelete="CASCADE"),
-            nullable=False,
-        ),
-        sa.Column("position_sec", sa.Integer(), nullable=False),
-        sa.Column("energy", sa.Integer(), nullable=False),
-        sa.Column("label", sa.String(50), nullable=True),
-        sa.Column("is_slow_window_start", sa.Boolean(), nullable=False, server_default="0"),
-        sa.Column("is_slow_window_end", sa.Boolean(), nullable=False, server_default="0"),
-    )
-    op.create_index("ix_set_curve_points_set_id", "set_curve_points", ["set_id"])
-
-    op.create_table(
-        "set_collaborators",
-        sa.Column("id", sa.Integer(), primary_key=True),
-        sa.Column(
-            "set_id",
-            sa.Integer(),
-            sa.ForeignKey("sets.id", ondelete="CASCADE"),
-            nullable=False,
-        ),
-        sa.Column(
-            "user_id",
-            sa.Integer(),
-            sa.ForeignKey("users.id", ondelete="CASCADE"),
-            nullable=False,
-        ),
-        sa.Column("role", sa.String(20), nullable=False),
-        sa.Column(
-            "invited_by",
-            sa.Integer(),
-            sa.ForeignKey("users.id", ondelete="SET NULL"),
-            nullable=True,
-        ),
-        sa.Column("invited_at", sa.DateTime(), nullable=True),
-    )
-    op.create_index("ix_set_collaborators_set_id", "set_collaborators", ["set_id"])
-    op.create_index("ix_set_collaborators_user_id", "set_collaborators", ["user_id"])
-
-    op.create_table(
-        "track_vibes",
-        sa.Column("id", sa.Integer(), primary_key=True),
-        sa.Column("track_id", sa.String(255), nullable=False),
-        sa.Column("energy", sa.Integer(), nullable=True),
-        sa.Column("mood", sa.String(50), nullable=True),
-        sa.Column("era", sa.String(50), nullable=True),
-        sa.Column("sing_along", sa.Boolean(), nullable=True),
-        sa.Column("dance_floor", sa.Boolean(), nullable=True),
-        sa.Column("transitional_role", sa.String(20), nullable=True),
-        sa.Column("confidence", sa.Float(), nullable=True),
-        sa.Column("llm_provider", sa.String(50), nullable=False),
-        sa.Column("llm_model", sa.String(100), nullable=False),
-        sa.Column("prompt_version", sa.String(20), nullable=False),
-        sa.Column("schema_version", sa.String(20), nullable=False),
-        sa.Column("created_at", sa.DateTime(), nullable=True),
-        sa.UniqueConstraint(
-            "track_id",
-            "llm_provider",
-            "llm_model",
-            "prompt_version",
-            "schema_version",
-            name="uq_track_vibe_identity",
-        ),
-    )
-    op.create_index("ix_track_vibes_track_id", "track_vibes", ["track_id"])
-
-    op.create_table(
-        "track_vibe_overrides",
-        sa.Column("id", sa.Integer(), primary_key=True),
-        sa.Column("track_id", sa.String(255), nullable=False),
-        sa.Column("user_id", sa.Integer(), nullable=False),
-        sa.Column("energy_override", sa.Integer(), nullable=True),
-        sa.Column("mood_override", sa.String(50), nullable=True),
-        sa.Column("overridden_from_vibe_id", sa.Integer(), nullable=True),
-        sa.Column("energy_was", sa.Integer(), nullable=True),
-        sa.Column("mood_was", sa.String(50), nullable=True),
-        sa.Column("source", sa.String(30), nullable=False),
-        sa.Column("notes", sa.Text(), nullable=True),
-        sa.Column("created_at", sa.DateTime(), nullable=True),
-    )
-    op.create_index("ix_track_vibe_overrides_track_id", "track_vibe_overrides", ["track_id"])
-    op.create_index("ix_track_vibe_overrides_user_id", "track_vibe_overrides", ["user_id"])
-
-
-def downgrade() -> None:
-    op.drop_index("ix_track_vibe_overrides_user_id")
-    op.drop_index("ix_track_vibe_overrides_track_id")
-    op.drop_table("track_vibe_overrides")
-    op.drop_index("ix_track_vibes_track_id")
-    op.drop_table("track_vibes")
-    op.drop_index("ix_set_collaborators_user_id")
-    op.drop_index("ix_set_collaborators_set_id")
-    op.drop_table("set_collaborators")
-    op.drop_index("ix_set_curve_points_set_id")
-    op.drop_table("set_curve_points")
-    op.drop_index("ix_set_slots_track_id")
-    op.drop_index("ix_set_slots_set_id")
-    op.drop_table("set_slots")
-    op.drop_index("ix_sets_event_id")
-    op.drop_index("ix_sets_owner_id")
-    op.drop_table("sets")
-```
-
-- [ ] **Step 2: Apply the migration and verify no drift**
-
-Ensure the dev DB is up (`docker compose up -d db` from the worktree root if needed).
-Run: `cd server && .venv/bin/alembic upgrade head && .venv/bin/alembic check`
-Expected: `alembic upgrade head` runs without error; `alembic check` prints `No new upgrade operations detected.`
-
-If `alembic check` reports drift, reconcile the migration column types/nullability/server_default/indexes with the models until it is clean. Common cause: a model column with `index=True` lacks a matching `op.create_index`, or a `server_default` mismatch.
-
-- [ ] **Step 3: Commit**
-
-```bash
-git add server/alembic/versions/046_add_setbuilder_tables.py
-git commit -m "feat(setbuilder): add migration 046 for setbuilder tables"
-```
-
----
-
-## Task 4: LLM gateway interface stub
-
-**Files:**
-- Create: `server/app/services/llm/__init__.py`
-- Create: `server/app/services/llm/gateway.py`
-- Test: `server/tests/test_llm_gateway.py`
-
-The gateway is the ONLY surface setbuilder code calls for LLM work. Its temporary implementation delegates to the existing Anthropic path inside `llm_client.py`. **No provider SDK import lives in setbuilder code** — the `anthropic` import stays confined to `services/recommendation/llm_client.py`, which `gateway.py` reuses indirectly.
-
-- [ ] **Step 1: Write the failing test**
-
-Create `server/tests/test_llm_gateway.py`:
-
-```python
-"""Tests for the provider-agnostic LLM gateway stub (Phase 0).
-
-The gateway is the single surface WrzDJSet codes against. Phase 0 ships an
-interface + a temporary delegating implementation. These tests pin the
-interface shape and the normalization contract, NOT the live LLM.
-"""
-
-import ast
-from pathlib import Path
-
-import pytest
-
-from app.services.llm import gateway
-
-
-def test_gateway_response_shape():
-    resp = gateway.GatewayResponse(tool_calls=[{"name": "x", "input": {}}], text="hi")
-    assert resp.tool_calls == [{"name": "x", "input": {}}]
-    assert resp.text == "hi"
-
-
-def test_gateway_response_defaults():
-    resp = gateway.GatewayResponse()
-    assert resp.tool_calls == []
-    assert resp.text == ""
-
-
-def test_model_hint_literal_values_documented():
-    # The two documented hints from the exec summary.
-    assert gateway.MODEL_HINTS == ("fast", "strong")
-
-
-@pytest.mark.asyncio
-async def test_dispatch_normalizes_delegated_response(monkeypatch):
-    """dispatch() returns a GatewayResponse normalized from the provider call."""
-
-    class _FakeBlock:
-        def __init__(self, type, **kw):
-            self.type = type
-            for k, v in kw.items():
-                setattr(self, k, v)
-
-    class _FakeResponse:
-        content = [
-            _FakeBlock("text", text="thinking"),
-            _FakeBlock("tool_use", name="critique_set", input={"grade": "A"}),
-        ]
-
-    async def _fake_raw_call(*, model, system, tools, tool_choice, messages, max_tokens):
-        # Assert the gateway passed a concrete model string (data, not import).
-        assert isinstance(model, str) and model
-        return _FakeResponse()
-
-    monkeypatch.setattr(gateway, "_raw_provider_call", _fake_raw_call)
-
-    result = await gateway.dispatch(
-        messages=[{"role": "user", "content": "grade this set"}],
-        tool={"name": "critique_set", "input_schema": {"type": "object"}},
-        model_hint="strong",
-    )
-    assert isinstance(result, gateway.GatewayResponse)
-    assert result.text == "thinking"
-    assert result.tool_calls == [{"name": "critique_set", "input": {"grade": "A"}}]
-
-
-def test_no_provider_sdk_import_in_gateway_module():
-    """gateway.py must not import a provider SDK directly (anthropic/openai/etc.)."""
-    src = Path(gateway.__file__).read_text()
-    tree = ast.parse(src)
-    banned = {"anthropic", "openai", "google", "cohere", "mistralai", "litellm"}
-    for node in ast.walk(tree):
-        if isinstance(node, ast.Import):
-            for alias in node.names:
-                assert alias.name.split(".")[0] not in banned
-        elif isinstance(node, ast.ImportFrom):
-            root = (node.module or "").split(".")[0]
-            assert root not in banned
-```
-
-- [ ] **Step 2: Run the tests to verify they fail**
-
-Run: `cd server && .venv/bin/pytest tests/test_llm_gateway.py -v`
-Expected: FAIL with `ModuleNotFoundError: No module named 'app.services.llm'`
-
-- [ ] **Step 3: Create the package marker and gateway implementation**
-
-Create `server/app/services/llm/__init__.py`:
-
-```python
-"""Provider-agnostic LLM gateway package.
-
-WrzDJSet (and any future agentic feature) MUST call LLMs only through
-`app.services.llm.gateway`. Direct provider SDK imports are forbidden in
-feature code — provider/model identifiers are data, not imports.
-"""
-```
-
-Create `server/app/services/llm/gateway.py`:
-
-```python
-"""Provider-agnostic LLM gateway (Phase 0 interface stub).
-
-This is the single call surface WrzDJSet codes against. The real gateway
-(OAuth multi-provider dispatch) ships in a parallel worktree; until it merges
-this stub delegates to the existing Anthropic path in
-`services/recommendation/llm_client.py`. Per exec-summary 6/9 ("slip
-insurance"), WrzDJSet is NOT blocked on the gateway merge.
-
-CRITICAL: no provider SDK is imported here. Model identifiers are plain
-strings resolved from a model_hint. The actual provider call is isolated in
-`_raw_provider_call`, which reuses the existing recommendation LLM plumbing.
-"""
-
-from dataclasses import dataclass, field
-from typing import Any, Literal
-
-ModelHint = Literal["fast", "strong"]
-MODEL_HINTS: tuple[str, ...] = ("fast", "strong")
-
-
-@dataclass
-class GatewayResponse:
-    """Normalized LLM response: tool calls + free text, provider-agnostic."""
-
-    tool_calls: list[dict[str, Any]] = field(default_factory=list)
-    text: str = ""
-
-
-def _resolve_model(model_hint: ModelHint) -> str:
-    """Map a coarse capability hint to a concrete model string.
-
-    Reads the configured Anthropic model for the temporary delegating impl.
-    When the OAuth gateway lands this becomes a provider-aware lookup driven
-    by SystemSettings; the hint contract ("fast" vs "strong") stays stable.
-    """
-    from app.core.config import get_settings
-
-    settings = get_settings()
-    # Phase 0: single-provider delegation. Both hints resolve to the
-    # configured model; the gateway epic differentiates fast/strong tiers.
-    return settings.anthropic_model
-
-
-async def _raw_provider_call(
-    *,
-    model: str,
-    system: str,
-    tools: list[dict[str, Any]],
-    tool_choice: dict[str, Any] | None,
-    messages: list[dict[str, Any]],
-    max_tokens: int,
-) -> Any:
-    """Isolated provider call. Reuses the existing recommendation LLM client.
-
-    Importing the client lazily and locally keeps any provider SDK transitively
-    out of this module's import graph at module scope and out of feature code.
-    """
-    from anthropic import AsyncAnthropic  # noqa: PLC0415 — isolation point
-
-    from app.core.config import get_settings
-
-    settings = get_settings()
-    client = AsyncAnthropic(
-        api_key=settings.anthropic_api_key,
-        timeout=settings.anthropic_timeout_seconds,
-    )
-    kwargs: dict[str, Any] = {
-        "model": model,
-        "max_tokens": max_tokens,
-        "messages": messages,
-    }
-    if system:
-        kwargs["system"] = system
-    if tools:
-        kwargs["tools"] = tools
-    if tool_choice:
-        kwargs["tool_choice"] = tool_choice
-    return await client.messages.create(**kwargs)
-
-
-def _normalize(response: Any) -> GatewayResponse:
-    """Translate a provider response into the normalized GatewayResponse."""
-    text = ""
-    tool_calls: list[dict[str, Any]] = []
-    for block in getattr(response, "content", []) or []:
-        btype = getattr(block, "type", None)
-        if btype == "text":
-            text += getattr(block, "text", "")
-        elif btype == "tool_use":
-            tool_calls.append(
-                {"name": getattr(block, "name", ""), "input": getattr(block, "input", {})}
-            )
-    return GatewayResponse(tool_calls=tool_calls, text=text)
-
-
-async def dispatch(
-    *,
-    messages: list[dict[str, Any]],
-    tool: dict[str, Any] | None = None,
-    system: str = "",
-    model_hint: ModelHint = "fast",
-    max_tokens: int = 2048,
-) -> GatewayResponse:
-    """Dispatch a single LLM turn and return a normalized response.
-
-    Args:
-        messages: provider-agnostic message list ([{"role", "content"}]).
-        tool: a single JSONSchema tool spec ({"name", "input_schema"});
-            when provided, the gateway forces tool use.
-        system: optional system prompt.
-        model_hint: "fast" (batch/chat) or "strong" (critique/grading).
-        max_tokens: response token cap.
-
-    Returns:
-        GatewayResponse with `tool_calls` and `text`.
-    """
-    model = _resolve_model(model_hint)
-    tools = [tool] if tool else []
-    tool_choice = {"type": "tool", "name": tool["name"]} if tool else None
-    response = await _raw_provider_call(
-        model=model,
-        system=system,
-        tools=tools,
-        tool_choice=tool_choice,
-        messages=messages,
-        max_tokens=max_tokens,
-    )
-    return _normalize(response)
-```
-
-Note on the test for `_raw_provider_call`: the async test monkeypatches `gateway._raw_provider_call`, so the real `anthropic` import inside it never executes during tests. The `test_no_provider_sdk_import_in_gateway_module` test only forbids **module-scope** imports — the lazy import inside `_raw_provider_call` is a function-body import, which the AST walk over the whole module WOULD catch. To keep this test passing AND honor the gateway-only rule, the `anthropic` import must NOT appear anywhere in `gateway.py`. **Revise `_raw_provider_call` to delegate to a helper in the existing `llm_client` module instead of importing `anthropic` here.**
-
-Apply this revision to `_raw_provider_call` in `gateway.py`:
-
-```python
-async def _raw_provider_call(
-    *,
-    model: str,
-    system: str,
-    tools: list[dict[str, Any]],
-    tool_choice: dict[str, Any] | None,
-    messages: list[dict[str, Any]],
-    max_tokens: int,
-) -> Any:
-    """Isolated provider call. Delegates to the existing recommendation client.
-
-    The provider SDK import lives ONLY in services/recommendation/llm_client.py.
-    This module never imports a provider SDK (enforced by test).
-    """
-    from app.services.recommendation import llm_client
-
-    return await llm_client.raw_messages_create(
-        model=model,
-        system=system,
-        tools=tools,
-        tool_choice=tool_choice,
-        messages=messages,
-        max_tokens=max_tokens,
-    )
-```
-
-And add the thin reusable helper to `server/app/services/recommendation/llm_client.py` (append near `call_llm`):
-
-```python
-async def raw_messages_create(
-    *,
-    model: str,
-    system: str,
-    tools: list[dict] | None,
-    tool_choice: dict | None,
-    messages: list[dict],
-    max_tokens: int,
-):
-    """Low-level Anthropic messages.create passthrough.
-
-    Exists so the provider-agnostic gateway can delegate here without importing
-    a provider SDK itself. The `anthropic` import stays confined to this module.
-    """
-    settings = get_settings()
-    client = AsyncAnthropic(
-        api_key=settings.anthropic_api_key,
-        timeout=settings.anthropic_timeout_seconds,
-    )
-    kwargs: dict = {"model": model, "max_tokens": max_tokens, "messages": messages}
-    if system:
-        kwargs["system"] = system
-    if tools:
-        kwargs["tools"] = tools
-    if tool_choice:
-        kwargs["tool_choice"] = tool_choice
-    return await client.messages.create(**kwargs)
-```
-
-- [ ] **Step 4: Run the tests to verify they pass**
-
-Run: `cd server && .venv/bin/pytest tests/test_llm_gateway.py -v`
-Expected: all PASS (5 tests). If `test_no_provider_sdk_import_in_gateway_module` fails, confirm `gateway.py` has zero `anthropic`/provider imports (the delegation goes through `llm_client.raw_messages_create`).
-
-- [ ] **Step 5: Commit**
-
-```bash
-git add server/app/services/llm/ server/app/services/recommendation/llm_client.py server/tests/test_llm_gateway.py
-git commit -m "feat(setbuilder): add provider-agnostic LLM gateway stub"
-```
-
----
-
-## Task 5: Set CRUD service + Pydantic schemas
-
-**Files:**
-- Create: `server/app/schemas/setbuilder.py`
-- Create: `server/app/services/setbuilder/__init__.py`
-- Create: `server/app/services/setbuilder/set_service.py`
-- Test: covered by Task 6's API tests (the service is exercised through the router). No standalone service test — boundary tests at the API beat internal unit tests here.
-
-- [ ] **Step 1: Write the Pydantic schemas**
-
-Create `server/app/schemas/setbuilder.py`:
-
-```python
-"""Pydantic schemas for WrzDJSet set-CRUD endpoints (Phase 0)."""
-
-from datetime import datetime
-from typing import Literal
-
-from pydantic import BaseModel, ConfigDict, Field
-
-
-class SetCreate(BaseModel):
-    """Body for creating a new (empty) set."""
-
-    name: str = Field(..., min_length=1, max_length=120)
-    event_id: int | None = None
-
-
-class SetRename(BaseModel):
-    """Body for renaming a set."""
-
-    name: str = Field(..., min_length=1, max_length=120)
-
-
-class SetSummary(BaseModel):
-    """Set list item (no children)."""
-
-    model_config = ConfigDict(from_attributes=True)
-
-    id: int
-    name: str
-    event_id: int | None
-    status: Literal["draft", "locked", "exported"]
-    sharing_mode: Literal["private", "invite_only"]
-    created_at: datetime
-    updated_at: datetime
-
-
-class SetDetail(SetSummary):
-    """Full set record (Phase 0: no slot/curve expansion yet)."""
-
-    vibe_theme: str | None
-    target_duration_sec: int | None
-    bpm_floor: int | None
-    bpm_ceiling: int | None
-    key_strictness: float
-    tidal_playlist_id: str | None
-    exported_at: datetime | None
-```
-
-- [ ] **Step 2: Write the service package marker and CRUD logic**
-
-Create `server/app/services/setbuilder/__init__.py`:
-
-```python
-"""WrzDJSet backend services (Phase 0)."""
-```
-
-Create `server/app/services/setbuilder/set_service.py`:
-
-```python
-"""Owner-scoped CRUD for WrzDJSet sets (Phase 0).
-
-All reads/mutations are scoped to the owner. The API layer surfaces a 404
-(not 403) for a missing-or-unowned set to avoid leaking existence, matching
-the rest of WrzDJ (see deps.get_owned_event_by_id).
-"""
-
-from sqlalchemy.orm import Session
-
-from app.models.set import Set
-
-
-def create_set(db: Session, owner_id: int, name: str, event_id: int | None = None) -> Set:
-    """Create a new empty set owned by `owner_id`."""
-    new_set = Set(owner_id=owner_id, name=name, event_id=event_id)
-    db.add(new_set)
-    db.commit()
-    db.refresh(new_set)
-    return new_set
-
-
-def list_sets(db: Session, owner_id: int) -> list[Set]:
-    """List the owner's sets, newest first."""
-    return (
-        db.query(Set)
-        .filter(Set.owner_id == owner_id)
-        .order_by(Set.created_at.desc())
-        .all()
-    )
-
-
-def get_owned_set(db: Session, set_id: int, owner_id: int) -> Set | None:
-    """Fetch a set by id, scoped to the owner. None if missing or unowned."""
-    return (
-        db.query(Set)
-        .filter(Set.id == set_id, Set.owner_id == owner_id)
-        .one_or_none()
-    )
-
-
-def rename_set(db: Session, set_obj: Set, name: str) -> Set:
-    """Rename a set."""
-    set_obj.name = name
-    db.commit()
-    db.refresh(set_obj)
-    return set_obj
-
-
-def delete_set(db: Session, set_obj: Set) -> None:
-    """Delete a set (children cascade via FK ondelete + ORM cascade)."""
-    db.delete(set_obj)
-    db.commit()
-```
-
-- [ ] **Step 3: Run the existing suite to confirm nothing imports break**
-
-Run: `cd server && .venv/bin/pytest tests/test_setbuilder_models.py -q`
-Expected: PASS (imports resolve; no regressions).
-
-- [ ] **Step 4: Commit**
-
-```bash
-git add server/app/schemas/setbuilder.py server/app/services/setbuilder/
-git commit -m "feat(setbuilder): add set schemas + owner-scoped CRUD service"
-```
-
----
-
-## Task 6: Setbuilder API router + registration
-
-**Files:**
-- Create: `server/app/api/setbuilder.py`
-- Modify: `server/app/api/__init__.py`
-- Test: `server/tests/test_setbuilder_api.py`
-
-- [ ] **Step 1: Write the failing API tests**
-
-Create `server/tests/test_setbuilder_api.py`:
-
-```python
-"""API tests for /api/setbuilder set CRUD (Phase 0).
-
-Pins auth gating (pending users rejected, unauthenticated rejected),
-owner isolation (404 on another DJ's set), and the create/list/get/
-rename/delete happy paths.
-"""
-
-from app.services.auth import get_password_hash
-
-
-def _make_second_dj(db):
-    from app.models.user import User
-
-    user = User(username="otherdj", password_hash=get_password_hash("x" * 12), role="dj")
-    db.add(user)
-    db.commit()
-    db.refresh(user)
-    return user
-
-
-def _login(client, username, password):
-    resp = client.post("/api/auth/login", data={"username": username, "password": password})
-    assert resp.status_code == 200, resp.json()
-    return {"Authorization": f"Bearer {resp.json()['access_token']}"}
-
-
-def test_create_set(client, auth_headers):
-    resp = client.post("/api/setbuilder/sets", json={"name": "Friday Set"}, headers=auth_headers)
-    assert resp.status_code == 201, resp.json()
-    body = resp.json()
-    assert body["name"] == "Friday Set"
-    assert body["status"] == "draft"
-    assert body["sharing_mode"] == "private"
-    assert body["id"] > 0
-
-
-def test_create_set_requires_auth(client):
-    resp = client.post("/api/setbuilder/sets", json={"name": "X"})
-    assert resp.status_code == 401
-
-
-def test_create_set_rejects_pending_user(client, pending_headers):
-    resp = client.post("/api/setbuilder/sets", json={"name": "X"}, headers=pending_headers)
-    assert resp.status_code == 403
-
-
-def test_create_set_validates_name(client, auth_headers):
-    resp = client.post("/api/setbuilder/sets", json={"name": ""}, headers=auth_headers)
-    assert resp.status_code == 422
-
-
-def test_list_sets_only_owner(client, auth_headers, db):
-    client.post("/api/setbuilder/sets", json={"name": "Mine"}, headers=auth_headers)
-    other = _make_second_dj(db)
-    other_headers = _login(client, "otherdj", "xxxxxxxxxxxx")
-    client.post("/api/setbuilder/sets", json={"name": "Theirs"}, headers=other_headers)
-
-    resp = client.get("/api/setbuilder/sets", headers=auth_headers)
-    assert resp.status_code == 200
-    names = [s["name"] for s in resp.json()]
-    assert names == ["Mine"]
-
-
-def test_get_set(client, auth_headers):
-    created = client.post(
-        "/api/setbuilder/sets", json={"name": "Detail"}, headers=auth_headers
-    ).json()
-    resp = client.get(f"/api/setbuilder/sets/{created['id']}", headers=auth_headers)
-    assert resp.status_code == 200
-    assert resp.json()["key_strictness"] == 0.2
-
-
-def test_get_other_dj_set_returns_404(client, auth_headers, db):
-    other = _make_second_dj(db)
-    other_headers = _login(client, "otherdj", "xxxxxxxxxxxx")
-    theirs = client.post(
-        "/api/setbuilder/sets", json={"name": "Theirs"}, headers=other_headers
-    ).json()
-    resp = client.get(f"/api/setbuilder/sets/{theirs['id']}", headers=auth_headers)
-    assert resp.status_code == 404
-
-
-def test_rename_set(client, auth_headers):
-    created = client.post(
-        "/api/setbuilder/sets", json={"name": "Old"}, headers=auth_headers
-    ).json()
-    resp = client.patch(
-        f"/api/setbuilder/sets/{created['id']}", json={"name": "New"}, headers=auth_headers
-    )
-    assert resp.status_code == 200
-    assert resp.json()["name"] == "New"
-
-
-def test_rename_other_dj_set_returns_404(client, auth_headers, db):
-    other = _make_second_dj(db)
-    other_headers = _login(client, "otherdj", "xxxxxxxxxxxx")
-    theirs = client.post(
-        "/api/setbuilder/sets", json={"name": "Theirs"}, headers=other_headers
-    ).json()
-    resp = client.patch(
-        f"/api/setbuilder/sets/{theirs['id']}", json={"name": "Hax"}, headers=auth_headers
-    )
-    assert resp.status_code == 404
-
-
-def test_delete_set(client, auth_headers):
-    created = client.post(
-        "/api/setbuilder/sets", json={"name": "Doomed"}, headers=auth_headers
-    ).json()
-    resp = client.delete(f"/api/setbuilder/sets/{created['id']}", headers=auth_headers)
-    assert resp.status_code == 204
-    assert client.get(
-        f"/api/setbuilder/sets/{created['id']}", headers=auth_headers
-    ).status_code == 404
-
-
-def test_delete_other_dj_set_returns_404(client, auth_headers, db):
-    other = _make_second_dj(db)
-    other_headers = _login(client, "otherdj", "xxxxxxxxxxxx")
-    theirs = client.post(
-        "/api/setbuilder/sets", json={"name": "Theirs"}, headers=other_headers
-    ).json()
-    resp = client.delete(f"/api/setbuilder/sets/{theirs['id']}", headers=auth_headers)
-    assert resp.status_code == 404
-```
-
-- [ ] **Step 2: Run the tests to verify they fail**
-
-Run: `cd server && .venv/bin/pytest tests/test_setbuilder_api.py -v`
-Expected: FAIL (404 on every route — router not registered yet).
-
-- [ ] **Step 3: Write the router**
-
-Create `server/app/api/setbuilder.py`:
-
-```python
-"""WrzDJSet set-CRUD router (Phase 0).
-
-Mounted at /api/setbuilder. Every endpoint requires an active DJ
-(get_current_active_user rejects pending users). Sets are owner-private;
-missing-or-unowned sets return 404 to avoid leaking existence.
-"""
-
-from fastapi import APIRouter, Depends, HTTPException, Request, status
-from sqlalchemy.orm import Session
-
-from app.api.deps import get_current_active_user, get_db
-from app.core.rate_limit import limiter
-from app.models.user import User
-from app.schemas.setbuilder import SetCreate, SetDetail, SetRename, SetSummary
-from app.services.setbuilder import set_service
-
-router = APIRouter()
-
-
-def _get_owned_or_404(db: Session, set_id: int, user: User):
-    set_obj = set_service.get_owned_set(db, set_id, user.id)
-    if set_obj is None:
-        raise HTTPException(status_code=404, detail="Set not found")
-    return set_obj
-
-
-@router.post("/sets", response_model=SetDetail, status_code=status.HTTP_201_CREATED)
-@limiter.limit("30/minute")
-def create_set(
-    payload: SetCreate,
-    request: Request,
-    db: Session = Depends(get_db),
-    current_user: User = Depends(get_current_active_user),
-) -> SetDetail:
-    """Create a new empty set owned by the current DJ."""
-    set_obj = set_service.create_set(
-        db, owner_id=current_user.id, name=payload.name, event_id=payload.event_id
-    )
-    return SetDetail.model_validate(set_obj)
-
-
-@router.get("/sets", response_model=list[SetSummary])
-@limiter.limit("60/minute")
-def list_sets(
-    request: Request,
-    db: Session = Depends(get_db),
-    current_user: User = Depends(get_current_active_user),
-) -> list[SetSummary]:
-    """List the current DJ's sets, newest first."""
-    return [SetSummary.model_validate(s) for s in set_service.list_sets(db, current_user.id)]
-
-
-@router.get("/sets/{set_id}", response_model=SetDetail)
-@limiter.limit("60/minute")
-def get_set(
-    set_id: int,
-    request: Request,
-    db: Session = Depends(get_db),
-    current_user: User = Depends(get_current_active_user),
-) -> SetDetail:
-    """Get one of the current DJ's sets, or 404."""
-    return SetDetail.model_validate(_get_owned_or_404(db, set_id, current_user))
-
-
-@router.patch("/sets/{set_id}", response_model=SetDetail)
-@limiter.limit("30/minute")
-def rename_set(
-    set_id: int,
-    payload: SetRename,
-    request: Request,
-    db: Session = Depends(get_db),
-    current_user: User = Depends(get_current_active_user),
-) -> SetDetail:
-    """Rename one of the current DJ's sets, or 404."""
-    set_obj = _get_owned_or_404(db, set_id, current_user)
-    return SetDetail.model_validate(set_service.rename_set(db, set_obj, payload.name))
-
-
-@router.delete("/sets/{set_id}", status_code=status.HTTP_204_NO_CONTENT)
-@limiter.limit("30/minute")
-def delete_set(
-    set_id: int,
-    request: Request,
-    db: Session = Depends(get_db),
-    current_user: User = Depends(get_current_active_user),
-) -> None:
-    """Delete one of the current DJ's sets, or 404."""
-    set_obj = _get_owned_or_404(db, set_id, current_user)
-    set_service.delete_set(db, set_obj)
-```
-
-- [ ] **Step 4: Register the router**
-
-In `server/app/api/__init__.py`, add `setbuilder` to the import block (alphabetically — after `search`/before `sse`) and add the include line near the other authenticated routers:
-
-```python
-api_router.include_router(setbuilder.router, prefix="/setbuilder", tags=["setbuilder"])
-```
-
-(place it after the `events` include, e.g. right after the `requests`/`search` includes — order among prefixed routers is cosmetic).
-
-- [ ] **Step 5: Run the tests to verify they pass**
-
-Run: `cd server && .venv/bin/pytest tests/test_setbuilder_api.py -v`
-Expected: all PASS (11 tests).
-
-- [ ] **Step 6: Run the full backend suite + lint + coverage gate**
-
-Run: `cd server && .venv/bin/ruff check . && .venv/bin/ruff format --check . && .venv/bin/bandit -r app -c pyproject.toml -q && .venv/bin/pytest --tb=short -q`
-Expected: lint clean, bandit clean, all tests pass, coverage gate satisfied. If `ruff format --check` fails, run `.venv/bin/ruff format .` and re-stage.
-
-- [ ] **Step 7: Commit**
-
-```bash
-git add server/app/api/setbuilder.py server/app/api/__init__.py server/tests/test_setbuilder_api.py
-git commit -m "feat(setbuilder): add /api/setbuilder set CRUD router"
-```
-
----
-
-## Task 7: Frontend API client types + methods
-
-**Files:**
-- Modify: `dashboard/lib/api-types.ts`
-- Modify: `dashboard/lib/api.ts`
-
-- [ ] **Step 1: Add the shared types**
-
-In `dashboard/lib/api-types.ts`, append these interfaces near the end (before the `PaginatedResponse` block is fine):
-
-```typescript
-export interface SetSummary {
-  id: number;
-  name: string;
-  event_id: number | null;
-  status: 'draft' | 'locked' | 'exported';
-  sharing_mode: 'private' | 'invite_only';
-  created_at: string;
-  updated_at: string;
-}
-
-export interface SetDetail extends SetSummary {
-  vibe_theme: string | null;
-  target_duration_sec: number | null;
-  bpm_floor: number | null;
-  bpm_ceiling: number | null;
-  key_strictness: number;
-  tidal_playlist_id: string | null;
-  exported_at: string | null;
-}
-```
-
-- [ ] **Step 2: Add the client methods**
-
-In `dashboard/lib/api.ts`:
-
-a) Add `SetSummary` and `SetDetail` to the `import type { ... } from './api-types'` block AND to the `export type { ... }` re-export block (both alphabetical lists — `SetDetail`/`SetSummary` go after `SearchResult`).
-
-b) Add these methods to the `ApiClient` class (next to `deleteEvent`):
-
-```typescript
-  async listSets(): Promise<SetSummary[]> {
-    return this.fetch('/api/setbuilder/sets');
-  }
-  async createSet(name: string, eventId?: number): Promise<SetDetail> {
-    return this.fetch('/api/setbuilder/sets', {
-      method: 'POST',
-      body: JSON.stringify({ name, event_id: eventId ?? null }),
-    });
-  }
-  async getSet(setId: number): Promise<SetDetail> {
-    return this.fetch(`/api/setbuilder/sets/${setId}`);
-  }
-  async renameSet(setId: number, name: string): Promise<SetDetail> {
-    return this.fetch(`/api/setbuilder/sets/${setId}`, {
-      method: 'PATCH',
-      body: JSON.stringify({ name }),
-    });
-  }
-  async deleteSet(setId: number): Promise<void> {
-    await this.rawFetch(`/api/setbuilder/sets/${setId}`, { method: 'DELETE' });
-  }
-```
-
-- [ ] **Step 3: Type-check**
-
-Run: `cd dashboard && npx tsc --noEmit`
-Expected: no errors.
-
-- [ ] **Step 4: Commit**
-
-```bash
-git add dashboard/lib/api-types.ts dashboard/lib/api.ts
-git commit -m "feat(setbuilder): add set CRUD methods to frontend API client"
-```
-
----
-
-## Task 8: Dashboard set-list page
-
-**Files:**
-- Create: `dashboard/app/setbuilder/page.tsx`
-- Create: `dashboard/app/setbuilder/__tests__/page.test.tsx`
-
-- [ ] **Step 1: Write the failing test**
-
-Create `dashboard/app/setbuilder/__tests__/page.test.tsx`:
-
-```tsx
-import { render, screen, waitFor } from '@testing-library/react';
-import { describe, it, expect, vi, beforeEach } from 'vitest';
-import SetbuilderPage from '../page';
-
-vi.mock('next/navigation', () => ({
-  useRouter: () => ({ push: vi.fn() }),
-}));
-
-const mockListSets = vi.fn();
-vi.mock('@/lib/api', () => ({
-  api: {
-    listSets: () => mockListSets(),
-    createSet: vi.fn(),
-    deleteSet: vi.fn(),
-    renameSet: vi.fn(),
-  },
-}));
-
-vi.mock('@/lib/auth', () => ({
-  useAuth: () => ({ isAuthenticated: true, isLoading: false, role: 'dj' }),
-}));
-
-describe('SetbuilderPage', () => {
-  beforeEach(() => {
-    mockListSets.mockReset();
-  });
-
-  it('renders the empty state when there are no sets', async () => {
-    mockListSets.mockResolvedValue([]);
-    render(<SetbuilderPage />);
-    await waitFor(() => {
-      expect(screen.getByText(/no sets yet/i)).toBeInTheDocument();
-    });
-  });
-
-  it('renders set cards from the API', async () => {
-    mockListSets.mockResolvedValue([
-      {
-        id: 1,
-        name: 'Friday Wedding',
-        event_id: null,
-        status: 'draft',
-        sharing_mode: 'private',
-        created_at: '2026-06-07T00:00:00Z',
-        updated_at: '2026-06-07T00:00:00Z',
-      },
-    ]);
-    render(<SetbuilderPage />);
-    await waitFor(() => {
-      expect(screen.getByText('Friday Wedding')).toBeInTheDocument();
-    });
-  });
-});
-```
-
-- [ ] **Step 2: Run the test to verify it fails**
-
-Run: `cd dashboard && npm test -- --run app/setbuilder`
-Expected: FAIL — cannot resolve `../page`.
-
-- [ ] **Step 3: Write the set-list page**
-
-Create `dashboard/app/setbuilder/page.tsx`:
-
-```tsx
-'use client';
-
-import { useEffect, useState } from 'react';
-import { useRouter } from 'next/navigation';
-import Link from 'next/link';
-import { useAuth } from '@/lib/auth';
-import { api } from '@/lib/api';
-import type { SetSummary } from '@/lib/api-types';
-
-export default function SetbuilderPage() {
-  const { isAuthenticated, isLoading, role } = useAuth();
-  const router = useRouter();
-  const [sets, setSets] = useState<SetSummary[]>([]);
-  const [loading, setLoading] = useState(true);
-  const [showCreate, setShowCreate] = useState(false);
-  const [newName, setNewName] = useState('');
-  const [creating, setCreating] = useState(false);
-  const [error, setError] = useState<string | null>(null);
-
-  useEffect(() => {
-    if (!isLoading && !isAuthenticated) {
-      router.push('/login');
-    } else if (!isLoading && role === 'pending') {
-      router.push('/pending');
-    }
-  }, [isAuthenticated, isLoading, role, router]);
-
-  useEffect(() => {
-    if (isAuthenticated) {
-      api
-        .listSets()
-        .then(setSets)
-        .catch(() => setError('Failed to load sets'))
-        .finally(() => setLoading(false));
-    }
-  }, [isAuthenticated]);
-
-  const handleCreate = async (e: React.FormEvent) => {
-    e.preventDefault();
-    if (!newName.trim()) return;
-    setCreating(true);
-    try {
-      const created = await api.createSet(newName.trim());
-      setSets((prev) => [created, ...prev]);
-      setNewName('');
-      setShowCreate(false);
-    } catch (err) {
-      setError(err instanceof Error ? err.message : 'Failed to create set');
-    } finally {
-      setCreating(false);
-    }
-  };
-
-  const handleDelete = async (id: number) => {
-    if (!window.confirm('Delete this set? This cannot be undone.')) return;
-    try {
-      await api.deleteSet(id);
-      setSets((prev) => prev.filter((s) => s.id !== id));
-    } catch (err) {
-      setError(err instanceof Error ? err.message : 'Failed to delete set');
-    }
-  };
-
-  if (isLoading || !isAuthenticated) {
-    return (
-      <div className="container">
-        <div className="loading">Loading...</div>
-      </div>
-    );
-  }
-
-  return (
-    <div className="container">
-      {error && (
-        <div
-          style={{
-            background: 'var(--color-danger-subtle)',
-            color: 'var(--color-danger)',
-            padding: '0.75rem 1rem',
-            borderRadius: '0.5rem',
-            marginBottom: '1rem',
-            fontSize: '0.875rem',
-          }}
-        >
-          {error}
-        </div>
-      )}
-
-      <div className="header">
-        <h1>Sets</h1>
-        <div style={{ display: 'flex', gap: '1rem', alignItems: 'center' }}>
-          <Link
-            href="/dashboard"
-            className="btn"
-            style={{ background: 'var(--surface-raised)', textDecoration: 'none', color: 'var(--text)' }}
-          >
-            Dashboard
-          </Link>
-          <button className="btn btn-primary" onClick={() => setShowCreate(true)}>
-            New Set
-          </button>
-        </div>
-      </div>
-
-      {showCreate && (
-        <div className="card" style={{ marginBottom: '2rem' }}>
-          <h2 style={{ marginBottom: '1rem' }}>Create New Set</h2>
-          <form onSubmit={handleCreate}>
-            <div className="form-group">
-              <label htmlFor="setName">Set Name</label>
-              <input
-                id="setName"
-                type="text"
-                className="input"
-                placeholder="Friday Wedding"
-                value={newName}
-                onChange={(e) => setNewName(e.target.value)}
-                maxLength={120}
-                required
-              />
-            </div>
-            <div style={{ display: 'flex', gap: '1rem' }}>
-              <button type="submit" className="btn btn-primary" disabled={creating}>
-                {creating ? 'Creating...' : 'Create'}
-              </button>
-              <button
-                type="button"
-                className="btn"
-                style={{ background: 'var(--surface-raised)' }}
-                onClick={() => setShowCreate(false)}
-              >
-                Cancel
-              </button>
-            </div>
-          </form>
-        </div>
-      )}
-
-      {loading ? (
-        <div className="loading">Loading sets...</div>
-      ) : sets.length === 0 ? (
-        <div className="card" style={{ textAlign: 'center' }}>
-          <p style={{ color: 'var(--text-secondary)' }}>No sets yet. Create your first set!</p>
-        </div>
-      ) : (
-        <div className="event-grid">
-          {sets.map((s) => (
-            <div key={s.id} className="event-card" style={{ position: 'relative' }}>
-              <Link href={`/setbuilder/${s.id}`} style={{ textDecoration: 'none', color: 'inherit' }}>
-                <h3>{s.name}</h3>
-                <div className="code">{s.status}</div>
-                <p style={{ color: 'var(--text-secondary)', fontSize: '0.875rem' }}>
-                  Updated: {new Date(s.updated_at).toLocaleString()}
-                </p>
-              </Link>
-              <button
-                className="btn btn-sm btn-danger"
-                style={{ marginTop: '0.75rem' }}
-                onClick={() => handleDelete(s.id)}
-              >
-                Delete
-              </button>
-            </div>
-          ))}
-        </div>
-      )}
-    </div>
-  );
-}
-```
-
-- [ ] **Step 4: Run the test to verify it passes**
-
-Run: `cd dashboard && npm test -- --run app/setbuilder`
-Expected: 2 PASS.
-
-- [ ] **Step 5: Commit**
-
-```bash
-git add dashboard/app/setbuilder/page.tsx dashboard/app/setbuilder/__tests__/page.test.tsx
-git commit -m "feat(setbuilder): add set-list dashboard page"
-```
-
----
-
-## Task 9: Builder workspace shell (4-panel grid)
-
-**Files:**
-- Create: `dashboard/app/setbuilder/[setId]/page.tsx`
-- Create: `dashboard/app/setbuilder/setbuilder.module.css`
-
-The exec-summary workspace is a 3-column grid (Pool 320px | center | Chat 360px) where the center stacks Curve over Timeline. The issue asks for a "4-panel grid (Pool / Curve / Timeline / Chat placeholders)". **Decision:** render all four as distinct panels in a CSS grid — Pool (left, full height), Curve (top center), Timeline (bottom center), Chat (right, full height) — using `grid-template-areas`. This satisfies "4-panel" while preserving the design's spatial intent.
-
-- [ ] **Step 1: Write the scoped CSS**
-
-Create `dashboard/app/setbuilder/setbuilder.module.css`:
-
-```css
-.workspace {
-  display: grid;
-  grid-template-columns: 320px 1fr 360px;
-  grid-template-rows: minmax(200px, 40%) 1fr;
-  grid-template-areas:
-    'pool curve chat'
-    'pool timeline chat';
-  gap: 1px;
-  height: calc(100vh - 56px);
-  background: var(--border-subtle);
-}
-
-.topbar {
-  display: flex;
-  align-items: center;
-  justify-content: space-between;
-  height: 56px;
-  padding: 0 1rem;
-  background: var(--card);
-  border-bottom: 1px solid var(--border);
-}
-
-.topbarTitle {
-  font-family: var(--font-display), sans-serif;
-  font-weight: 600;
-  font-size: 1rem;
-  color: var(--text);
-}
-
-.panel {
-  background: var(--bg);
-  display: flex;
-  flex-direction: column;
-  overflow: hidden;
-}
-
-.panelPool {
-  grid-area: pool;
-}
-.panelCurve {
-  grid-area: curve;
-}
-.panelTimeline {
-  grid-area: timeline;
-}
-.panelChat {
-  grid-area: chat;
-}
-
-.panelHeader {
-  padding: 0.75rem 1rem;
-  font-family: var(--font-display), sans-serif;
-  font-size: 0.8125rem;
-  font-weight: 600;
-  letter-spacing: 0.04em;
-  text-transform: uppercase;
-  color: var(--text-secondary);
-  border-bottom: 1px solid var(--border-subtle);
-}
-
-.panelBody {
-  flex: 1;
-  display: flex;
-  align-items: center;
-  justify-content: center;
-  padding: 1rem;
-  color: var(--text-secondary);
-  font-size: 0.875rem;
-  text-align: center;
-}
-```
-
-- [ ] **Step 2: Write the builder page**
-
-Create `dashboard/app/setbuilder/[setId]/page.tsx`:
-
-```tsx
-'use client';
-
-import { use, useEffect, useState } from 'react';
-import { useRouter } from 'next/navigation';
-import Link from 'next/link';
-import { useAuth } from '@/lib/auth';
-import { api } from '@/lib/api';
-import type { SetDetail } from '@/lib/api-types';
-import styles from '../setbuilder.module.css';
-
-export default function BuilderPage({ params }: { params: Promise<{ setId: string }> }) {
-  const { setId } = use(params);
-  const { isAuthenticated, isLoading, role } = useAuth();
-  const router = useRouter();
-  const [set, setSet] = useState<SetDetail | null>(null);
-  const [error, setError] = useState<string | null>(null);
-
-  useEffect(() => {
-    if (!isLoading && !isAuthenticated) {
-      router.push('/login');
-    } else if (!isLoading && role === 'pending') {
-      router.push('/pending');
-    }
-  }, [isAuthenticated, isLoading, role, router]);
-
-  useEffect(() => {
-    if (isAuthenticated) {
-      api
-        .getSet(Number(setId))
-        .then(setSet)
-        .catch(() => setError('Set not found'));
-    }
-  }, [isAuthenticated, setId]);
-
-  if (isLoading || !isAuthenticated) {
-    return (
-      <div className="container">
-        <div className="loading">Loading...</div>
-      </div>
-    );
-  }
-
-  if (error) {
-    return (
-      <div className="container">
-        <div className="card" style={{ textAlign: 'center' }}>
-          <p style={{ color: 'var(--color-danger)' }}>{error}</p>
-          <Link href="/setbuilder" className="btn btn-primary" style={{ marginTop: '1rem', textDecoration: 'none' }}>
-            Back to Sets
-          </Link>
-        </div>
-      </div>
-    );
-  }
-
-  return (
-    <div>
-      <div className={styles.topbar}>
-        <Link
-          href="/setbuilder"
-          className="btn btn-sm"
-          style={{ background: 'var(--surface-raised)', textDecoration: 'none', color: 'var(--text)' }}
-        >
-          ← Sets
-        </Link>
-        <span className={styles.topbarTitle}>{set?.name ?? 'Loading…'}</span>
-        <span style={{ width: 60 }} />
-      </div>
-
-      <div className={styles.workspace}>
-        <section className={`${styles.panel} ${styles.panelPool}`} aria-label="Pool">
-          <div className={styles.panelHeader}>Pool</div>
-          <div className={styles.panelBody}>Candidate tracks will appear here.</div>
-        </section>
-
-        <section className={`${styles.panel} ${styles.panelCurve}`} aria-label="Curve">
-          <div className={styles.panelHeader}>Curve</div>
-          <div className={styles.panelBody}>Energy curve editor coming soon.</div>
-        </section>
-
-        <section className={`${styles.panel} ${styles.panelTimeline}`} aria-label="Timeline">
-          <div className={styles.panelHeader}>Timeline</div>
-          <div className={styles.panelBody}>Ordered set timeline coming soon.</div>
-        </section>
-
-        <section className={`${styles.panel} ${styles.panelChat}`} aria-label="Chat">
-          <div className={styles.panelHeader}>Chat</div>
-          <div className={styles.panelBody}>Agent chat coming soon.</div>
-        </section>
-      </div>
-    </div>
-  );
-}
-```
-
-- [ ] **Step 3: Type-check + lint + test**
-
-Run: `cd dashboard && npx tsc --noEmit && npm run lint && npm test -- --run`
-Expected: tsc clean, ESLint clean, all vitest tests pass.
-
-- [ ] **Step 4: Commit**
-
-```bash
-git add dashboard/app/setbuilder/\[setId\]/page.tsx dashboard/app/setbuilder/setbuilder.module.css
-git commit -m "feat(setbuilder): add builder workspace shell with 4-panel grid"
-```
-
----
-
-## Task 10: Full local CI sweep + finishing
-
-**Files:** none (verification + handoff)
-
-- [ ] **Step 1: Backend CI (from `server/`)**
-
-Run:
-```bash
-cd server && .venv/bin/ruff check . && .venv/bin/ruff format --check . && .venv/bin/bandit -r app -c pyproject.toml -q && .venv/bin/pytest --tb=short -q && .venv/bin/alembic upgrade head && .venv/bin/alembic check
-```
-Expected: every step green; `alembic check` says no new operations; coverage gate satisfied.
-
-- [ ] **Step 2: Frontend CI (from `dashboard/`)**
-
-Run:
-```bash
-cd dashboard && npm run lint && npx tsc --noEmit && npm test -- --run
-```
-Expected: every step green. (Restore `next-env.d.ts` with `git checkout dashboard/next-env.d.ts` if a build touched it.)
-
-- [ ] **Step 3: Finish the branch**
-
-Use superpowers:finishing-a-development-branch, choose **option 2 (Push + PR against main)**. The PR body MUST include `Closes #387`, a `## Design decisions` section (lift the decisions list above), and a test plan section.
-
----
-
-## Self-Review
-
-**Spec coverage:**
-- Models `Set`, `SetSlot`, `SetCurvePoint`, `SetCollaborator` → Task 2. ✔
-- Models `TrackVibe`, `TrackVibeOverride` incl. 5-col UNIQUE → Task 1. ✔
-- Alembic migration, single head, `alembic check` clean → Task 3 + Task 10. ✔
-- Router `/api/setbuilder/*` gated by `get_current_active_user`, set CRUD only → Task 6. ✔
-- LLM gateway interface stub delegating to `llm_client.py`, no provider SDK import → Task 4. ✔
-- Dashboard set list + builder 4-panel shell with design tokens → Tasks 8, 9. ✔
-- Acceptance "authenticated DJ can create/list/rename/delete an empty set" → Task 6 tests. ✔
-- Acceptance "no direct LLM provider SDK import anywhere in setbuilder code" → Task 4 AST test + manual review. ✔
-
-**Placeholder scan:** No TBD/TODO/"handle edge cases" — every code step is concrete.
-
-**Type consistency:** `SetSummary`/`SetDetail` match between `schemas/setbuilder.py` (Task 5), `api-types.ts` (Task 7), and the page imports (Tasks 8, 9). Gateway `dispatch`/`GatewayResponse`/`MODEL_HINTS` names match between `gateway.py` (Task 4) and its test. Service function names (`create_set`, `list_sets`, `get_owned_set`, `rename_set`, `delete_set`) match between `set_service.py` (Task 5) and the router (Task 6). Migration column names/types/server_defaults match the models (Tasks 1–3).
diff --git a/docs/superpowers/specs/2026-05-24-admin-ai-oauth-design.md b/docs/superpowers/specs/2026-05-24-admin-ai-oauth-design.md
index 6f912e93..83ba8e05 100644
--- a/docs/superpowers/specs/2026-05-24-admin-ai-oauth-design.md
+++ b/docs/superpowers/specs/2026-05-24-admin-ai-oauth-design.md
@@ -509,12 +509,28 @@ MVP ships when all hold:
 
 This spec is the work-order for an implementation agent (likely via `superpowers:executing-plans` + `superpowers:subagent-driven-development`).
 
+### 10.0 Branching & Integration Strategy
+
+**This work-track does NOT merge incrementally into `main`.** It is large and multi-stage; merging each piece into `main` before the whole feature is validated would ship half-built surfaces to production.
+
+Instead, all work converges on a **long-lived integration branch: `epic/ai-engine`** (created from `main`).
+
+- **Every sub-task branches off `epic/ai-engine`, not `main`:**
+  `git fetch origin && git checkout -b feat/issue-NNN origin/epic/ai-engine`
+- **Every sub-PR targets `epic/ai-engine` as its base** (`gh pr create --base epic/ai-engine ...`). Never open a sub-PR against `main`.
+- **Each stage is still validated independently** — full CI, CodeRabbit review, and manual testing run on every sub-PR before it merges into `epic/ai-engine`. The integration branch is not a dumping ground; it is gated the same as `main`.
+- **`epic/ai-engine` → `main` happens exactly once**, at the end, after the complete feature is validated end-to-end (full regression pass + manual sign-off). That final merge is its own reviewed PR.
+- **Keep the epic current:** periodically rebase/merge `main` into `epic/ai-engine` so it doesn't drift from production. Resolve conflicts on the epic, never by force-pushing `main`.
+- Wherever §11 mini-specs say a deferred item "depends on MVP merged", read that as **merged into `epic/ai-engine`** (not `main`).
+
+The MVP (issue #329 / its PR) is the first merge into `epic/ai-engine` and establishes the gateway interfaces all deferred adapters build on.
+
 ### 10.1 Phase 1: Build the MVP
 
 The implementer agent must:
 
 1. Read this spec in full before touching code
-2. Confirm it is working on branch `worktree-feat+admin-ai-oauth` (or equivalent feature branch — never `main`)
+2. Confirm it is working on a feature branch cut from `origin/epic/ai-engine` (e.g. `feat/issue-NNN`) — never `main`, and never directly on `epic/ai-engine` (see §10.0)
 3. Read `CLAUDE.md` (project root) for branch strategy, commit format, CI checks, deploy workflow
 4. Read related memory: `[[llm-oauth-gateway]]`, `[[feedback-litellm-avoid]]`
 5. Use `superpowers:writing-plans` to produce a phased implementation plan from this spec
@@ -527,7 +543,7 @@ The implementer agent must:
    - Sub-agent F: recommendation-engine migration + regression test
    - Sub-agent G: documentation updates (`CLAUDE.md` adds new env vars / new endpoints; `docs/` may need a new HUMAN-VERIFICATION-style doc for LLM connectors)
 7. Each sub-agent prompt must include the branch-safety template from `~/.claude/rules/agents.md` (read CLAUDE.md, never commit to main, branch name)
-8. After all sub-agents finish, run full local CI (the "push to testing" workflow from MEMORY.md) and only then push + open PR
+8. After all sub-agents finish, run full local CI (the "push to testing" workflow from MEMORY.md) and only then push + open PR **with base `epic/ai-engine`** (`gh pr create --base epic/ai-engine`)
 9. Honor all acceptance criteria in §9 before marking the MVP complete
 
 ### 10.2 Phase 2: File deferred items as GitHub issues
diff --git a/server/alembic/versions/047_admin_ai_oauth.py b/server/alembic/versions/047_admin_ai_oauth.py
new file mode 100644
index 00000000..9e080e86
--- /dev/null
+++ b/server/alembic/versions/047_admin_ai_oauth.py
@@ -0,0 +1,309 @@
+"""LLM gateway: connectors + call log + audit event + system_settings columns + data migration.
+
+Revision ID: 047
+Revises: 046
+Create Date: 2026-05-24
+
+Creates:
+- llm_connectors: per-DJ encrypted credential storage (Fernet via EncryptedText)
+- llm_call_log: per-call telemetry (counts only, no prompt/completion content)
+- llm_audit_event: connector lifecycle events for security review
+- 3 new columns on system_settings (apikey policy, compatible policy, default connector FK)
+
+Data migration:
+- If ANTHROPIC_API_KEY env var is set, creates an "anthropic_apikey" connector
+  named "Org Default (migrated from env var)" owned by the first admin user,
+  and points system_settings.llm_default_connector_id at it.
+- Idempotent: skips if a connector with that name already exists.
+- Skipped silently if no env var, no admin user, or encryption key unavailable.
+"""
+
+import json
+import logging
+import os
+from datetime import UTC, datetime
+
+import sqlalchemy as sa
+from sqlalchemy.orm import Session
+
+from alembic import op
+from app.core.encryption import encrypt_value
+
+revision: str = "047"
+down_revision: str | None = "046"
+branch_labels = None
+depends_on = None
+
+logger = logging.getLogger(__name__)
+
+_MIGRATED_DISPLAY_NAME = "Org Default (migrated from env var)"
+
+
+def upgrade() -> None:
+    # llm_connectors
+    op.create_table(
+        "llm_connectors",
+        sa.Column("id", sa.Integer(), primary_key=True),
+        sa.Column(
+            "user_id",
+            sa.Integer(),
+            sa.ForeignKey("users.id", ondelete="CASCADE"),
+            nullable=False,
+        ),
+        sa.Column("connector_type", sa.String(40), nullable=False),
+        sa.Column("display_name", sa.String(80), nullable=False),
+        sa.Column("status", sa.String(20), nullable=False, server_default="active"),
+        sa.Column("credentials", sa.Text(), nullable=False),
+        sa.Column("base_url_plain", sa.String(255), nullable=True),
+        sa.Column("model_hint", sa.String(80), nullable=True),
+        sa.Column(
+            "created_at",
+            sa.DateTime(),
+            nullable=False,
+            server_default=sa.func.now(),
+        ),
+        sa.Column(
+            "updated_at",
+            sa.DateTime(),
+            nullable=False,
+            server_default=sa.func.now(),
+        ),
+        sa.Column("last_used_at", sa.DateTime(), nullable=True),
+        sa.Column("last_error", sa.String(255), nullable=True),
+        sa.UniqueConstraint(
+            "user_id", "connector_type", "display_name", name="uq_dj_connector_label"
+        ),
+    )
+    op.create_index("ix_llm_connectors_user_id", "llm_connectors", ["user_id"])
+    op.create_index("ix_llm_connectors_connector_type", "llm_connectors", ["connector_type"])
+    op.create_index("ix_user_active", "llm_connectors", ["user_id", "status"])
+
+    # llm_call_log
+    op.create_table(
+        "llm_call_log",
+        sa.Column("id", sa.Integer(), primary_key=True),
+        sa.Column(
+            "connector_id",
+            sa.Integer(),
+            sa.ForeignKey("llm_connectors.id", ondelete="CASCADE"),
+            nullable=False,
+        ),
+        sa.Column("purpose", sa.String(40), nullable=False),
+        sa.Column("status", sa.String(20), nullable=False),
+        sa.Column("latency_ms", sa.Integer(), nullable=False),
+        sa.Column("tokens_in", sa.Integer(), nullable=True),
+        sa.Column("tokens_out", sa.Integer(), nullable=True),
+        sa.Column("error_code", sa.String(60), nullable=True),
+        sa.Column(
+            "created_at",
+            sa.DateTime(),
+            nullable=False,
+            server_default=sa.func.now(),
+        ),
+    )
+    op.create_index("ix_llm_call_log_connector_id", "llm_call_log", ["connector_id"])
+    op.create_index("ix_llm_call_log_purpose", "llm_call_log", ["purpose"])
+    op.create_index("ix_llm_call_log_created_at", "llm_call_log", ["created_at"])
+
+    # llm_audit_event
+    op.create_table(
+        "llm_audit_event",
+        sa.Column("id", sa.Integer(), primary_key=True),
+        sa.Column(
+            "actor_user_id",
+            sa.Integer(),
+            sa.ForeignKey("users.id"),
+            nullable=False,
+        ),
+        sa.Column(
+            "target_connector_id",
+            sa.Integer(),
+            sa.ForeignKey("llm_connectors.id", ondelete="SET NULL"),
+            nullable=True,
+        ),
+        sa.Column("event_type", sa.String(60), nullable=False),
+        sa.Column(
+            "created_at",
+            sa.DateTime(),
+            nullable=False,
+            server_default=sa.func.now(),
+        ),
+    )
+    op.create_index("ix_llm_audit_event_actor_user_id", "llm_audit_event", ["actor_user_id"])
+    op.create_index("ix_llm_audit_event_event_type", "llm_audit_event", ["event_type"])
+
+    # system_settings additions
+    op.add_column(
+        "system_settings",
+        sa.Column(
+            "llm_apikey_connectors_enabled",
+            sa.Boolean(),
+            nullable=False,
+            server_default=sa.text("true"),
+        ),
+    )
+    op.add_column(
+        "system_settings",
+        sa.Column(
+            "llm_compatible_connector_enabled",
+            sa.Boolean(),
+            nullable=False,
+            server_default=sa.text("true"),
+        ),
+    )
+    op.add_column(
+        "system_settings",
+        sa.Column(
+            "llm_default_connector_id",
+            sa.Integer(),
+            sa.ForeignKey("llm_connectors.id", ondelete="SET NULL"),
+            nullable=True,
+        ),
+    )
+
+    # Data migration: convert ANTHROPIC_API_KEY env var into a connector + org default
+    _migrate_env_var_anthropic_key()
+
+
+def downgrade() -> None:
+    op.drop_column("system_settings", "llm_default_connector_id")
+    op.drop_column("system_settings", "llm_compatible_connector_enabled")
+    op.drop_column("system_settings", "llm_apikey_connectors_enabled")
+
+    op.drop_index("ix_llm_audit_event_event_type", table_name="llm_audit_event")
+    op.drop_index("ix_llm_audit_event_actor_user_id", table_name="llm_audit_event")
+    op.drop_table("llm_audit_event")
+
+    op.drop_index("ix_llm_call_log_created_at", table_name="llm_call_log")
+    op.drop_index("ix_llm_call_log_purpose", table_name="llm_call_log")
+    op.drop_index("ix_llm_call_log_connector_id", table_name="llm_call_log")
+    op.drop_table("llm_call_log")
+
+    op.drop_index("ix_user_active", table_name="llm_connectors")
+    op.drop_index("ix_llm_connectors_connector_type", table_name="llm_connectors")
+    op.drop_index("ix_llm_connectors_user_id", table_name="llm_connectors")
+    op.drop_table("llm_connectors")
+
+
+def _migrate_env_var_anthropic_key() -> None:
+    """Best-effort data migration. Never fails the migration."""
+    api_key = os.environ.get("ANTHROPIC_API_KEY", "").strip()
+    if not api_key:
+        return
+
+    conn = op.get_bind()
+    session = Session(bind=conn)
+    try:
+        admin_row = session.execute(
+            sa.text("SELECT id FROM users WHERE role = 'admin' ORDER BY id ASC LIMIT 1")
+        ).first()
+        if not admin_row:
+            logger.info("046_admin_ai_oauth: no admin user found, skipping data migration")
+            return
+
+        admin_id = admin_row[0]
+
+        # Idempotency: skip if a connector with this label already exists.
+        existing = session.execute(
+            sa.text("SELECT id FROM llm_connectors WHERE user_id = :uid AND display_name = :name"),
+            {"uid": admin_id, "name": _MIGRATED_DISPLAY_NAME},
+        ).first()
+        if existing:
+            logger.info("046_admin_ai_oauth: connector already exists, skipping data migration")
+            return
+
+        try:
+            encrypted_creds = encrypt_value(json.dumps({"api_key": api_key}))
+        except Exception:
+            logger.warning("046_admin_ai_oauth: encryption unavailable, skipping data migration")
+            return
+
+        # Pull anthropic_model from settings if available; falls back to default.
+        try:
+            from app.core.config import get_settings
+
+            model_hint = get_settings().anthropic_model
+        except Exception:
+            model_hint = "claude-haiku-4-5-20251001"
+
+        now = datetime.now(UTC).replace(tzinfo=None)
+        result = session.execute(
+            sa.text(
+                "INSERT INTO llm_connectors "
+                "(user_id, connector_type, display_name, status, credentials, "
+                "model_hint, created_at, updated_at) "
+                "VALUES (:uid, :ctype, :name, :status, :creds, "
+                ":mhint, :created, :updated) "
+                "RETURNING id"
+            ),
+            {
+                "uid": admin_id,
+                "ctype": "anthropic_apikey",
+                "name": _MIGRATED_DISPLAY_NAME,
+                "status": "active",
+                "creds": encrypted_creds,
+                "mhint": model_hint,
+                "created": now,
+                "updated": now,
+            },
+        )
+        connector_id_row = result.first()
+        if connector_id_row is None:
+            # SQLite doesn't support RETURNING — fetch lastrowid via execute
+            connector_id = session.execute(
+                sa.text(
+                    "SELECT id FROM llm_connectors WHERE user_id = :uid AND display_name = :name"
+                ),
+                {"uid": admin_id, "name": _MIGRATED_DISPLAY_NAME},
+            ).scalar()
+        else:
+            connector_id = connector_id_row[0]
+
+        if connector_id is None:
+            logger.warning("046_admin_ai_oauth: could not resolve new connector id")
+            return
+
+        # Ensure system_settings row exists, then point at the new connector.
+        ss = session.execute(sa.text("SELECT id FROM system_settings LIMIT 1")).first()
+        if ss:
+            session.execute(
+                sa.text(
+                    "UPDATE system_settings SET llm_default_connector_id = :cid WHERE id = :sid"
+                ),
+                {"cid": connector_id, "sid": ss[0]},
+            )
+        else:
+            session.execute(
+                sa.text(
+                    "INSERT INTO system_settings (id, llm_default_connector_id) VALUES (1, :cid)"
+                ),
+                {"cid": connector_id},
+            )
+
+        # Audit event
+        session.execute(
+            sa.text(
+                "INSERT INTO llm_audit_event "
+                "(actor_user_id, target_connector_id, event_type, created_at) "
+                "VALUES (:uid, :cid, :etype, :created)"
+            ),
+            {
+                "uid": admin_id,
+                "cid": connector_id,
+                "etype": "connector_created",
+                "created": now,
+            },
+        )
+
+        session.commit()
+        logger.info(
+            "046_admin_ai_oauth: migrated ANTHROPIC_API_KEY env var to "
+            "connector_id=%s for admin user_id=%s",
+            connector_id,
+            admin_id,
+        )
+    except Exception as exc:
+        logger.warning("046_admin_ai_oauth: data migration failed: %s", exc)
+        session.rollback()
+    finally:
+        session.close()
diff --git a/server/alembic/versions/048_llm_call_log_retention.py b/server/alembic/versions/048_llm_call_log_retention.py
new file mode 100644
index 00000000..7534315d
--- /dev/null
+++ b/server/alembic/versions/048_llm_call_log_retention.py
@@ -0,0 +1,35 @@
+"""Configurable llm_call_log retention.
+
+Revision ID: 048
+Revises: 047
+Create Date: 2026-05-26
+
+Adds system_settings.llm_call_log_retention_days (int, default 30, NOT NULL).
+The daily cleanup job reads this value each run; sanity bounds (7..365) are
+enforced at the API level, not the database.
+"""
+
+import sqlalchemy as sa
+
+from alembic import op
+
+revision: str = "048"
+down_revision: str | None = "047"
+branch_labels = None
+depends_on = None
+
+
+def upgrade() -> None:
+    op.add_column(
+        "system_settings",
+        sa.Column(
+            "llm_call_log_retention_days",
+            sa.Integer(),
+            nullable=False,
+            server_default=sa.text("30"),
+        ),
+    )
+
+
+def downgrade() -> None:
+    op.drop_column("system_settings", "llm_call_log_retention_days")
diff --git a/server/alembic/versions/049_llm_connector_is_default.py b/server/alembic/versions/049_llm_connector_is_default.py
new file mode 100644
index 00000000..4642b63f
--- /dev/null
+++ b/server/alembic/versions/049_llm_connector_is_default.py
@@ -0,0 +1,128 @@
+"""Per-DJ explicit default connector toggle (issue #336).
+
+Revision ID: 049
+Revises: 048
+Create Date: 2026-05-28
+
+Adds llm_connectors.is_default (bool, NOT NULL, default false) plus a partial
+unique index enforcing at most one default per user. Backfills by marking each
+DJ's MRU active connector as default on first deploy so resolution behavior is
+unchanged for existing users (they keep getting their previous most-recently
+used connector — now pinned).
+"""
+
+from __future__ import annotations
+
+import logging
+
+import sqlalchemy as sa
+
+from alembic import op
+
+revision: str = "049"
+down_revision: str | None = "048"
+branch_labels = None
+depends_on = None
+
+logger = logging.getLogger(__name__)
+
+
+def upgrade() -> None:
+    op.add_column(
+        "llm_connectors",
+        sa.Column(
+            "is_default",
+            sa.Boolean(),
+            nullable=False,
+            server_default=sa.text("false"),
+        ),
+    )
+
+    bind = op.get_bind()
+    dialect = bind.dialect.name
+
+    # Partial unique index: at most one default per user_id. Both Postgres and
+    # SQLite (3.8+) support the partial-index WHERE clause; other dialects skip
+    # the index — the service layer still enforces single-default semantics.
+    if dialect == "postgresql":
+        op.create_index(
+            "ix_llm_connectors_user_default_unique",
+            "llm_connectors",
+            ["user_id"],
+            unique=True,
+            postgresql_where=sa.text("is_default"),
+        )
+    elif dialect == "sqlite":
+        op.create_index(
+            "ix_llm_connectors_user_default_unique",
+            "llm_connectors",
+            ["user_id"],
+            unique=True,
+            sqlite_where=sa.text("is_default"),
+        )
+    else:  # pragma: no cover — production runs Postgres; SQLite is tests
+        # Fall back to a non-unique covering index so resolver lookups stay
+        # cheap. The service layer (clear-then-set) still enforces uniqueness.
+        op.create_index(
+            "ix_llm_connectors_user_default_unique",
+            "llm_connectors",
+            ["user_id"],
+        )
+
+    _backfill_mru_defaults(bind)
+
+
+def downgrade() -> None:
+    op.drop_index("ix_llm_connectors_user_default_unique", table_name="llm_connectors")
+    op.drop_column("llm_connectors", "is_default")
+
+
+def _backfill_mru_defaults(bind: sa.engine.Connection) -> None:
+    """Mark each user's MRU active connector as default (one per user).
+
+    MRU = ``last_used_at`` DESC NULLS LAST, ``id`` DESC — same ordering the
+    gateway resolver uses. Skips users that have no active connector. Idempotent
+    on re-run: if a user already has any default, leaves it alone.
+    """
+    user_rows = bind.execute(
+        sa.text("SELECT DISTINCT user_id FROM llm_connectors WHERE status = 'active'")
+    ).all()
+
+    for (user_id,) in user_rows:
+        existing_default = bind.execute(
+            sa.text(
+                "SELECT id FROM llm_connectors "
+                "WHERE user_id = :uid AND is_default = :truthy AND status = 'active' "
+                "LIMIT 1"
+            ),
+            {"uid": user_id, "truthy": True},
+        ).first()
+        if existing_default is not None:
+            continue
+
+        # ORDER BY last_used_at DESC NULLS LAST is portable via the CASE trick
+        # so the migration works on both Postgres and SQLite (the latter's
+        # NULLS handling differs by default).
+        mru = bind.execute(
+            sa.text(
+                "SELECT id FROM llm_connectors "
+                "WHERE user_id = :uid AND status = 'active' "
+                "ORDER BY CASE WHEN last_used_at IS NULL THEN 1 ELSE 0 END, "
+                "last_used_at DESC, id DESC "
+                "LIMIT 1"
+            ),
+            {"uid": user_id},
+        ).first()
+        if mru is None:
+            continue
+
+        bind.execute(
+            sa.text("UPDATE llm_connectors SET is_default = :truthy WHERE id = :cid"),
+            {"truthy": True, "cid": mru[0]},
+        )
+        logger.info(
+            "048_llm_connector_is_default: backfilled is_default=True for "
+            "connector_id=%s user_id=%s",
+            mru[0],
+            user_id,
+        )
diff --git a/server/alembic/versions/050_llm_connector_health_check_columns.py b/server/alembic/versions/050_llm_connector_health_check_columns.py
new file mode 100644
index 00000000..2434ac40
--- /dev/null
+++ b/server/alembic/versions/050_llm_connector_health_check_columns.py
@@ -0,0 +1,42 @@
+"""Add last_health_check_at + last_health_check_status to llm_connectors.
+
+Revision ID: 050
+Revises: 049
+Create Date: 2026-05-28
+
+Adds two health-check observability columns to ``llm_connectors``:
+
+- ``last_health_check_at`` (DateTime, nullable) — UTC timestamp of the most
+  recent health check (DJ-triggered "Test" button OR the background monitor).
+- ``last_health_check_status`` (String(20), nullable) — outcome of that
+  health check. One of: ``"ok"``, ``"auth_invalid"``, ``"rate_limited"``,
+  ``"provider_unavailable"``, ``"quota_exceeded"``, ``"error"``. Allowed
+  values are enforced at the application layer (see ``connector_storage``).
+
+Both columns are nullable because existing rows have no prior health check.
+"""
+
+import sqlalchemy as sa
+
+from alembic import op
+
+revision: str = "050"
+down_revision: str | None = "049"
+branch_labels = None
+depends_on = None
+
+
+def upgrade() -> None:
+    op.add_column(
+        "llm_connectors",
+        sa.Column("last_health_check_at", sa.DateTime(), nullable=True),
+    )
+    op.add_column(
+        "llm_connectors",
+        sa.Column("last_health_check_status", sa.String(length=20), nullable=True),
+    )
+
+
+def downgrade() -> None:
+    op.drop_column("llm_connectors", "last_health_check_status")
+    op.drop_column("llm_connectors", "last_health_check_at")
diff --git a/server/alembic/versions/051_llm_feature_preference.py b/server/alembic/versions/051_llm_feature_preference.py
new file mode 100644
index 00000000..e0dc3c4c
--- /dev/null
+++ b/server/alembic/versions/051_llm_feature_preference.py
@@ -0,0 +1,56 @@
+"""Add llm_feature_preferences table.
+
+Revision ID: 051
+Revises: 050
+Create Date: 2026-05-28
+
+Per-feature connector preference (issue #337). Maps ``(user_id, feature)`` to a
+pinned ``connector_id`` with a UNIQUE constraint so a DJ has at most one pinned
+connector per feature. Both FKs cascade on delete so a deleted user or
+connector never leaves a dangling preference.
+"""
+
+import sqlalchemy as sa
+
+from alembic import op
+
+revision: str = "051"
+down_revision: str | None = "050"
+branch_labels = None
+depends_on = None
+
+
+def upgrade() -> None:
+    op.create_table(
+        "llm_feature_preferences",
+        sa.Column("id", sa.Integer(), nullable=False),
+        sa.Column("user_id", sa.Integer(), nullable=False),
+        sa.Column("feature", sa.String(length=40), nullable=False),
+        sa.Column("connector_id", sa.Integer(), nullable=False),
+        sa.Column(
+            "created_at",
+            sa.DateTime(),
+            server_default=sa.func.now(),
+            nullable=False,
+        ),
+        sa.ForeignKeyConstraint(["user_id"], ["users.id"], ondelete="CASCADE"),
+        sa.ForeignKeyConstraint(["connector_id"], ["llm_connectors.id"], ondelete="CASCADE"),
+        sa.PrimaryKeyConstraint("id"),
+        sa.UniqueConstraint("user_id", "feature", name="uq_llm_feature_pref_user_feature"),
+    )
+    op.create_index(
+        "ix_llm_feature_preferences_user_id",
+        "llm_feature_preferences",
+        ["user_id"],
+    )
+    op.create_index(
+        "ix_llm_feature_preferences_connector_id",
+        "llm_feature_preferences",
+        ["connector_id"],
+    )
+
+
+def downgrade() -> None:
+    op.drop_index("ix_llm_feature_preferences_connector_id", table_name="llm_feature_preferences")
+    op.drop_index("ix_llm_feature_preferences_user_id", table_name="llm_feature_preferences")
+    op.drop_table("llm_feature_preferences")
diff --git a/server/alembic/versions/052_llm_connector_monthly_token_cap.py b/server/alembic/versions/052_llm_connector_monthly_token_cap.py
new file mode 100644
index 00000000..46c9186a
--- /dev/null
+++ b/server/alembic/versions/052_llm_connector_monthly_token_cap.py
@@ -0,0 +1,47 @@
+"""Add monthly_token_cap to llm_connectors (issue #339).
+
+Revision ID: 052
+Revises: 051
+Create Date: 2026-05-28
+
+Adds an admin-set per-DJ monthly token cap to ``llm_connectors``:
+
+- ``monthly_token_cap`` (Integer, nullable) — NULL means unlimited. When set,
+  the LLM gateway refuses dispatch once the current calendar month's summed
+  ``tokens_in + tokens_out`` for the connector meets or exceeds this value.
+
+Nullable with no server default so existing connectors stay unlimited.
+"""
+
+import sqlalchemy as sa
+
+from alembic import op
+
+revision: str = "052"
+down_revision: str | None = "051"
+branch_labels = None
+depends_on = None
+
+
+def upgrade() -> None:
+    op.add_column(
+        "llm_connectors",
+        sa.Column("monthly_token_cap", sa.Integer(), nullable=True),
+    )
+    # Defence-in-depth: the API schema (ge=0) and service layer already reject
+    # negatives, but a DB CHECK guarantees a bad write can never persist a
+    # negative cap (which would make the connector permanently "over budget").
+    op.create_check_constraint(
+        "ck_llm_connectors_monthly_token_cap_nonnegative",
+        "llm_connectors",
+        "monthly_token_cap IS NULL OR monthly_token_cap >= 0",
+    )
+
+
+def downgrade() -> None:
+    op.drop_constraint(
+        "ck_llm_connectors_monthly_token_cap_nonnegative",
+        "llm_connectors",
+        type_="check",
+    )
+    op.drop_column("llm_connectors", "monthly_token_cap")
diff --git a/server/app/api/__init__.py b/server/app/api/__init__.py
index 71e8c63d..234a496e 100644
--- a/server/app/api/__init__.py
+++ b/server/app/api/__init__.py
@@ -2,6 +2,7 @@
 
 from app.api import (
     admin,
+    admin_llm,
     auth,
     beatport,
     bridge,
@@ -9,6 +10,7 @@
     events,
     guest,
     kiosk,
+    llm,
     public,
     requests,
     search,
@@ -45,3 +47,5 @@ def api_health_check():
 api_router.include_router(kiosk.public_router, prefix="/public/kiosk", tags=["kiosk"])
 api_router.include_router(kiosk.auth_router, prefix="/kiosk", tags=["kiosk"])
 api_router.include_router(admin.router, prefix="/admin", tags=["admin"])
+api_router.include_router(llm.router, prefix="/llm", tags=["llm"])
+api_router.include_router(admin_llm.router, prefix="/admin/llm", tags=["admin", "llm"])
diff --git a/server/app/api/admin_llm.py b/server/app/api/admin_llm.py
new file mode 100644
index 00000000..2f7564f0
--- /dev/null
+++ b/server/app/api/admin_llm.py
@@ -0,0 +1,444 @@
+"""Admin LLM policy + connector oversight endpoints.
+
+Authentication: ``get_current_admin``.
+Routes are mounted at ``/api/admin/llm``.
+"""
+
+from __future__ import annotations
+
+import csv
+import io
+import logging
+from collections.abc import Iterator
+from datetime import timedelta
+
+from fastapi import APIRouter, Depends, HTTPException, Query
+from fastapi import Request as FastAPIRequest
+from fastapi.responses import StreamingResponse
+from sqlalchemy import func, select
+from sqlalchemy.orm import Session
+
+from app.api.deps import get_current_admin, get_db
+from app.core.csv_safe import sanitize_csv_value
+from app.core.rate_limit import limiter
+from app.core.time import utcnow
+from app.models.llm_connector import LlmAuditEvent, LlmConnector
+from app.models.user import User
+from app.schemas.llm import (
+    AdminAuditOut,
+    AdminConnectorCapPatch,
+    AdminConnectorOut,
+    AdminPolicyOut,
+    AdminPolicyPatch,
+    AdminUsageOut,
+    AuditEventRow,
+    UsageRow,
+)
+from app.services.llm.connector_storage import (
+    AUDIT_POLICY_CHANGED,
+    AUDIT_REVOKED_BY_ADMIN,
+    audit_event,
+    current_month_token_usage,
+    current_month_token_usage_bulk,
+    get_connector,
+    get_usage_stats,
+    get_user_label,
+    list_all_connectors,
+    revoke_connector,
+    set_monthly_cap,
+)
+from app.services.system_settings import get_system_settings, update_system_settings
+
+logger = logging.getLogger(__name__)
+
+router = APIRouter()
+
+# Hard ceiling for a single CSV export — keeps an attacker (or an honest admin
+# with a huge history) from streaming an unbounded result set.
+_AUDIT_CSV_ROW_CAP = 10_000
+
+
+def _connector_to_admin_out(
+    row: LlmConnector, dj_username: str, current_month_tokens: int = 0
+) -> AdminConnectorOut:
+    """Reflect a connector row + its owner's display name into the admin view.
+
+    ``AdminConnectorOut`` adds ``dj_username`` and ``current_month_tokens``,
+    which aren't columns on the row, so the model is validated from a
+    column-reflection dict plus those extras rather than the ORM object
+    directly.
+    """
+    return AdminConnectorOut.model_validate(
+        {
+            **{c.name: getattr(row, c.name) for c in LlmConnector.__table__.columns},
+            "dj_username": dj_username,
+            "current_month_tokens": current_month_tokens,
+        }
+    )
+
+
+def _audit_query(
+    db: Session,
+    *,
+    event_type: str | None,
+    actor_user_id: int | None,
+    target_connector_id: int | None,
+    days: int,
+):
+    """Build the base SELECT joining actor username + connector display name.
+
+    Read-only: never touches the encrypted ``credentials`` column. Returns a
+    Core ``Select`` over (LlmAuditEvent, actor_username, connector_display_name)
+    so both the JSON browse endpoint and the CSV export share one filter path.
+    """
+    cutoff = utcnow() - timedelta(days=days)
+    stmt = (
+        select(
+            LlmAuditEvent,
+            User.username.label("actor_username"),
+            LlmConnector.display_name.label("connector_display_name"),
+        )
+        .join(User, User.id == LlmAuditEvent.actor_user_id, isouter=True)
+        .join(
+            LlmConnector,
+            LlmConnector.id == LlmAuditEvent.target_connector_id,
+            isouter=True,
+        )
+        .where(LlmAuditEvent.created_at >= cutoff)
+    )
+    if event_type is not None:
+        stmt = stmt.where(LlmAuditEvent.event_type == event_type)
+    if actor_user_id is not None:
+        stmt = stmt.where(LlmAuditEvent.actor_user_id == actor_user_id)
+    if target_connector_id is not None:
+        stmt = stmt.where(LlmAuditEvent.target_connector_id == target_connector_id)
+    return stmt
+
+
+@router.get("/policy", response_model=AdminPolicyOut)
+@limiter.limit("60/minute")
+def get_policy(
+    request: FastAPIRequest,
+    _admin: User = Depends(get_current_admin),
+    db: Session = Depends(get_db),
+) -> AdminPolicyOut:
+    settings = get_system_settings(db)
+    return AdminPolicyOut(
+        llm_apikey_connectors_enabled=settings.llm_apikey_connectors_enabled,
+        llm_compatible_connector_enabled=settings.llm_compatible_connector_enabled,
+        llm_default_connector_id=settings.llm_default_connector_id,
+        llm_call_log_retention_days=settings.llm_call_log_retention_days,
+    )
+
+
+@router.patch("/policy", response_model=AdminPolicyOut)
+@limiter.limit("30/minute")
+def patch_policy(
+    request: FastAPIRequest,
+    payload: AdminPolicyPatch,
+    admin: User = Depends(get_current_admin),
+    db: Session = Depends(get_db),
+) -> AdminPolicyOut:
+    update_kwargs: dict = {}
+    if payload.llm_apikey_connectors_enabled is not None:
+        update_kwargs["llm_apikey_connectors_enabled"] = payload.llm_apikey_connectors_enabled
+    if payload.llm_compatible_connector_enabled is not None:
+        update_kwargs["llm_compatible_connector_enabled"] = payload.llm_compatible_connector_enabled
+    if payload.llm_call_log_retention_days is not None:
+        update_kwargs["llm_call_log_retention_days"] = payload.llm_call_log_retention_days
+
+    # Default connector handling:
+    # - clear_default=True takes precedence and sets to NULL
+    # - explicit `llm_default_connector_id: null` also clears the default
+    # - otherwise, llm_default_connector_id (if non-None) is validated and set
+    explicit_null_default = (
+        "llm_default_connector_id" in payload.model_fields_set
+        and payload.llm_default_connector_id is None
+    )
+    if payload.clear_default or explicit_null_default:
+        update_kwargs["llm_default_connector_id"] = None
+    elif payload.llm_default_connector_id is not None:
+        target = get_connector(db, payload.llm_default_connector_id)
+        if target is None:
+            raise HTTPException(status_code=400, detail="default connector not found")
+        if target.status != "active":
+            raise HTTPException(
+                status_code=400,
+                detail="default connector must be active",
+            )
+        update_kwargs["llm_default_connector_id"] = target.id
+
+    settings = update_system_settings(db, **update_kwargs)
+    audit_event(
+        db,
+        actor_user_id=admin.id,
+        target_connector_id=settings.llm_default_connector_id,
+        event_type=AUDIT_POLICY_CHANGED,
+    )
+    db.commit()
+    return AdminPolicyOut(
+        llm_apikey_connectors_enabled=settings.llm_apikey_connectors_enabled,
+        llm_compatible_connector_enabled=settings.llm_compatible_connector_enabled,
+        llm_default_connector_id=settings.llm_default_connector_id,
+        llm_call_log_retention_days=settings.llm_call_log_retention_days,
+    )
+
+
+@router.get("/connectors", response_model=list[AdminConnectorOut])
+@limiter.limit("60/minute")
+def list_connectors_admin(
+    request: FastAPIRequest,
+    _admin: User = Depends(get_current_admin),
+    db: Session = Depends(get_db),
+) -> list[AdminConnectorOut]:
+    rows = list_all_connectors(db)
+    user_ids = {r.user_id for r in rows}
+    usernames: dict[int, str] = {}
+    if user_ids:
+        users = db.query(User).filter(User.id.in_(user_ids)).all()
+        usernames = {u.id: u.username for u in users}
+
+    # One grouped aggregate for all connectors instead of an N+1 per-row query.
+    usage_by_connector = current_month_token_usage_bulk(db, [r.id for r in rows])
+
+    return [
+        _connector_to_admin_out(
+            r,
+            usernames.get(r.user_id) or f"user#{r.user_id}",
+            usage_by_connector.get(r.id, 0),
+        )
+        for r in rows
+    ]
+
+
+@router.post("/connectors/{connector_id}/revoke", response_model=AdminConnectorOut)
+@limiter.limit("30/minute")
+def revoke_connector_admin(
+    request: FastAPIRequest,
+    connector_id: int,
+    admin: User = Depends(get_current_admin),
+    db: Session = Depends(get_db),
+) -> AdminConnectorOut:
+    row = get_connector(db, connector_id)
+    if row is None:
+        raise HTTPException(status_code=404, detail="Connector not found")
+
+    revoke_connector(row)
+    audit_event(
+        db,
+        actor_user_id=admin.id,
+        target_connector_id=row.id,
+        event_type=AUDIT_REVOKED_BY_ADMIN,
+    )
+
+    # If the revoked connector was the system default, clear it.
+    settings = get_system_settings(db)
+    if settings.llm_default_connector_id == row.id:
+        settings.llm_default_connector_id = None
+
+    db.commit()
+    db.refresh(row)
+    return _connector_to_admin_out(
+        row, get_user_label(db, row.user_id), current_month_token_usage(db, row.id)
+    )
+
+
+@router.patch("/connectors/{connector_id}/cap", response_model=AdminConnectorOut)
+@limiter.limit("30/minute")
+def set_connector_cap_admin(
+    request: FastAPIRequest,
+    connector_id: int,
+    payload: AdminConnectorCapPatch,
+    admin: User = Depends(get_current_admin),
+    db: Session = Depends(get_db),
+) -> AdminConnectorOut:
+    """Set or clear a connector's monthly token cap (admin-only, issue #339).
+
+    ``monthly_token_cap = null`` clears the cap (unlimited). The change is
+    pre-flight only: an in-flight gateway call already past its cap check is
+    unaffected. Pydantic enforces the non-negative bound (``ge=0``); the
+    service layer re-validates defensively.
+    """
+    row = get_connector(db, connector_id)
+    if row is None:
+        raise HTTPException(status_code=404, detail="Connector not found")
+
+    try:
+        set_monthly_cap(row, payload.monthly_token_cap)
+    except ValueError as exc:
+        raise HTTPException(status_code=400, detail=str(exc)) from exc
+
+    audit_event(
+        db,
+        actor_user_id=admin.id,
+        target_connector_id=row.id,
+        event_type=AUDIT_POLICY_CHANGED,
+    )
+    db.commit()
+    db.refresh(row)
+    return _connector_to_admin_out(
+        row, get_user_label(db, row.user_id), current_month_token_usage(db, row.id)
+    )
+
+
+@router.get("/usage", response_model=AdminUsageOut)
+@limiter.limit("30/minute")
+def get_usage(
+    request: FastAPIRequest,
+    days: int = Query(default=30, ge=1, le=180),
+    _admin: User = Depends(get_current_admin),
+    db: Session = Depends(get_db),
+) -> AdminUsageOut:
+    rows = get_usage_stats(db, days=days)
+    rows_out: list[UsageRow] = []
+    if rows:
+        connector_ids = [r["connector_id"] for r in rows]
+        connectors = db.query(LlmConnector).filter(LlmConnector.id.in_(connector_ids)).all()
+        connector_map = {c.id: c for c in connectors}
+        user_ids = {c.user_id for c in connectors}
+        users = db.query(User).filter(User.id.in_(user_ids)).all() if user_ids else []
+        usernames = {u.id: u.username for u in users}
+
+        for r in rows:
+            cid = r["connector_id"]
+            c = connector_map.get(cid)
+            if c is None:
+                continue
+            total = r["total_calls"]
+            errors = r["error_count"]
+            rows_out.append(
+                UsageRow(
+                    connector_id=cid,
+                    dj_username=usernames.get(c.user_id, f"user#{c.user_id}"),
+                    display_name=c.display_name,
+                    connector_type=c.connector_type,  # type: ignore[arg-type]
+                    total_calls=total,
+                    total_tokens_in=r["total_tokens_in"],
+                    total_tokens_out=r["total_tokens_out"],
+                    error_count=errors,
+                    error_rate=(errors / total) if total else 0.0,
+                )
+            )
+    # Sort: most calls first, then by error rate desc as tiebreaker
+    rows_out.sort(key=lambda r: (-r.total_calls, -r.error_rate))
+    return AdminUsageOut(days=days, rows=rows_out)
+
+
+@router.get("/audit", response_model=AdminAuditOut)
+@limiter.limit("60/minute")
+def list_audit_events(
+    request: FastAPIRequest,
+    event_type: str | None = Query(default=None, max_length=60),
+    actor_user_id: int | None = Query(default=None, ge=1),
+    target_connector_id: int | None = Query(default=None, ge=1),
+    days: int = Query(default=30, ge=1, le=3650),
+    limit: int = Query(default=50, ge=1, le=200),
+    offset: int = Query(default=0, ge=0),
+    _admin: User = Depends(get_current_admin),
+    db: Session = Depends(get_db),
+) -> AdminAuditOut:
+    """Browse the LLM audit trail (admin-only).
+
+    Read-only view over ``llm_audit_event`` with optional filters and
+    pagination. The target connector's display name is joined in — credential
+    material is never read or returned.
+    """
+    base = _audit_query(
+        db,
+        event_type=event_type,
+        actor_user_id=actor_user_id,
+        target_connector_id=target_connector_id,
+        days=days,
+    )
+
+    total = db.execute(select(func.count()).select_from(base.subquery())).scalar_one()
+
+    page = (
+        base.order_by(LlmAuditEvent.created_at.desc(), LlmAuditEvent.id.desc())
+        .limit(limit)
+        .offset(offset)
+    )
+
+    rows_out: list[AuditEventRow] = []
+    for event, actor_username, connector_display_name in db.execute(page).all():
+        rows_out.append(
+            AuditEventRow(
+                id=event.id,
+                created_at=event.created_at,
+                event_type=event.event_type,
+                actor_user_id=event.actor_user_id,
+                actor_username=actor_username or f"user#{event.actor_user_id}",
+                target_connector_id=event.target_connector_id,
+                target_connector_display_name=connector_display_name,
+                notes=None,
+            )
+        )
+
+    return AdminAuditOut(rows=rows_out, total=int(total), limit=limit, offset=offset)
+
+
+@router.get(
+    "/audit.csv",
+    response_class=StreamingResponse,
+    responses={
+        200: {
+            "content": {"text/csv": {"schema": {"type": "string", "format": "binary"}}},
+            "description": "CSV export of the filtered audit trail.",
+        }
+    },
+)
+@limiter.limit("12/minute")
+def export_audit_events_csv(
+    request: FastAPIRequest,
+    event_type: str | None = Query(default=None, max_length=60),
+    actor_user_id: int | None = Query(default=None, ge=1),
+    target_connector_id: int | None = Query(default=None, ge=1),
+    days: int = Query(default=30, ge=1, le=3650),
+    _admin: User = Depends(get_current_admin),
+    db: Session = Depends(get_db),
+) -> StreamingResponse:
+    """Export the (filtered) audit trail as CSV (admin-only).
+
+    Honors the same filters as ``GET /audit``. Capped at
+    ``_AUDIT_CSV_ROW_CAP`` rows to avoid unbounded streaming. Columns:
+    timestamp, actor, event_type, target_connector, notes. Never includes
+    credential material.
+    """
+    stmt = (
+        _audit_query(
+            db,
+            event_type=event_type,
+            actor_user_id=actor_user_id,
+            target_connector_id=target_connector_id,
+            days=days,
+        )
+        .order_by(LlmAuditEvent.created_at.desc(), LlmAuditEvent.id.desc())
+        .limit(_AUDIT_CSV_ROW_CAP)
+    )
+    result_rows = db.execute(stmt).all()
+
+    def _generate() -> Iterator[str]:
+        buffer = io.StringIO()
+        writer = csv.writer(buffer)
+        writer.writerow(["timestamp", "actor", "event_type", "target_connector", "notes"])
+        yield buffer.getvalue()
+        buffer.seek(0)
+        buffer.truncate(0)
+
+        for event, actor_username, connector_display_name in result_rows:
+            actor = actor_username or f"user#{event.actor_user_id}"
+            writer.writerow(
+                [
+                    event.created_at.isoformat() if event.created_at else "",
+                    sanitize_csv_value(actor),
+                    sanitize_csv_value(event.event_type or ""),
+                    sanitize_csv_value(connector_display_name or ""),
+                    "",
+                ]
+            )
+            yield buffer.getvalue()
+            buffer.seek(0)
+            buffer.truncate(0)
+
+    headers = {"Content-Disposition": 'attachment; filename="llm-audit-events.csv"'}
+    return StreamingResponse(_generate(), media_type="text/csv", headers=headers)
diff --git a/server/app/api/events.py b/server/app/api/events.py
index 8ebc07e9..46f3153c 100644
--- a/server/app/api/events.py
+++ b/server/app/api/events.py
@@ -191,7 +191,7 @@ def _request_to_out(r) -> RequestOut:
     )
 
 
-def _build_recommendation_response(result, db) -> RecommendationResponse:
+def _build_recommendation_response(result, db, actor=None) -> RecommendationResponse:
     """Build a RecommendationResponse from a recommendation engine result."""
     from app.services.recommendation.camelot import parse_key
     from app.services.recommendation.llm_hooks import is_llm_available
@@ -234,7 +234,7 @@ def _build_recommendation_response(result, db) -> RecommendationResponse:
         profile=profile,
         services_used=result.services_used,
         total_candidates_searched=result.total_candidates_searched,
-        llm_available=is_llm_available(db),
+        llm_available=is_llm_available(db, actor=actor),
     )
 
 
@@ -856,7 +856,7 @@ def get_recommendations(
         )
 
     result = generate_recommendations(db, user, event)
-    return _build_recommendation_response(result, db)
+    return _build_recommendation_response(result, db, actor=user)
 
 
 @router.get("/{code}/playlists")
@@ -933,7 +933,7 @@ def get_recommendations_from_template(
         template_source=template_request.source,
         template_id=template_request.playlist_id,
     )
-    return _build_recommendation_response(result, db)
+    return _build_recommendation_response(result, db, actor=user)
 
 
 @router.post("/{code}/recommendations/llm")
@@ -954,14 +954,14 @@ async def get_llm_recommendations(
     sys_settings = get_system_settings(db)
     _llm_rate_limit_cache["value"] = sys_settings.llm_rate_limit_per_minute
 
-    if not is_llm_available(db):
+    user = event.created_by
+
+    if not is_llm_available(db, actor=user):
         raise HTTPException(
             status_code=503,
-            detail="LLM recommendations not configured. Set ANTHROPIC_API_KEY to enable.",
+            detail="LLM recommendations not configured. Add a DJ/admin AI connector to enable.",
         )
 
-    user = event.created_by
-
     has_services = bool(user.tidal_access_token) or bool(user.beatport_access_token)
     if not has_services:
         raise HTTPException(
@@ -969,8 +969,13 @@ async def get_llm_recommendations(
             detail="No music services connected. Link Tidal or Beatport to get recommendations.",
         )
 
+    from app.services.llm.exceptions import QuotaCapReached
+
     try:
         result = await generate_recommendations_from_llm(db, user, event, prompt_request.prompt)
+    except QuotaCapReached as exc:
+        # DJ-facing message only — no internal usage/cap details leaked (issue #339).
+        raise HTTPException(status_code=429, detail=str(exc)) from exc
     except Exception:
         import logging
 
@@ -980,7 +985,7 @@ async def get_llm_recommendations(
             detail="LLM service error. Try again or use algorithmic recommendations.",
         )
 
-    base = _build_recommendation_response(result, db)
+    base = _build_recommendation_response(result, db, actor=user)
 
     llm_queries = [
         LLMQueryInfo(
@@ -999,7 +1004,7 @@ async def get_llm_recommendations(
         services_used=base.services_used,
         total_candidates_searched=base.total_candidates_searched,
         llm_queries=llm_queries,
-        llm_model=get_settings().anthropic_model,
+        llm_model=result.llm_model or get_settings().anthropic_model,
     )
 
 
diff --git a/server/app/api/llm.py b/server/app/api/llm.py
new file mode 100644
index 00000000..67381dce
--- /dev/null
+++ b/server/app/api/llm.py
@@ -0,0 +1,563 @@
+"""Per-DJ LLM connector management endpoints.
+
+Authentication: ``get_current_active_user`` (any DJ, not pending).
+Routes are mounted at ``/api/llm/connectors``.
+
+All endpoints scope queries by ``user_id = current_user.id`` server-side.
+404 (not 403) is returned for connector IDs the DJ doesn't own — this avoids
+leaking the existence of another DJ's connectors.
+"""
+
+from __future__ import annotations
+
+import json as _json
+import logging
+
+from fastapi import APIRouter, Depends, HTTPException
+from fastapi import Request as FastAPIRequest
+from sqlalchemy.orm import Session
+from sse_starlette.sse import EventSourceResponse
+
+from app.api.deps import get_current_active_user, get_db
+from app.core.rate_limit import limiter
+from app.models.llm_connector import (
+    CONNECTOR_TYPE_OPENAI_COMPATIBLE,
+    VALID_CONNECTOR_TYPES,
+    LlmConnector,
+)
+from app.models.user import User
+from app.schemas.ai_settings import AIModelsResponse
+from app.schemas.llm import (
+    KNOWN_FEATURE_VALUES,
+    ConnectorCreate,
+    ConnectorCredentialsRotate,
+    ConnectorOut,
+    ConnectorPatch,
+    ConnectorTestResult,
+    DjPolicyOut,
+    FeatureKey,
+    FeaturePreferenceOut,
+    FeaturePreferenceSet,
+    FeaturePreferencesListOut,
+)
+from app.services.llm.base import ChatRequest as LlmChatRequest
+from app.services.llm.base import Message as LlmMessage
+from app.services.llm.connector_storage import (
+    AUDIT_CREATED,
+    AUDIT_CREDENTIALS_ROTATED,
+    AUDIT_DEFAULT_SET,
+    AUDIT_DEFAULT_UNSET,
+    AUDIT_DELETED,
+    audit_event,
+    build_create_payload,
+    clear_feature_preference,
+    create_connector,
+    delete_connector,
+    get_connector_for_user,
+    get_feature_preferences_for_user,
+    list_connectors_for_user,
+    rotate_credentials,
+    set_default_for_user,
+    set_feature_preference,
+    unset_default_for_user,
+    update_metadata,
+)
+from app.services.llm.exceptions import LlmError, NoLlmConfigured
+from app.services.llm.gateway import Gateway
+from app.services.llm.openrouter_models import get_openrouter_models
+from app.services.system_settings import get_system_settings
+
+logger = logging.getLogger(__name__)
+
+router = APIRouter()
+
+
+# API-key connector types (everything that isn't the custom OpenAI-compatible
+# endpoint). Gated by the single ``llm_apikey_connectors_enabled`` flag, mirroring
+# ``_check_connector_type_allowed`` below. Sorted for a deterministic response.
+_APIKEY_CONNECTOR_TYPES: tuple[str, ...] = tuple(
+    sorted(VALID_CONNECTOR_TYPES - {CONNECTOR_TYPE_OPENAI_COMPATIBLE})
+)
+
+
+def _allowed_connector_types(*, apikey_enabled: bool, compatible_enabled: bool) -> list[str]:
+    """Compute the connector types a DJ may create under the given policy.
+
+    Kept consistent with ``_check_connector_type_allowed`` so the advertised set
+    exactly matches what the create endpoint will accept (no UX/enforcement drift).
+    """
+    allowed: list[str] = []
+    if apikey_enabled:
+        allowed.extend(_APIKEY_CONNECTOR_TYPES)
+    if compatible_enabled:
+        allowed.append(CONNECTOR_TYPE_OPENAI_COMPATIBLE)
+    return allowed
+
+
+def _check_connector_type_allowed(db: Session, connector_type: str) -> None:
+    """Enforce the admin policy toggles. Raises 403 when blocked."""
+    settings = get_system_settings(db)
+    if connector_type == CONNECTOR_TYPE_OPENAI_COMPATIBLE:
+        if not settings.llm_compatible_connector_enabled:
+            raise HTTPException(
+                status_code=403,
+                detail="Custom OpenAI-compatible connectors are disabled by admin policy",
+            )
+    elif connector_type in VALID_CONNECTOR_TYPES:
+        if not settings.llm_apikey_connectors_enabled:
+            raise HTTPException(
+                status_code=403,
+                detail="API-key connectors are disabled by admin policy",
+            )
+
+
+def _get_owned_connector_or_404(db: Session, connector_id: int, user_id: int) -> LlmConnector:
+    """Fetch a connector scoped to its owner, or raise 404.
+
+    Returns 404 (not 403) for IDs the DJ doesn't own so the existence of another
+    DJ's connectors is never leaked.
+    """
+    row = get_connector_for_user(db, connector_id, user_id)
+    if row is None:
+        raise HTTPException(status_code=404, detail="Connector not found")
+    return row
+
+
+def _audit_and_return(
+    db: Session, row: LlmConnector, *, actor_user_id: int, event_type: str
+) -> ConnectorOut:
+    """Shared write-side epilogue: audit row → commit → refresh → public view.
+
+    The create / rotate / set-default / unset-default endpoints all finish with
+    this identical sequence.
+    """
+    audit_event(db, actor_user_id=actor_user_id, target_connector_id=row.id, event_type=event_type)
+    db.commit()
+    db.refresh(row)
+    return ConnectorOut.model_validate(row)
+
+
+def _feature_prefs_response(db: Session, user_id: int) -> FeaturePreferencesListOut:
+    """Build the list response: the DJ's current pins + the pinnable catalogue."""
+    rows = get_feature_preferences_for_user(db, user_id)
+    return FeaturePreferencesListOut(
+        preferences=[FeaturePreferenceOut.model_validate(r) for r in rows],
+        known_features=list(KNOWN_FEATURE_VALUES),  # type: ignore[arg-type]
+    )
+
+
+def _raise_if_duplicate_label(exc: Exception) -> None:
+    """Translate the per-DJ (display_name, type) unique violation into a 409."""
+    if "uq_dj_connector_label" in str(exc):
+        raise HTTPException(
+            status_code=409,
+            detail="You already have a connector with that display name and type",
+        ) from exc
+
+
+@router.get("/connectors", response_model=list[ConnectorOut])
+@limiter.limit("60/minute")
+def list_connectors(
+    request: FastAPIRequest,
+    user: User = Depends(get_current_active_user),
+    db: Session = Depends(get_db),
+) -> list[ConnectorOut]:
+    rows = list_connectors_for_user(db, user.id)
+    return [ConnectorOut.model_validate(r) for r in rows]
+
+
+@router.get(
+    "/policy",
+    response_model=DjPolicyOut,
+    responses={
+        401: {"description": "Not authenticated (missing or invalid bearer token)."},
+        403: {"description": "Authenticated but not an active DJ (e.g. pending approval)."},
+    },
+)
+@limiter.limit("60/minute")
+def get_dj_policy(
+    request: FastAPIRequest,
+    _user: User = Depends(get_current_active_user),
+    db: Session = Depends(get_db),
+) -> DjPolicyOut:
+    """DJ-readable connector policy (non-sensitive subset).
+
+    The settings/ai page consumes this to fail *closed* — hiding connector
+    types the admin has disabled rather than showing every provider and only
+    discovering the block when the create call returns 403. Admin-only fields
+    (e.g. ``llm_default_connector_id``) are intentionally excluded.
+    """
+    settings = get_system_settings(db)
+    return DjPolicyOut(
+        llm_apikey_connectors_enabled=settings.llm_apikey_connectors_enabled,
+        llm_compatible_connector_enabled=settings.llm_compatible_connector_enabled,
+        allowed_connector_types=_allowed_connector_types(
+            apikey_enabled=settings.llm_apikey_connectors_enabled,
+            compatible_enabled=settings.llm_compatible_connector_enabled,
+        ),  # type: ignore[arg-type]
+    )
+
+
+@router.get("/openrouter/models", response_model=AIModelsResponse)
+@limiter.limit("30/minute")
+async def list_openrouter_models(
+    request: FastAPIRequest,
+    user: User = Depends(get_current_active_user),
+    db: Session = Depends(get_db),
+) -> AIModelsResponse:
+    """Return the OpenRouter model catalogue for the model-hint dropdown.
+
+    Served from a process-wide TTL cache (refreshed hourly). The OpenRouter
+    ``/models`` endpoint is public, so no connector credentials are required.
+    Returns an empty list if the catalogue is unavailable — the frontend then
+    falls back to a free-text model input.
+    """
+    models = await get_openrouter_models()
+    return AIModelsResponse(models=models)
+
+
+@router.post("/connectors", response_model=ConnectorOut, status_code=201)
+@limiter.limit("5/minute")
+def create_connector_endpoint(
+    request: FastAPIRequest,
+    payload: ConnectorCreate,
+    user: User = Depends(get_current_active_user),
+    db: Session = Depends(get_db),
+) -> ConnectorOut:
+    _check_connector_type_allowed(db, payload.connector_type)
+
+    try:
+        built = build_create_payload(
+            connector_type=payload.connector_type,
+            display_name=payload.display_name,
+            api_key=payload.api_key,
+            base_url=payload.base_url,
+            bearer=payload.bearer,
+            model_hint=payload.model_hint,
+            aws_access_key_id=payload.aws_access_key_id,
+            aws_secret_access_key=payload.aws_secret_access_key,
+            aws_region=payload.aws_region,
+            aws_model_id=payload.aws_model_id,
+            azure_resource_name=payload.azure_resource_name,
+            azure_deployment_name=payload.azure_deployment_name,
+            azure_api_version=payload.azure_api_version,
+        )
+    except ValueError as exc:
+        raise HTTPException(status_code=400, detail=str(exc)) from exc
+
+    try:
+        row = create_connector(db, user_id=user.id, payload=built)
+    except Exception as exc:  # likely a UniqueConstraint collision
+        db.rollback()
+        _raise_if_duplicate_label(exc)
+        logger.exception("Failed to create LLM connector")
+        raise HTTPException(status_code=500, detail="Failed to create connector") from exc
+
+    return _audit_and_return(db, row, actor_user_id=user.id, event_type=AUDIT_CREATED)
+
+
+@router.patch("/connectors/{connector_id}", response_model=ConnectorOut)
+@limiter.limit("30/minute")
+def update_connector_metadata(
+    request: FastAPIRequest,
+    connector_id: int,
+    payload: ConnectorPatch,
+    user: User = Depends(get_current_active_user),
+    db: Session = Depends(get_db),
+) -> ConnectorOut:
+    row = _get_owned_connector_or_404(db, connector_id, user.id)
+
+    try:
+        update_metadata(row, display_name=payload.display_name, model_hint=payload.model_hint)
+    except ValueError as exc:
+        raise HTTPException(status_code=400, detail=str(exc)) from exc
+
+    try:
+        db.commit()
+    except Exception as exc:  # likely a UniqueConstraint collision on rename
+        db.rollback()
+        _raise_if_duplicate_label(exc)
+        logger.exception("Failed to update LLM connector metadata")
+        raise HTTPException(status_code=500, detail="Failed to update connector metadata") from exc
+    db.refresh(row)
+    return ConnectorOut.model_validate(row)
+
+
+@router.put("/connectors/{connector_id}/credentials", response_model=ConnectorOut)
+@limiter.limit("5/minute")
+def rotate_connector_credentials(
+    request: FastAPIRequest,
+    connector_id: int,
+    payload: ConnectorCredentialsRotate,
+    user: User = Depends(get_current_active_user),
+    db: Session = Depends(get_db),
+) -> ConnectorOut:
+    row = _get_owned_connector_or_404(db, connector_id, user.id)
+
+    try:
+        rotate_credentials(
+            db,
+            connector=row,
+            api_key=payload.api_key,
+            base_url=payload.base_url,
+            bearer=payload.bearer,
+            aws_access_key_id=payload.aws_access_key_id,
+            aws_secret_access_key=payload.aws_secret_access_key,
+            aws_region=payload.aws_region,
+            aws_model_id=payload.aws_model_id,
+            azure_resource_name=payload.azure_resource_name,
+            azure_deployment_name=payload.azure_deployment_name,
+            azure_api_version=payload.azure_api_version,
+        )
+    except ValueError as exc:
+        raise HTTPException(status_code=400, detail=str(exc)) from exc
+
+    return _audit_and_return(db, row, actor_user_id=user.id, event_type=AUDIT_CREDENTIALS_ROTATED)
+
+
+@router.post("/connectors/{connector_id}/test", response_model=ConnectorTestResult)
+@limiter.limit("10/minute")
+async def test_connector(
+    request: FastAPIRequest,
+    connector_id: int,
+    user: User = Depends(get_current_active_user),
+    db: Session = Depends(get_db),
+) -> ConnectorTestResult:
+    """Run a health check and return a sanitised result.
+
+    Behaviour identical to the background monitor (issue #340), so the
+    ``last_health_check_at`` / ``last_health_check_status`` columns and audit
+    rows are written the same way on every invocation regardless of trigger
+    source. See ``services/llm/health_check.py`` for the shared helper.
+    """
+    from app.services.llm.health_check import run_health_check
+
+    row = _get_owned_connector_or_404(db, connector_id, user.id)
+
+    outcome = await run_health_check(db, row, actor_user_id=user.id)
+    db.commit()
+
+    if outcome.ok:
+        return ConnectorTestResult(ok=True)
+    # Reuse the same code → message mapping the gateway uses for transient
+    # errors. The helper has already sanitised any upstream payload.
+    message = {
+        "auth_invalid": "Authentication failed against the provider",
+        "rate_limited": "Provider rate limited the request",
+        "quota_exceeded": "Provider quota or billing failure",
+        "provider_unavailable": "Provider unreachable or timed out",
+        "error": "Unknown error",
+    }.get(outcome.status, "Unknown error")
+    return ConnectorTestResult(
+        ok=False,
+        error_code=outcome.error_code or outcome.status,
+        message=message,
+    )
+
+
+# A short, fixed prompt for the streaming health probe. Streams a single
+# sentence so the DJ sees tokens arrive in real time, exercising the full
+# resolve → adapter.stream → SSE path end-to-end.
+_STREAM_TEST_PROMPT = "Reply with one short friendly sentence confirming you are online."
+
+
+@router.post("/connectors/{connector_id}/stream-test")
+@limiter.limit("10/minute")
+async def stream_test_connector(
+    request: FastAPIRequest,
+    connector_id: int,
+    user: User = Depends(get_current_active_user),
+    db: Session = Depends(get_db),
+) -> EventSourceResponse:
+    """Stream a short sentence through the connector as ``text/event-stream``.
+
+    Validates ownership up front (404 for connectors the DJ doesn't own — never
+    leaks existence). Each SSE ``data:`` frame is a JSON ``ChatResponseChunk``.
+    On a typed gateway error an ``event: error`` frame is emitted carrying only a
+    sanitised code (never the upstream payload), then the stream ends. Client
+    disconnect cancels the upstream provider request — the gateway generator's
+    ``finally`` writes the counts-only call log and closes the adapter.
+
+    Unlike the public guest SSE stream (``api/sse.py``), this endpoint is
+    authenticated, rate-limited (10/min), and strictly bounded (max 64 output
+    tokens), so it holds the request-scoped DB session for the brief stream
+    lifetime rather than opening a detached ``SessionLocal`` — the pool-pinning
+    concern that drove ``api/sse.py``'s pattern applies to unauthenticated,
+    indefinitely-open guest connections, not a short admin health probe.
+    """
+    row = _get_owned_connector_or_404(db, connector_id, user.id)
+
+    chat_request = LlmChatRequest(
+        messages=[LlmMessage(role="user", content=_STREAM_TEST_PROMPT)],
+        max_tokens=64,
+        temperature=0.0,
+        model=row.model_hint or None,
+    )
+
+    async def _publisher():
+        try:
+            async for chunk in Gateway.stream(db, user, chat_request, purpose="stream_test"):
+                yield {"data": _json.dumps(chunk.model_dump())}
+        except NoLlmConfigured:
+            yield {"event": "error", "data": _json.dumps({"code": "no_connector"})}
+        except LlmError as exc:
+            # Map to a sanitised, stable code — never echo the provider message.
+            code = type(exc).__name__
+            logger.info("stream-test failed for connector %s: %s", connector_id, code)
+            yield {"event": "error", "data": _json.dumps({"code": code})}
+
+    return EventSourceResponse(
+        _publisher(),
+        media_type="text/event-stream",
+        headers={"X-Accel-Buffering": "no"},
+    )
+
+
+@router.post(
+    "/connectors/{connector_id}/default",
+    response_model=ConnectorOut,
+    responses={
+        400: {"description": "Connector cannot be set as default (e.g. disabled or auth_invalid)."},
+        404: {"description": "Connector not found for current user."},
+    },
+)
+@limiter.limit("30/minute")
+def set_connector_as_default(
+    request: FastAPIRequest,
+    connector_id: int,
+    user: User = Depends(get_current_active_user),
+    db: Session = Depends(get_db),
+) -> ConnectorOut:
+    """Pin this connector as the DJ's explicit default (issue #336).
+
+    Atomically clears any other defaults the DJ owns before flipping this row,
+    so the partial unique index never sees two True rows for the same user.
+
+    Setting a disabled / auth_invalid connector as default is rejected with 400
+    so DJs don't silently break their own routing — a default that the gateway
+    would skip anyway is a footgun.
+    """
+    row = _get_owned_connector_or_404(db, connector_id, user.id)
+    if row.status != "active":
+        raise HTTPException(
+            status_code=400,
+            detail="Only an active connector can be set as default",
+        )
+
+    try:
+        set_default_for_user(db, connector=row)
+    except Exception as exc:
+        db.rollback()
+        logger.exception("Failed to set LLM connector as default")
+        raise HTTPException(status_code=500, detail="Failed to set default") from exc
+
+    return _audit_and_return(db, row, actor_user_id=user.id, event_type=AUDIT_DEFAULT_SET)
+
+
+@router.delete(
+    "/connectors/{connector_id}/default",
+    response_model=ConnectorOut,
+    responses={
+        404: {"description": "Connector not found for current user."},
+    },
+)
+@limiter.limit("30/minute")
+def unset_connector_as_default(
+    request: FastAPIRequest,
+    connector_id: int,
+    user: User = Depends(get_current_active_user),
+    db: Session = Depends(get_db),
+) -> ConnectorOut:
+    """Clear the explicit default — gateway resolution falls back to MRU."""
+    row = _get_owned_connector_or_404(db, connector_id, user.id)
+
+    # No-op fast path: don't write an audit row if nothing changed.
+    if not row.is_default:
+        return ConnectorOut.model_validate(row)
+
+    unset_default_for_user(db, connector=row)
+    return _audit_and_return(db, row, actor_user_id=user.id, event_type=AUDIT_DEFAULT_UNSET)
+
+
+@router.get("/feature-preferences", response_model=FeaturePreferencesListOut)
+@limiter.limit("60/minute")
+def list_feature_preferences(
+    request: FastAPIRequest,
+    user: User = Depends(get_current_active_user),
+    db: Session = Depends(get_db),
+) -> FeaturePreferencesListOut:
+    """List the DJ's per-feature connector pins (issue #337)."""
+    return _feature_prefs_response(db, user.id)
+
+
+@router.post(
+    "/feature-preferences",
+    response_model=FeaturePreferencesListOut,
+    responses={
+        400: {"description": "Connector is not active and cannot be pinned."},
+        404: {"description": "Connector not found for current user."},
+    },
+)
+@limiter.limit("30/minute")
+def set_feature_preference_endpoint(
+    request: FastAPIRequest,
+    payload: FeaturePreferenceSet,
+    user: User = Depends(get_current_active_user),
+    db: Session = Depends(get_db),
+) -> FeaturePreferencesListOut:
+    """Pin (or re-pin) a connector to a feature for the current DJ.
+
+    Validates connector ownership server-side (404 for IDs the DJ doesn't own,
+    so another DJ's connector existence is never leaked) and rejects pinning a
+    non-active connector (400) — the gateway would skip it anyway, so silently
+    accepting it is a footgun.
+    """
+    row = _get_owned_connector_or_404(db, payload.connector_id, user.id)
+    if row.status != "active":
+        raise HTTPException(
+            status_code=400,
+            detail="Only an active connector can be pinned to a feature",
+        )
+    set_feature_preference(db, user_id=user.id, feature=payload.feature, connector_id=row.id)
+    db.commit()
+    return _feature_prefs_response(db, user.id)
+
+
+@router.delete("/feature-preferences/{feature}", response_model=FeaturePreferencesListOut)
+@limiter.limit("30/minute")
+def clear_feature_preference_endpoint(
+    request: FastAPIRequest,
+    feature: FeatureKey,
+    user: User = Depends(get_current_active_user),
+    db: Session = Depends(get_db),
+) -> FeaturePreferencesListOut:
+    """Clear the DJ's pin for ``feature`` (no-op if unset). Returns the new list."""
+    clear_feature_preference(db, user_id=user.id, feature=feature)
+    db.commit()
+    return _feature_prefs_response(db, user.id)
+
+
+@router.delete("/connectors/{connector_id}", status_code=204)
+@limiter.limit("30/minute")
+def delete_connector_endpoint(
+    request: FastAPIRequest,
+    connector_id: int,
+    user: User = Depends(get_current_active_user),
+    db: Session = Depends(get_db),
+) -> None:
+    row = _get_owned_connector_or_404(db, connector_id, user.id)
+    audit_event(
+        db,
+        actor_user_id=user.id,
+        target_connector_id=row.id,
+        event_type=AUDIT_DELETED,
+    )
+    # If this connector is the system default, clear it before deletion to
+    # mirror the admin revoke path (and to be correct on SQLite, where the FK
+    # ON DELETE SET NULL may not fire).
+    settings = get_system_settings(db)
+    if settings.llm_default_connector_id == row.id:
+        settings.llm_default_connector_id = None
+    delete_connector(db, row)
+    db.commit()
+    return None
diff --git a/server/app/api/sse.py b/server/app/api/sse.py
index e493344b..ca4a4ecf 100644
--- a/server/app/api/sse.py
+++ b/server/app/api/sse.py
@@ -5,12 +5,11 @@
 import logging
 from typing import Any
 
-from fastapi import APIRouter, Depends, HTTPException, Request
-from sqlalchemy.orm import Session
+from fastapi import APIRouter, HTTPException, Request
 from sse_starlette.sse import EventSourceResponse
 
-from app.api.deps import get_db
 from app.core.rate_limit import limiter
+from app.db.session import SessionLocal
 from app.services.event import EventLookupResult, get_event_by_public_code_with_status
 from app.services.event_bus import get_event_bus
 
@@ -29,6 +28,11 @@ async def _event_generator(
     Keepalive pings are handled by sse-starlette's built-in ping task (every 15s).
     This generator only yields actual events. The timeout on queue.get() lets us
     periodically check for client disconnect without blocking forever.
+
+    NOTE (issue #356): this generator deliberately holds NO DB session. If a
+    future change needs per-tick DB access it MUST open its own short-lived
+    ``with SessionLocal() as s:`` session per tick and close it before awaiting
+    again — never hold a pooled connection across the stream lifetime.
     """
     bus = get_event_bus()
     queue = bus.subscribe(event_code)
@@ -54,7 +58,6 @@ async def _event_generator(
 async def event_stream(
     code: str,
     request: Request,
-    db: Session = Depends(get_db),
 ) -> EventSourceResponse:
     """Public SSE endpoint for real-time event updates.
 
@@ -63,6 +66,14 @@ async def event_stream(
     unauthenticated DoS (unlimited long-lived connections exhausting FDs)
     and passive eavesdropping via 6-char event-code brute force.
 
+    POOL SAFETY (issue #356): the one-shot existence/auth check runs inside a
+    short-lived ``with SessionLocal()`` block whose pooled connection is
+    returned BEFORE the EventSourceResponse is returned. An EventSource
+    connection can stay open indefinitely, so we must NOT hold a
+    request-scoped ``get_db`` session across the stream lifetime — doing so
+    pinned one pooled connection per open stream and exhausted the QueuePool
+    (size 5 + overflow 10 = 15 connections) under modest guest load.
+
     Event types:
     - request_created: New request submitted
     - request_status_changed: Request status update
@@ -70,16 +81,18 @@ async def event_stream(
     - requests_bulk_update: Batch accept/reject
     - bridge_status_changed: Bridge connect/disconnect
     """
-    event, result = get_event_by_public_code_with_status(db, code)
-    if result == EventLookupResult.NOT_FOUND:
-        raise HTTPException(status_code=404, detail="Event not found")
-    if result == EventLookupResult.ARCHIVED:
-        raise HTTPException(status_code=410, detail="Event has been archived")
-    if result == EventLookupResult.EXPIRED:
-        raise HTTPException(status_code=410, detail="Event has expired")
+    with SessionLocal() as db:
+        event, result = get_event_by_public_code_with_status(db, code)
+        if result == EventLookupResult.NOT_FOUND:
+            raise HTTPException(status_code=404, detail="Event not found")
+        if result == EventLookupResult.ARCHIVED:
+            raise HTTPException(status_code=410, detail="Event has been archived")
+        if result == EventLookupResult.EXPIRED:
+            raise HTTPException(status_code=410, detail="Event has expired")
+        event_code = event.code
 
     return EventSourceResponse(
-        _event_generator(request, event.code),
+        _event_generator(request, event_code),
         media_type="text/event-stream",
         headers={"X-Accel-Buffering": "no"},
     )
diff --git a/server/app/core/config.py b/server/app/core/config.py
index 3a49afcb..52707689 100644
--- a/server/app/core/config.py
+++ b/server/app/core/config.py
@@ -128,11 +128,15 @@ def is_lockout_enabled(self) -> bool:
     # ListenBrainz API (artist discovery for recommendations)
     listenbrainz_user_token: str = ""
 
-    # Anthropic API (LLM-powered recommendations)
+    # Anthropic API (LLM-powered recommendations).
+    # NOTE: credentials live in the LLM Gateway connector system (the source of
+    # truth since the MVP). These two fields remain only for admin observability
+    # of the legacy key (admin AI-settings/model-listing endpoints) and as the
+    # default model-name label on recommendation responses. The legacy env-var
+    # *fallback* in the recommendation engine was removed in #343, along with the
+    # now-unused ANTHROPIC_MAX_TOKENS / ANTHROPIC_TIMEOUT_SECONDS settings.
     anthropic_api_key: str = ""
     anthropic_model: str = "claude-haiku-4-5-20251001"
-    anthropic_max_tokens: int = 1024
-    anthropic_timeout_seconds: int = 15
 
     # Cache durations (1 hour for Spotify since popularity changes)
     search_cache_hours: int = 1
diff --git a/server/app/core/csv_safe.py b/server/app/core/csv_safe.py
new file mode 100644
index 00000000..782c4e9b
--- /dev/null
+++ b/server/app/core/csv_safe.py
@@ -0,0 +1,25 @@
+"""CSV safety helpers shared across all CSV exports.
+
+The stdlib ``csv`` module handles RFC 4180 quoting/escaping but does NOT defend
+against spreadsheet *formula injection* (a.k.a. CSV injection) — that is an
+application-layer concern, so it lives here as a single shared primitive rather
+than being re-implemented per endpoint.
+"""
+
+_FORMULA_PREFIXES = ("=", "+", "-", "@", " ", "\t", "\r", "\n")
+
+
+def sanitize_csv_value(value: str | None) -> str:
+    """Neutralize CSV/spreadsheet formula injection.
+
+    Spreadsheet apps (Excel, Google Sheets, LibreOffice) interpret cells starting
+    with ``=``, ``+``, ``-``, ``@``, space, tab, CR, or LF as formulas (leading
+    whitespace/control chars can be stripped on import, exposing a trailing formula), which can
+    be exploited when an exported file is opened. Prefixing such a cell with a single
+    quote forces it to render as literal text.
+    """
+    if not value:
+        return ""
+    if value[0] in _FORMULA_PREFIXES:
+        return "'" + value
+    return value
diff --git a/server/app/main.py b/server/app/main.py
index f894108f..c3fae23a 100644
--- a/server/app/main.py
+++ b/server/app/main.py
@@ -30,6 +30,42 @@
 CORS_ALLOW_METHODS = ["GET", "POST", "PUT", "PATCH", "DELETE", "OPTIONS"]
 
 TIDAL_COLLECTION_POLL_INTERVAL_SECONDS = 300  # 5 minutes
+LLM_CALL_LOG_CLEANUP_INTERVAL_SECONDS = 86400  # 24 hours
+
+
+def _run_llm_call_log_cleanup() -> None:
+    """Synchronous daily cleanup of expired llm_call_log rows.
+
+    Reads ``llm_call_log_retention_days`` from system settings each run, so an
+    admin change to the retention window takes effect on the next pass (within
+    24h) without a restart. Executed in a thread to avoid blocking the loop.
+    """
+    from app.db.session import SessionLocal
+    from app.services.llm.connector_storage import purge_call_log_older_than
+    from app.services.system_settings import get_system_settings
+
+    db = SessionLocal()
+    try:
+        retention_days = get_system_settings(db).llm_call_log_retention_days
+        deleted = purge_call_log_older_than(db, retention_days=retention_days)
+        db.commit()
+        if deleted:
+            logger.info(
+                "llm_call_log cleanup deleted %s rows older than %s days",
+                deleted,
+                retention_days,
+            )
+    finally:
+        db.close()
+
+
+async def _llm_call_log_cleanup_loop() -> None:
+    while True:
+        try:
+            await asyncio.to_thread(_run_llm_call_log_cleanup)
+        except Exception:
+            logger.exception("llm_call_log cleanup loop error")
+        await asyncio.sleep(LLM_CALL_LOG_CLEANUP_INTERVAL_SECONDS)
 
 
 def _run_tidal_collection_poll() -> None:
@@ -74,13 +110,23 @@ async def lifespan(app: FastAPI):
         lg = logging.getLogger(name)
         lg.handlers.clear()
         lg.propagate = True
-    task = asyncio.create_task(_tidal_collection_poll_loop())
+    # Import lazily so test runs that mock out the loop module don't trigger
+    # adapter imports at startup-time.
+    from app.services.llm.health_monitor import health_monitor_loop
+
+    tasks = [
+        asyncio.create_task(_tidal_collection_poll_loop()),
+        asyncio.create_task(_llm_call_log_cleanup_loop()),
+        asyncio.create_task(health_monitor_loop()),
+    ]
     try:
         yield
     finally:
-        task.cancel()
-        with contextlib.suppress(asyncio.CancelledError):
-            await task
+        for task in tasks:
+            task.cancel()
+        for task in tasks:
+            with contextlib.suppress(asyncio.CancelledError):
+                await task
 
 
 app = FastAPI(
diff --git a/server/app/models/__init__.py b/server/app/models/__init__.py
index 6d3df398..591ad611 100644
--- a/server/app/models/__init__.py
+++ b/server/app/models/__init__.py
@@ -5,6 +5,8 @@
 from app.models.guest import Guest
 from app.models.guest_profile import GuestProfile  # noqa: F401
 from app.models.kiosk import Kiosk
+from app.models.llm_connector import LlmAuditEvent, LlmCallLog, LlmConnector
+from app.models.llm_feature_preference import LlmFeaturePreference
 from app.models.mb_artist_cache import MbArtistCache
 from app.models.now_playing import NowPlaying
 from app.models.pending_email_change import PendingEmailChange
@@ -25,6 +27,10 @@
     "Guest",
     "GuestProfile",
     "Kiosk",
+    "LlmAuditEvent",
+    "LlmCallLog",
+    "LlmConnector",
+    "LlmFeaturePreference",
     "MbArtistCache",
     "NowPlaying",
     "PendingEmailChange",
diff --git a/server/app/models/llm_connector.py b/server/app/models/llm_connector.py
new file mode 100644
index 00000000..766dd1df
--- /dev/null
+++ b/server/app/models/llm_connector.py
@@ -0,0 +1,229 @@
+"""LLM connector models — provider-agnostic credential storage and audit trail.
+
+Tables:
+- llm_connectors: per-DJ LLM provider credentials (encrypted at rest)
+- llm_call_log: per-call telemetry (counts only — no prompt/completion content)
+- llm_audit_event: security-relevant credential lifecycle events
+
+See docs/superpowers/specs/2026-05-24-admin-ai-oauth-design.md §4.2.
+"""
+
+from datetime import datetime
+
+from sqlalchemy import (
+    Boolean,
+    CheckConstraint,
+    DateTime,
+    ForeignKey,
+    Index,
+    Integer,
+    String,
+    UniqueConstraint,
+    func,
+    text,
+)
+from sqlalchemy.orm import Mapped, mapped_column
+
+from app.core.encryption import EncryptedText
+from app.models.base import Base
+
+# Valid connector types — keep in sync with services/llm/registry.py
+CONNECTOR_TYPE_OPENAI_APIKEY = "openai_apikey"
+CONNECTOR_TYPE_ANTHROPIC_APIKEY = "anthropic_apikey"
+CONNECTOR_TYPE_OPENAI_COMPATIBLE = "openai_compatible"
+CONNECTOR_TYPE_GEMINI_APIKEY = "gemini_apikey"
+CONNECTOR_TYPE_AZURE_OPENAI = "azure_openai"
+CONNECTOR_TYPE_BEDROCK = "bedrock"
+CONNECTOR_TYPE_OPENROUTER_APIKEY = "openrouter_apikey"
+CONNECTOR_TYPE_XAI_APIKEY = "xai_apikey"
+
+VALID_CONNECTOR_TYPES = frozenset(
+    {
+        CONNECTOR_TYPE_OPENAI_APIKEY,
+        CONNECTOR_TYPE_ANTHROPIC_APIKEY,
+        CONNECTOR_TYPE_OPENAI_COMPATIBLE,
+        CONNECTOR_TYPE_GEMINI_APIKEY,
+        CONNECTOR_TYPE_AZURE_OPENAI,
+        CONNECTOR_TYPE_BEDROCK,
+        CONNECTOR_TYPE_OPENROUTER_APIKEY,
+        CONNECTOR_TYPE_XAI_APIKEY,
+    }
+)
+
+# Connector statuses
+STATUS_ACTIVE = "active"
+STATUS_AUTH_INVALID = "auth_invalid"
+STATUS_DISABLED = "disabled"
+
+# Health-check status values written to ``last_health_check_status``. Kept here
+# so the API/background loop/admin UI all use the same vocabulary. These are
+# *outcomes*, not connector statuses — a single connector accumulates many
+# health-check rows over its lifetime; only the most recent outcome is stored
+# on the row itself (audit_event rows preserve the full history).
+HEALTH_CHECK_OK = "ok"
+HEALTH_CHECK_AUTH_INVALID = "auth_invalid"
+HEALTH_CHECK_RATE_LIMITED = "rate_limited"
+HEALTH_CHECK_QUOTA_EXCEEDED = "quota_exceeded"
+HEALTH_CHECK_PROVIDER_UNAVAILABLE = "provider_unavailable"
+HEALTH_CHECK_ERROR = "error"
+
+VALID_HEALTH_CHECK_STATUSES = frozenset(
+    {
+        HEALTH_CHECK_OK,
+        HEALTH_CHECK_AUTH_INVALID,
+        HEALTH_CHECK_RATE_LIMITED,
+        HEALTH_CHECK_QUOTA_EXCEEDED,
+        HEALTH_CHECK_PROVIDER_UNAVAILABLE,
+        HEALTH_CHECK_ERROR,
+    }
+)
+
+# Audit event types
+AUDIT_CREATED = "connector_created"
+AUDIT_CREDENTIALS_ROTATED = "connector_credentials_rotated"
+AUDIT_DELETED = "connector_deleted"
+AUDIT_REVOKED_BY_ADMIN = "connector_revoked_by_admin"
+AUDIT_AUTH_INVALID_OBSERVED = "auth_invalid_observed"
+AUDIT_POLICY_CHANGED = "policy_changed"
+AUDIT_HEALTH_CHECK = "connector_health_check"
+AUDIT_DEFAULT_SET = "connector_default_set"
+AUDIT_DEFAULT_UNSET = "connector_default_unset"
+# Emitted by the background monitor when a periodic health check flips a
+# previously-active connector into ``auth_invalid``. Distinct from
+# ``AUDIT_HEALTH_CHECK`` (which is fired on EVERY check, OK or not) so admins
+# can filter to the credential-lifecycle subset.
+AUDIT_HEALTH_CHECK_FAILED = "connector_health_check_failed"
+
+
+class LlmConnector(Base):
+    """Per-DJ LLM provider credentials.
+
+    `credentials` is a JSON string encrypted via Fernet. Shape varies by type:
+    - openai_apikey / anthropic_apikey / openrouter_apikey: {"api_key": "..."}
+    - openai_compatible: {"base_url": "...", "bearer": "..." | null}
+    - azure_openai: {"api_key": "...", "azure_resource_name": "...",
+      "azure_deployment_name": "...", "azure_api_version": "..."}
+    - bedrock: {"aws_access_key_id": "...", "aws_secret_access_key": "...",
+      "aws_region": "...", "aws_model_id": "..."}
+
+    `base_url_plain` mirrors the openai_compatible base_url in plaintext so admin
+    listing can render without decrypting. Contains no credentials.
+    """
+
+    __tablename__ = "llm_connectors"
+
+    id: Mapped[int] = mapped_column(Integer, primary_key=True)
+    user_id: Mapped[int] = mapped_column(
+        ForeignKey("users.id", ondelete="CASCADE"), index=True, nullable=False
+    )
+    connector_type: Mapped[str] = mapped_column(String(40), index=True, nullable=False)
+    display_name: Mapped[str] = mapped_column(String(80), nullable=False)
+    status: Mapped[str] = mapped_column(
+        String(20), nullable=False, default=STATUS_ACTIVE, server_default=STATUS_ACTIVE
+    )
+    credentials: Mapped[str] = mapped_column(EncryptedText, nullable=False)
+
+    base_url_plain: Mapped[str | None] = mapped_column(String(255), nullable=True)
+    model_hint: Mapped[str | None] = mapped_column(String(80), nullable=True)
+
+    created_at: Mapped[datetime] = mapped_column(
+        DateTime, nullable=False, server_default=func.now()
+    )
+    updated_at: Mapped[datetime] = mapped_column(
+        DateTime, nullable=False, server_default=func.now(), onupdate=func.now()
+    )
+    last_used_at: Mapped[datetime | None] = mapped_column(DateTime, nullable=True)
+    last_error: Mapped[str | None] = mapped_column(String(255), nullable=True)
+
+    # Per-DJ explicit default. At most one connector per user_id may have
+    # is_default=True — enforced at the DB layer via a partial unique index
+    # (Postgres) and at the service layer via clear-then-set semantics. When
+    # set, the gateway prefers this connector over the MRU heuristic. See
+    # issue #336.
+    is_default: Mapped[bool] = mapped_column(
+        Boolean,
+        nullable=False,
+        default=False,
+        server_default=text("false"),
+    )
+
+    # Health-check observability (issue #346 + #340).
+    # ``last_health_check_at`` is written by every health-check invocation —
+    # the DJ-triggered Test button AND the background monitor. ``last_health_check_status``
+    # records the outcome (see HEALTH_CHECK_* constants).
+    last_health_check_at: Mapped[datetime | None] = mapped_column(DateTime, nullable=True)
+    last_health_check_status: Mapped[str | None] = mapped_column(String(20), nullable=True)
+
+    # Admin-set monthly token cap (issue #339). NULL = unlimited. When set, the
+    # gateway refuses dispatch once the current calendar month's summed
+    # tokens_in + tokens_out for this connector meets or exceeds the cap. The
+    # cap is admin-only (set via /api/admin/llm/connectors/{id}/cap) and is
+    # checked PRE-FLIGHT only — editing it never disrupts an in-flight call.
+    monthly_token_cap: Mapped[int | None] = mapped_column(Integer, nullable=True)
+
+    __table_args__ = (
+        UniqueConstraint("user_id", "connector_type", "display_name", name="uq_dj_connector_label"),
+        # A negative cap would make the connector permanently "over budget". The
+        # API schema (ge=0) and service layer already reject negatives; this DB
+        # CHECK is the defence-in-depth backstop so a bad write can never persist.
+        CheckConstraint(
+            "monthly_token_cap IS NULL OR monthly_token_cap >= 0",
+            name="ck_llm_connectors_monthly_token_cap_nonnegative",
+        ),
+        Index("ix_user_active", "user_id", "status"),
+        # Partial unique index — only enforced on Postgres. SQLite ignores
+        # the postgresql_where clause but still creates an unfiltered index;
+        # since the service layer clears siblings before flipping a row to
+        # True, that is harmless. The migration uses the same clause so the
+        # CI ``alembic check`` step stays clean on Postgres.
+        Index(
+            "ix_llm_connectors_user_default_unique",
+            "user_id",
+            unique=True,
+            postgresql_where=text("is_default"),
+            sqlite_where=text("is_default"),
+        ),
+    )
+
+
+class LlmCallLog(Base):
+    """Per-call telemetry — counts only, never prompt/completion content.
+
+    30-day retention is the default; daily cleanup deletes older rows.
+    """
+
+    __tablename__ = "llm_call_log"
+
+    id: Mapped[int] = mapped_column(Integer, primary_key=True)
+    connector_id: Mapped[int] = mapped_column(
+        ForeignKey("llm_connectors.id", ondelete="CASCADE"), index=True, nullable=False
+    )
+    purpose: Mapped[str] = mapped_column(String(40), index=True, nullable=False)
+    status: Mapped[str] = mapped_column(String(20), nullable=False)
+    latency_ms: Mapped[int] = mapped_column(Integer, nullable=False)
+    tokens_in: Mapped[int | None] = mapped_column(Integer, nullable=True)
+    tokens_out: Mapped[int | None] = mapped_column(Integer, nullable=True)
+    error_code: Mapped[str | None] = mapped_column(String(60), nullable=True)
+    created_at: Mapped[datetime] = mapped_column(
+        DateTime, nullable=False, server_default=func.now(), index=True
+    )
+
+
+class LlmAuditEvent(Base):
+    """Security-relevant connector lifecycle events.
+
+    Indefinite retention (no auto-cleanup). Includes admin-triggered events
+    so org operators have a complete audit trail for security reviews.
+    """
+
+    __tablename__ = "llm_audit_event"
+
+    id: Mapped[int] = mapped_column(Integer, primary_key=True)
+    actor_user_id: Mapped[int] = mapped_column(ForeignKey("users.id"), index=True, nullable=False)
+    target_connector_id: Mapped[int | None] = mapped_column(
+        ForeignKey("llm_connectors.id", ondelete="SET NULL"), nullable=True
+    )
+    event_type: Mapped[str] = mapped_column(String(60), index=True, nullable=False)
+    created_at: Mapped[datetime] = mapped_column(
+        DateTime, nullable=False, server_default=func.now()
+    )
diff --git a/server/app/models/llm_feature_preference.py b/server/app/models/llm_feature_preference.py
new file mode 100644
index 00000000..e1cd593a
--- /dev/null
+++ b/server/app/models/llm_feature_preference.py
@@ -0,0 +1,49 @@
+"""Per-feature connector preference — pins a DJ's connector to a feature.
+
+A DJ can pin the recommendation engine to one connector and the set-builder
+to another. The gateway consults this table first (keyed by ``purpose``)
+before falling back to the per-DJ default / MRU / org-default chain.
+
+See issue #337, spec §11.8.
+"""
+
+from datetime import datetime
+
+from sqlalchemy import DateTime, ForeignKey, Integer, String, UniqueConstraint, func
+from sqlalchemy.orm import Mapped, mapped_column
+
+from app.models.base import Base
+
+# Allowlist of feature keys a DJ may pin. These mirror the gateway ``purpose``
+# strings. ``recommendation`` is the only purpose dispatched today;
+# ``set_builder`` is reserved for the upcoming set-builder feature (issue spec
+# §11.8). Validation of API input against this set lives in ``schemas/llm.py``
+# (the ``FeatureKey`` Literal must stay in sync — guarded by a test).
+KNOWN_FEATURES = frozenset({"recommendation", "set_builder"})
+
+
+class LlmFeaturePreference(Base):
+    """Maps ``(user_id, feature)`` to a pinned ``connector_id``.
+
+    At most one row per ``(user_id, feature)`` — enforced by a UNIQUE
+    constraint. Deleting the connector cascades (ON DELETE CASCADE) so a stale
+    preference never points at a missing connector.
+    """
+
+    __tablename__ = "llm_feature_preferences"
+
+    id: Mapped[int] = mapped_column(Integer, primary_key=True)
+    user_id: Mapped[int] = mapped_column(
+        ForeignKey("users.id", ondelete="CASCADE"), index=True, nullable=False
+    )
+    feature: Mapped[str] = mapped_column(String(40), nullable=False)
+    connector_id: Mapped[int] = mapped_column(
+        ForeignKey("llm_connectors.id", ondelete="CASCADE"), index=True, nullable=False
+    )
+    created_at: Mapped[datetime] = mapped_column(
+        DateTime, nullable=False, server_default=func.now()
+    )
+
+    __table_args__ = (
+        UniqueConstraint("user_id", "feature", name="uq_llm_feature_pref_user_feature"),
+    )
diff --git a/server/app/models/system_settings.py b/server/app/models/system_settings.py
index e9dfa022..bdb979fa 100644
--- a/server/app/models/system_settings.py
+++ b/server/app/models/system_settings.py
@@ -1,4 +1,4 @@
-from sqlalchemy import Boolean, Integer, String
+from sqlalchemy import Boolean, ForeignKey, Integer, String, text
 from sqlalchemy.orm import Mapped, mapped_column
 
 from app.models.base import Base
@@ -25,3 +25,23 @@ class SystemSettings(Base):
     llm_enabled: Mapped[bool] = mapped_column(Boolean, default=True)
     llm_model: Mapped[str] = mapped_column(String(100), default="claude-haiku-4-5-20251001")
     llm_rate_limit_per_minute: Mapped[int] = mapped_column(Integer, default=3)
+
+    # llm_call_log retention (days). Daily cleanup deletes rows older than this.
+    # Bounds (7..365) are enforced at the API level, not the DB.
+    llm_call_log_retention_days: Mapped[int] = mapped_column(
+        Integer, default=30, server_default=text("30")
+    )
+
+    # LLM gateway connector policy (admin-controlled)
+    # See docs/superpowers/specs/2026-05-24-admin-ai-oauth-design.md §4.2
+    llm_apikey_connectors_enabled: Mapped[bool] = mapped_column(
+        Boolean, default=True, server_default=text("true")
+    )
+    llm_compatible_connector_enabled: Mapped[bool] = mapped_column(
+        Boolean, default=True, server_default=text("true")
+    )
+    # Org-default connector — used when a system-context (no actor) LLM call is dispatched
+    # FK kept nullable; SET NULL on connector delete to avoid orphan references.
+    llm_default_connector_id: Mapped[int | None] = mapped_column(
+        ForeignKey("llm_connectors.id", ondelete="SET NULL"), nullable=True
+    )
diff --git a/server/app/schemas/llm.py b/server/app/schemas/llm.py
new file mode 100644
index 00000000..67dd0a75
--- /dev/null
+++ b/server/app/schemas/llm.py
@@ -0,0 +1,356 @@
+"""Pydantic schemas for the LLM gateway / connector API."""
+
+from __future__ import annotations
+
+from datetime import datetime
+from typing import Literal
+
+from pydantic import BaseModel, ConfigDict, Field, model_validator
+
+from app.models.llm_feature_preference import KNOWN_FEATURES
+
+# Feature keys a DJ may pin a connector to (issue #337). ``FeatureKey`` is the
+# static Literal used in the request/response schemas (so the OpenAPI spec
+# emits a proper enum and FastAPI rejects unknown values at the boundary).
+# ``KNOWN_FEATURE_VALUES`` is the sorted runtime tuple returned to the
+# frontend so the picker is deterministic. A test
+# (``test_feature_key_literal_matches_known_features``) guards that the Literal
+# and ``KNOWN_FEATURES`` never drift apart.
+FeatureKey = Literal["recommendation", "set_builder"]
+KNOWN_FEATURE_VALUES: tuple[str, ...] = tuple(sorted(KNOWN_FEATURES))
+
+ConnectorType = Literal[
+    "openai_apikey",
+    "anthropic_apikey",
+    "openai_compatible",
+    "openrouter_apikey",
+    "xai_apikey",
+    "bedrock",
+    "azure_openai",
+    "gemini_apikey",
+]
+ConnectorStatus = Literal["active", "auth_invalid", "disabled"]
+
+
+def _provided(value: str | None) -> bool:
+    """True only when ``value`` is a non-blank string.
+
+    Used by the credential validators so whitespace-only inputs (``"   "``) are
+    treated as missing rather than passing a bare truthiness check.
+    """
+    return isinstance(value, str) and value.strip() != ""
+
+
+HealthCheckStatus = Literal[
+    "ok",
+    "auth_invalid",
+    "rate_limited",
+    "quota_exceeded",
+    "provider_unavailable",
+    "error",
+]
+
+
+class ConnectorOut(BaseModel):
+    """Public-safe connector view — never includes the credential blob."""
+
+    model_config = ConfigDict(from_attributes=True)
+
+    id: int
+    user_id: int
+    connector_type: ConnectorType
+    display_name: str
+    status: ConnectorStatus
+    base_url_plain: str | None = None
+    model_hint: str | None = None
+    created_at: datetime
+    updated_at: datetime
+    last_used_at: datetime | None = None
+    last_error: str | None = None
+    # Per-DJ explicit default flag (issue #336). When True, the gateway pins
+    # routing to this connector for the owning DJ instead of falling back to
+    # most-recently-used resolution.
+    is_default: bool = False
+    # Health-check observability (issues #340 + #346).
+    last_health_check_at: datetime | None = None
+    last_health_check_status: HealthCheckStatus | None = None
+    # Admin-set monthly token cap (issue #339). None = unlimited.
+    monthly_token_cap: int | None = None
+
+
+class AdminConnectorOut(ConnectorOut):
+    """Admin view — adds the DJ's username for display."""
+
+    dj_username: str
+    # Current calendar-month token usage (tokens_in + tokens_out), so the admin
+    # UI can render a usage-vs-cap progress bar without a second round-trip
+    # (issue #339).
+    current_month_tokens: int = 0
+
+
+class ConnectorCreate(BaseModel):
+    """Provider-agnostic create payload.
+
+    Field requirements vary by ``connector_type``:
+
+    - ``openai_apikey`` / ``anthropic_apikey`` / ``openrouter_apikey`` /
+      ``xai_apikey`` / ``gemini_apikey``: ``api_key`` required; ``base_url``
+      and ``bearer`` are ignored.
+    - ``openai_compatible``: ``base_url`` required; ``bearer`` optional;
+      ``api_key`` is ignored.
+    - ``bedrock``: ``aws_access_key_id``, ``aws_secret_access_key``,
+      ``aws_region`` and ``aws_model_id`` required; other fields ignored.
+    - ``azure_openai``: ``api_key``, ``azure_resource_name``,
+      ``azure_deployment_name`` and ``azure_api_version`` all required.
+
+    The combination is enforced by :meth:`_require_credentials_for_type`.
+    See ``build_create_payload`` in ``services/llm/connector_storage.py``
+    for the full validation flow (including key shape checks).
+    """
+
+    connector_type: ConnectorType
+    display_name: str = Field(..., min_length=1, max_length=80)
+    model_hint: str | None = Field(default=None, max_length=80)
+
+    # Set for apikey types (and azure_openai)
+    api_key: str | None = Field(default=None, max_length=512)
+
+    # Set for openai_compatible
+    base_url: str | None = Field(default=None, max_length=512)
+    bearer: str | None = Field(default=None, max_length=512)
+
+    # Set for bedrock (AWS SigV4 — billed to the DJ's AWS account)
+    aws_access_key_id: str | None = Field(default=None, max_length=128)
+    aws_secret_access_key: str | None = Field(default=None, max_length=512)
+    aws_region: str | None = Field(default=None, max_length=64)
+    aws_model_id: str | None = Field(default=None, max_length=128)
+
+    # Set for azure_openai (stored in the encrypted credentials blob, not columns)
+    azure_resource_name: str | None = Field(default=None, max_length=120)
+    azure_deployment_name: str | None = Field(default=None, max_length=120)
+    azure_api_version: str | None = Field(default=None, max_length=40)
+
+    @model_validator(mode="after")
+    def _require_credentials_for_type(self) -> ConnectorCreate:
+        if self.connector_type in (
+            "openai_apikey",
+            "anthropic_apikey",
+            "openrouter_apikey",
+            "xai_apikey",
+            "gemini_apikey",
+        ):
+            if not _provided(self.api_key):
+                raise ValueError("api_key is required for API-key connectors")
+        elif self.connector_type == "openai_compatible":
+            if not _provided(self.base_url):
+                raise ValueError("base_url is required for openai_compatible connectors")
+        elif self.connector_type == "bedrock":
+            missing = [
+                name
+                for name, value in (
+                    ("aws_access_key_id", self.aws_access_key_id),
+                    ("aws_secret_access_key", self.aws_secret_access_key),
+                    ("aws_region", self.aws_region),
+                    ("aws_model_id", self.aws_model_id),
+                )
+                if not _provided(value)
+            ]
+            if missing:
+                raise ValueError("bedrock connectors require " + ", ".join(missing))
+        elif self.connector_type == "azure_openai":
+            missing = [
+                name
+                for name, value in (
+                    ("api_key", self.api_key),
+                    ("azure_resource_name", self.azure_resource_name),
+                    ("azure_deployment_name", self.azure_deployment_name),
+                    ("azure_api_version", self.azure_api_version),
+                )
+                if not _provided(value)
+            ]
+            if missing:
+                raise ValueError("azure_openai connectors require: " + ", ".join(missing))
+        return self
+
+
+class ConnectorPatch(BaseModel):
+    """Metadata-only patch (no credential rotation here)."""
+
+    display_name: str | None = Field(default=None, min_length=1, max_length=80)
+    model_hint: str | None = Field(default=None, max_length=80)
+
+
+class ConnectorCredentialsRotate(BaseModel):
+    """Rotation payload — at least one credential field must be supplied.
+
+    Field semantics mirror :class:`ConnectorCreate`. The actual field required
+    depends on the connector being rotated (validated in ``rotate_credentials``).
+    """
+
+    api_key: str | None = Field(default=None, max_length=512)
+    base_url: str | None = Field(default=None, max_length=512)
+    bearer: str | None = Field(default=None, max_length=512)
+
+    # Set when rotating bedrock credentials.
+    aws_access_key_id: str | None = Field(default=None, max_length=128)
+    aws_secret_access_key: str | None = Field(default=None, max_length=512)
+    aws_region: str | None = Field(default=None, max_length=64)
+    aws_model_id: str | None = Field(default=None, max_length=128)
+
+    # azure_openai rotation — admins can swap resource/deployment/version
+    # without recreating the connector (all live in the encrypted blob).
+    azure_resource_name: str | None = Field(default=None, max_length=120)
+    azure_deployment_name: str | None = Field(default=None, max_length=120)
+    azure_api_version: str | None = Field(default=None, max_length=40)
+
+    @model_validator(mode="after")
+    def _require_at_least_one(self) -> ConnectorCredentialsRotate:
+        if not any(
+            _provided(v)
+            for v in (
+                self.api_key,
+                self.base_url,
+                self.bearer,
+                self.aws_access_key_id,
+                self.aws_secret_access_key,
+                self.aws_region,
+                self.aws_model_id,
+                self.azure_resource_name,
+                self.azure_deployment_name,
+                self.azure_api_version,
+            )
+        ):
+            raise ValueError("At least one credential field must be provided")
+        return self
+
+
+class ConnectorTestResult(BaseModel):
+    ok: bool
+    error_code: str | None = None
+    message: str | None = None
+
+
+class AdminPolicyOut(BaseModel):
+    llm_apikey_connectors_enabled: bool
+    llm_compatible_connector_enabled: bool
+    llm_default_connector_id: int | None
+    llm_call_log_retention_days: int
+
+
+class DjPolicyOut(BaseModel):
+    """DJ-readable connector policy — the non-sensitive subset of the admin
+    policy surface.
+
+    Lets the settings/ai page fail *closed*: a normal DJ can learn which
+    connector types the admin has enabled (so disallowed providers are hidden
+    in the picker) without exposing admin-only fields such as
+    ``llm_default_connector_id``.
+
+    ``allowed_connector_types`` is the pre-computed set of connector types a DJ
+    may create given the two toggles, so the frontend doesn't have to hard-code
+    the api-key-vs-compatible mapping.
+    """
+
+    llm_apikey_connectors_enabled: bool
+    llm_compatible_connector_enabled: bool
+    allowed_connector_types: list[ConnectorType]
+
+
+class AdminPolicyPatch(BaseModel):
+    llm_apikey_connectors_enabled: bool | None = None
+    llm_compatible_connector_enabled: bool | None = None
+    # Use a sentinel sentinel: clients can send null to clear, or omit to leave unchanged
+    llm_default_connector_id: int | None = None
+    clear_default: bool = False
+    # Sanity bounds: minimum 7 days (data minimization floor), maximum 365 days
+    # (reporting ceiling). Out-of-range values are rejected at the API level.
+    llm_call_log_retention_days: int | None = Field(None, ge=7, le=365)
+
+    @model_validator(mode="after")
+    def _check_default_consistency(self) -> AdminPolicyPatch:
+        if self.clear_default and self.llm_default_connector_id is not None:
+            raise ValueError(
+                "clear_default cannot be combined with a non-null llm_default_connector_id"
+            )
+        return self
+
+
+class AdminConnectorCapPatch(BaseModel):
+    """Admin set/clear a connector's monthly token cap (issue #339).
+
+    ``monthly_token_cap`` is **required** so intent is always explicit: an
+    integer sets the cap, ``null`` clears it (unlimited). Omitting the field
+    (an empty ``{}`` body) is rejected with 422 rather than silently treated as
+    ``null`` — that would let an accidental no-field PATCH wipe a configured
+    cap. A non-null value must be a non-negative integer; ``0`` means "no
+    further calls this month". The upper bound is a sanity ceiling, not a
+    billing limit.
+    """
+
+    monthly_token_cap: int | None = Field(..., ge=0, le=1_000_000_000)
+
+
+class UsageRow(BaseModel):
+    connector_id: int
+    dj_username: str
+    display_name: str
+    connector_type: ConnectorType
+    total_calls: int
+    total_tokens_in: int
+    total_tokens_out: int
+    error_count: int
+    error_rate: float
+
+
+class AdminUsageOut(BaseModel):
+    days: int
+    rows: list[UsageRow]
+
+
+class AuditEventRow(BaseModel):
+    """A single audit-trail row with joined display labels.
+
+    Never includes credential material — only the target connector's
+    human-readable display name (joined from ``llm_connectors``).
+    """
+
+    id: int
+    created_at: datetime
+    event_type: str
+    actor_user_id: int
+    actor_username: str
+    target_connector_id: int | None = None
+    target_connector_display_name: str | None = None
+    notes: str | None = None
+
+
+class AdminAuditOut(BaseModel):
+    """Paginated audit-event browse response."""
+
+    rows: list[AuditEventRow]
+    total: int
+    limit: int
+    offset: int
+
+
+class FeaturePreferenceOut(BaseModel):
+    """A single per-feature connector pin (issue #337)."""
+
+    model_config = ConfigDict(from_attributes=True)
+
+    feature: FeatureKey
+    connector_id: int
+
+
+class FeaturePreferencesListOut(BaseModel):
+    """All of a DJ's per-feature pins + the catalogue of pinnable features."""
+
+    preferences: list[FeaturePreferenceOut]
+    known_features: list[FeatureKey]
+
+
+class FeaturePreferenceSet(BaseModel):
+    """Set/change a per-feature pin. Upsert — replaces any existing pin."""
+
+    feature: FeatureKey
+    connector_id: int = Field(..., ge=1)
diff --git a/server/app/services/email_sender.py b/server/app/services/email_sender.py
index 619cf2ca..2fd33c08 100644
--- a/server/app/services/email_sender.py
+++ b/server/app/services/email_sender.py
@@ -78,3 +78,59 @@ def send_email_confirmation(to_address: str, confirmation_url: str) -> None:
         raise EmailSendError(str(exc)) from exc
 
     _logger.info("email.confirmation_sent to_hash=%s", to_address[:3] + "***")
+
+
+def send_connector_auth_invalid_notification(
+    to_address: str, display_name: str, connector_type: str
+) -> None:
+    """Notify a DJ that their LLM connector failed a background health check.
+
+    Triggered by the periodic connector health monitor (issue #340) when a
+    previously-active connector transitions to ``auth_invalid``. Never
+    includes credential material — only the display name and provider type
+    so the DJ can identify which key to rotate.
+    """
+    settings = get_settings()
+
+    if not settings.resend_api_key or not settings.email_from_address:
+        raise EmailNotConfiguredError("Resend API key or from address is not configured")
+
+    # Strip control characters defensively — display_name is user-supplied
+    # (DJ-set) and already validated at creation, but the connector_type comes
+    # from the registry. Belt-and-braces for an email body.
+    safe_display = "".join(c for c in (display_name or "") if c.isprintable())
+    safe_type = "".join(c for c in (connector_type or "") if c.isprintable())
+
+    resend.api_key = settings.resend_api_key
+
+    try:
+        resend.Emails.send(
+            {
+                "from": settings.email_from_address,
+                "to": [to_address],
+                "subject": "Your WrzDJ AI connector needs attention",
+                "text": (
+                    f'Your AI connector "{safe_display}" ({safe_type}) failed a '
+                    f"health check and was marked invalid.\n\n"
+                    f"This usually means the API key was revoked, expired, or the "
+                    f"upstream account is no longer in good standing.\n\n"
+                    f"To restore AI features, sign in to WrzDJ and rotate the "
+                    f"credentials on your AI Settings page.\n\n"
+                    f"If this looks wrong, you can re-test the connector from the "
+                    f"same page — a successful test restores its status automatically.\n"
+                ),
+            }
+        )
+    except Exception as exc:
+        _logger.error(
+            "email.connector_auth_invalid_send_failed to_hash=%s error=%s",
+            to_address[:3] + "***",
+            exc,
+        )
+        raise EmailSendError(str(exc)) from exc
+
+    _logger.info(
+        "email.connector_auth_invalid_sent to_hash=%s connector_type=%s",
+        to_address[:3] + "***",
+        safe_type,
+    )
diff --git a/server/app/services/export.py b/server/app/services/export.py
index 401607de..53694011 100644
--- a/server/app/services/export.py
+++ b/server/app/services/export.py
@@ -5,24 +5,12 @@
 import re
 from datetime import UTC, datetime
 
+from app.core.csv_safe import sanitize_csv_value
 from app.models.event import Event
 from app.models.play_history import PlayHistory
 from app.models.request import Request
 
-
-def sanitize_csv_value(value: str | None) -> str:
-    """
-    Sanitize a value to prevent CSV formula injection.
-
-    Spreadsheet applications (Excel, Google Sheets) interpret cells starting with
-    =, +, -, @, \t, or \r as formulas, which can be exploited for attacks.
-    Prefixing with a single quote prevents formula execution.
-    """
-    if not value:
-        return ""
-    if value[0] in ("=", "+", "-", "@", "\t", "\r"):
-        return "'" + value
-    return value
+__all__ = ["sanitize_csv_value", "sanitize_filename"]
 
 
 def sanitize_filename(name: str) -> str:
diff --git a/server/app/services/llm/__init__.py b/server/app/services/llm/__init__.py
index c22c9870..19fe59b4 100644
--- a/server/app/services/llm/__init__.py
+++ b/server/app/services/llm/__init__.py
@@ -1,6 +1,49 @@
-"""Provider-agnostic LLM gateway package.
+"""LLM gateway — provider-agnostic dispatch for agentic features.
 
-WrzDJSet (and any future agentic feature) MUST call LLMs only through
-`app.services.llm.gateway`. Direct provider SDK imports are forbidden in
-feature code — provider/model identifiers are data, not imports.
+See docs/superpowers/specs/2026-05-24-admin-ai-oauth-design.md.
+
+Entrypoint: ``Gateway.dispatch(db, actor, request, *, purpose)`` →
+``ChatResponse``. Adapters live under :mod:`app.services.llm.adapters`.
 """
+
+from app.services.llm.base import (
+    ChatRequest,
+    ChatResponse,
+    ContentBlock,
+    LlmAdapter,
+    Message,
+    TokenUsage,
+    ToolCall,
+    ToolSpec,
+)
+from app.services.llm.exceptions import (
+    AuthInvalid,
+    LlmError,
+    NoLlmConfigured,
+    ProviderUnavailable,
+    QuotaCapReached,
+    QuotaExceeded,
+    RateLimited,
+    ToolTranslationError,
+)
+from app.services.llm.gateway import Gateway
+
+__all__ = [
+    "AuthInvalid",
+    "ChatRequest",
+    "ChatResponse",
+    "ContentBlock",
+    "Gateway",
+    "LlmAdapter",
+    "LlmError",
+    "Message",
+    "NoLlmConfigured",
+    "ProviderUnavailable",
+    "QuotaCapReached",
+    "QuotaExceeded",
+    "RateLimited",
+    "TokenUsage",
+    "ToolCall",
+    "ToolSpec",
+    "ToolTranslationError",
+]
diff --git a/server/app/services/llm/adapters/__init__.py b/server/app/services/llm/adapters/__init__.py
new file mode 100644
index 00000000..136ae6bd
--- /dev/null
+++ b/server/app/services/llm/adapters/__init__.py
@@ -0,0 +1 @@
+"""Per-provider adapter classes — auto-registered with the gateway registry."""
diff --git a/server/app/services/llm/adapters/_httpx_openai.py b/server/app/services/llm/adapters/_httpx_openai.py
new file mode 100644
index 00000000..0d4f2db9
--- /dev/null
+++ b/server/app/services/llm/adapters/_httpx_openai.py
@@ -0,0 +1,278 @@
+"""Shared httpx-backed OpenAI Chat Completions caller.
+
+Both ``openai_apikey`` (Platform) and ``openai_compatible`` (Hermes/Ollama/etc.)
+use the same OpenAI Chat Completions wire format. They differ only in:
+
+- base URL (``https://api.openai.com/v1`` vs the user-supplied URL)
+- header (always ``Authorization: Bearer <token>``; bearer is optional for compatible)
+
+This helper handles the actual HTTP call + error mapping. Adapters wrap it with
+type-specific credential extraction and registration.
+"""
+
+from __future__ import annotations
+
+import json
+import logging
+from collections.abc import AsyncIterator
+from typing import Any
+
+import httpx
+
+from app.services.llm.adapters._shared import raise_for_status
+from app.services.llm.base import ChatRequest, ChatResponse, ChatResponseChunk, Message
+from app.services.llm.exceptions import (
+    AuthInvalid,
+    ProviderUnavailable,
+    QuotaExceeded,
+    RateLimited,
+    ToolTranslationError,
+)
+from app.services.llm.streaming import parse_openai_stream_event
+from app.services.llm.tool_translation import (
+    content_to_text,
+    parse_openai_response,
+    to_openai_tools,
+)
+
+logger = logging.getLogger(__name__)
+
+DEFAULT_TIMEOUT_SECONDS = 30.0
+MAX_TIMEOUT_SECONDS = 120.0
+
+
+def _messages_to_openai(req: ChatRequest) -> list[dict]:
+    """Translate canonical messages to OpenAI chat-completions format."""
+    out: list[dict] = []
+    if req.system:
+        out.append({"role": "system", "content": req.system})
+
+    for m in req.messages:
+        # OpenAI uses identical role names for system/user/assistant/tool.
+        msg: dict[str, Any] = {"role": m.role, "content": content_to_text(m.content)}
+        if m.role == "tool":
+            if not m.tool_call_id:
+                raise ToolTranslationError("Tool result message missing tool_call_id")
+            msg["tool_call_id"] = m.tool_call_id
+        out.append(msg)
+    return out
+
+
+def _build_payload(req: ChatRequest, model: str | None, *, max_tokens_field: str) -> dict:
+    tools, choice = to_openai_tools(req.tools, req.force_tool)
+
+    body: dict[str, Any] = {
+        "model": model,
+        "messages": _messages_to_openai(req),
+    }
+    if req.max_tokens is not None:
+        body[max_tokens_field] = req.max_tokens
+    if req.temperature is not None:
+        body["temperature"] = req.temperature
+    if tools:
+        body["tools"] = tools
+    if choice is not None:
+        body["tool_choice"] = choice
+
+    return body
+
+
+async def call_openai_chat(
+    *,
+    base_url: str,
+    api_key: str | None,
+    request: ChatRequest,
+    fallback_model: str | None,
+    extra_headers: dict | None = None,
+    max_tokens_field: str = "max_tokens",
+) -> ChatResponse:
+    """Issue a Chat Completions request and parse the response.
+
+    ``base_url`` must end either at the API root (``/v1``) or at the actual host
+    root — this helper appends ``/chat/completions`` and is tolerant of either
+    form. Adapters are responsible for ensuring URLs are validated upstream.
+    """
+    model = request.model or fallback_model
+    if not model:
+        raise ToolTranslationError(
+            "model is required (set ChatRequest.model or LlmConnector.model_hint)"
+        )
+
+    endpoint = _build_chat_endpoint(base_url)
+
+    headers: dict[str, str] = {
+        "Content-Type": "application/json",
+        "Accept": "application/json",
+    }
+    if api_key:
+        headers["Authorization"] = f"Bearer {api_key}"  # nosec B106
+    if extra_headers:
+        headers.update(extra_headers)
+
+    timeout = request.timeout_seconds or DEFAULT_TIMEOUT_SECONDS
+    timeout = min(max(timeout, 1.0), MAX_TIMEOUT_SECONDS)
+
+    payload = _build_payload(request, model, max_tokens_field=max_tokens_field)
+
+    try:
+        async with httpx.AsyncClient(timeout=timeout) as client:
+            resp = await client.post(endpoint, json=payload, headers=headers)
+    except httpx.TimeoutException as exc:
+        raise ProviderUnavailable("Upstream timeout") from exc
+    except httpx.HTTPError as exc:
+        raise ProviderUnavailable("Upstream network error") from exc
+
+    raise_for_status(resp)
+
+    try:
+        body = resp.json()
+    except json.JSONDecodeError as exc:
+        raise ToolTranslationError("Upstream returned non-JSON body") from exc
+    except ValueError as exc:
+        raise ToolTranslationError("Upstream returned non-JSON body") from exc
+
+    return parse_openai_response(body)
+
+
+def _map_stream_status(status_code: int) -> None:
+    """Raise the canonical typed error for a non-2xx streaming status.
+
+    Mirrors ``_shared.raise_for_status`` but operates on a bare status code
+    (the streaming path reads the status before consuming the body).
+    """
+    if status_code in (401, 403):
+        raise AuthInvalid(f"Auth failed (HTTP {status_code})")
+    if status_code == 402:
+        raise QuotaExceeded("Quota or billing failure (HTTP 402)")
+    if status_code == 429:
+        raise RateLimited("Rate limited (HTTP 429)")
+    if 500 <= status_code < 600:
+        raise ProviderUnavailable(f"Upstream error (HTTP {status_code})")
+    raise ToolTranslationError(f"Upstream rejected request (HTTP {status_code})")
+
+
+def _decode_openai_sse_event_data(data: str) -> ChatResponseChunk | None:
+    """Decode one assembled SSE event body into a chunk.
+
+    ``data`` is the event's ``data:`` payload lines already joined on newlines
+    and stripped. Returns ``None`` for an empty body; raises
+    ``ToolTranslationError`` on malformed JSON. The ``[DONE]`` sentinel and event
+    framing are handled by the caller.
+    """
+    if not data:
+        return None
+    try:
+        obj = json.loads(data)
+    except json.JSONDecodeError as exc:
+        raise ToolTranslationError("Upstream returned malformed SSE JSON") from exc
+    return parse_openai_stream_event(obj)
+
+
+async def stream_openai_chat(
+    *,
+    base_url: str,
+    api_key: str | None,
+    request: ChatRequest,
+    fallback_model: str | None,
+    extra_headers: dict | None = None,
+    max_tokens_field: str = "max_tokens",
+) -> AsyncIterator[ChatResponseChunk]:
+    """Issue a streaming Chat Completions request, yielding canonical chunks.
+
+    Cancellation: if the consumer stops iterating (e.g. an SSE client
+    disconnect closes the async generator), the ``async with client.stream(...)``
+    context exits and httpx closes the upstream connection, cancelling the
+    provider request. Non-2xx statuses are mapped to canonical typed exceptions
+    before the first chunk; mid-stream network drops surface as
+    ``ProviderUnavailable``.
+    """
+    model = request.model or fallback_model
+    if not model:
+        raise ToolTranslationError(
+            "model is required (set ChatRequest.model or LlmConnector.model_hint)"
+        )
+
+    endpoint = _build_chat_endpoint(base_url)
+
+    headers: dict[str, str] = {
+        "Content-Type": "application/json",
+        "Accept": "text/event-stream",
+    }
+    if api_key:
+        headers["Authorization"] = f"Bearer {api_key}"  # nosec B106
+    if extra_headers:
+        headers.update(extra_headers)
+
+    timeout = request.timeout_seconds or DEFAULT_TIMEOUT_SECONDS
+    timeout = min(max(timeout, 1.0), MAX_TIMEOUT_SECONDS)
+
+    payload = _build_payload(request, model, max_tokens_field=max_tokens_field)
+    payload["stream"] = True
+    # Ask OpenAI to include token usage in the terminal stream event. Harmless to
+    # OpenAI-compatible servers that ignore unknown fields.
+    payload["stream_options"] = {"include_usage": True}
+
+    try:
+        async with httpx.AsyncClient(timeout=timeout) as client:
+            async with client.stream("POST", endpoint, json=payload, headers=headers) as resp:
+                if resp.status_code >= 300:
+                    # Drain the (small) error body so the connection releases,
+                    # then map to a typed error. The body is never surfaced.
+                    await resp.aread()
+                    _map_stream_status(resp.status_code)
+                # SSE events are delimited by a blank line, and a single event
+                # may span multiple ``data:`` lines (joined on newlines). Buffer
+                # per event and decode the whole body, so a multi-line JSON object
+                # isn't decoded as broken fragments. Comment frames (":") and
+                # other fields (event:/id:/retry:) are ignored.
+                event_lines: list[str] = []
+                async for line in resp.aiter_lines():
+                    if line.startswith(":"):
+                        continue
+                    if line.startswith("data:"):
+                        event_lines.append(line[len("data:") :].lstrip())
+                        continue
+                    if line:
+                        continue
+                    data = "\n".join(event_lines).strip()
+                    event_lines.clear()
+                    if data == "[DONE]":
+                        break
+                    chunk = _decode_openai_sse_event_data(data)
+                    if chunk is not None:
+                        yield chunk
+                # A non-compliant server may close without a trailing blank line
+                # after the final event; flush whatever remains buffered.
+                data = "\n".join(event_lines).strip()
+                if data and data != "[DONE]":
+                    chunk = _decode_openai_sse_event_data(data)
+                    if chunk is not None:
+                        yield chunk
+    except httpx.TimeoutException as exc:
+        raise ProviderUnavailable("Upstream timeout") from exc
+    except httpx.HTTPError as exc:
+        raise ProviderUnavailable("Upstream network error") from exc
+
+
+def _build_chat_endpoint(base_url: str) -> str:
+    base = base_url.rstrip("/")
+    if base.endswith("/chat/completions"):
+        return base
+    return f"{base}/chat/completions"
+
+
+def build_healthcheck_request() -> ChatRequest:
+    """Return a minimal request used to verify the connector is alive.
+
+    Deliberately omits ``max_tokens``: reasoning models (OpenAI GPT-5 / o-series)
+    spend their completion budget on internal reasoning tokens before producing
+    any visible output, so a 1-token cap is fully consumed by reasoning and the
+    request fails with HTTP 400 ("max_tokens or model output limit was reached").
+    Letting the provider apply its default budget keeps the probe cheap (the
+    prompt is trivial) while working for reasoning and non-reasoning models alike.
+    Adapters override the ``model`` via the connector's ``model_hint``.
+    """
+    return ChatRequest(
+        messages=[Message(role="user", content="ping")],
+        temperature=0.0,
+    )
diff --git a/server/app/services/llm/adapters/_shared.py b/server/app/services/llm/adapters/_shared.py
new file mode 100644
index 00000000..36379ac7
--- /dev/null
+++ b/server/app/services/llm/adapters/_shared.py
@@ -0,0 +1,103 @@
+"""Shared primitives for the httpx-backed LLM adapters.
+
+Centralises three pieces that were copy-pasted across the OpenAI-wire, Gemini
+and Bedrock adapters:
+
+- ``parse_retry_after`` — HTTP ``Retry-After`` header → ``int`` seconds.
+- ``raise_for_status`` — httpx status code → canonical typed exception.
+- ``extract_api_key`` / ``extract_fixed_base_credentials`` — parse the encrypted
+  ``{"api_key": "..."}`` credential blob.
+
+The Anthropic adapter talks to the official SDK (``APIStatusError``), not httpx,
+so it keeps its own status mapping; the two api-key extractors intentionally
+differ in how they treat a non-dict blob (see ``extract_fixed_base_credentials``)
+to preserve each adapter's established error message.
+"""
+
+from __future__ import annotations
+
+import json
+from collections.abc import Callable
+
+import httpx
+
+from app.services.llm.exceptions import (
+    AuthInvalid,
+    ProviderUnavailable,
+    QuotaExceeded,
+    RateLimited,
+    ToolTranslationError,
+)
+
+
+def parse_retry_after(value: str | None) -> int | None:
+    if not value:
+        return None
+    try:
+        return int(float(value))
+    except ValueError:
+        return None
+
+
+def raise_for_status(
+    resp: httpx.Response,
+    *,
+    throttle_detector: Callable[[httpx.Response], bool] | None = None,
+) -> None:
+    """Map a non-2xx httpx response to a canonical adapter exception.
+
+    ``throttle_detector`` lets Bedrock treat an HTTP 400 carrying a
+    ``ThrottlingException`` error-type header as rate-limiting; the default
+    ``None`` preserves the plain OpenAI/Gemini mapping.
+    """
+    if 200 <= resp.status_code < 300:
+        return
+
+    code = resp.status_code
+    if code in (401, 403):
+        raise AuthInvalid(f"Auth failed (HTTP {code})")
+    if code == 402:
+        raise QuotaExceeded("Quota or billing failure (HTTP 402)")
+    if code == 429 or (code == 400 and throttle_detector is not None and throttle_detector(resp)):
+        retry_after = parse_retry_after(resp.headers.get("Retry-After"))
+        raise RateLimited("Rate limited (HTTP 429)", retry_after_seconds=retry_after)
+    if 500 <= code < 600:
+        raise ProviderUnavailable(f"Upstream error (HTTP {code})")
+    # 4xx other than the above → treat as a malformed input / translation error
+    # since the gateway only emits known shapes.
+    raise ToolTranslationError(f"Upstream rejected request (HTTP {code})")
+
+
+def extract_api_key(raw: str) -> str:
+    """Parse an ``{"api_key": "..."}`` credential blob → bare api key.
+
+    Used by the OpenAI / Gemini / Anthropic api-key adapters. A non-dict blob
+    falls through to the missing-key path (matching their established behaviour).
+    """
+    try:
+        blob = json.loads(raw)
+    except (json.JSONDecodeError, TypeError) as exc:
+        raise AuthInvalid("Connector credentials are malformed") from exc
+    api_key = blob.get("api_key") if isinstance(blob, dict) else None
+    if not api_key:
+        raise AuthInvalid("Connector is missing an api_key")
+    return str(api_key)
+
+
+def extract_fixed_base_credentials(raw: str, base_url: str) -> tuple[str, str]:
+    """Parse an ``{"api_key": "..."}`` blob for fixed-base-URL adapters.
+
+    Used by xAI and OpenRouter, whose base URL is pinned (never user-supplied).
+    Stricter than :func:`extract_api_key`: a non-dict blob raises
+    ``"Connector credentials shape is invalid"`` rather than falling through.
+    """
+    try:
+        blob = json.loads(raw)
+    except (json.JSONDecodeError, TypeError) as exc:
+        raise AuthInvalid("Connector credentials are malformed") from exc
+    if not isinstance(blob, dict):
+        raise AuthInvalid("Connector credentials shape is invalid")
+    api_key = blob.get("api_key")
+    if not api_key:
+        raise AuthInvalid("Connector is missing an api_key")
+    return base_url, str(api_key)
diff --git a/server/app/services/llm/adapters/anthropic_apikey.py b/server/app/services/llm/adapters/anthropic_apikey.py
new file mode 100644
index 00000000..1f38e58e
--- /dev/null
+++ b/server/app/services/llm/adapters/anthropic_apikey.py
@@ -0,0 +1,255 @@
+"""Anthropic API-key adapter — uses the official ``anthropic`` SDK."""
+
+from __future__ import annotations
+
+import logging
+from collections.abc import AsyncIterator
+from typing import Any
+
+from anthropic import (
+    APIConnectionError,
+    APIError,
+    APIStatusError,
+    APITimeoutError,
+    AsyncAnthropic,
+)
+
+from app.services.llm.adapters._shared import extract_api_key
+from app.services.llm.base import (
+    ChatRequest,
+    ChatResponse,
+    ChatResponseChunk,
+    LlmAdapter,
+    Message,
+    TokenUsage,
+    ToolCallDelta,
+)
+from app.services.llm.exceptions import (
+    AuthInvalid,
+    ProviderUnavailable,
+    QuotaExceeded,
+    RateLimited,
+    ToolTranslationError,
+)
+from app.services.llm.registry import register_adapter
+from app.services.llm.tool_translation import (
+    normalise_anthropic_stop_reason,
+    parse_anthropic_response,
+    to_anthropic_messages,
+    to_anthropic_tools,
+)
+
+logger = logging.getLogger(__name__)
+
+DEFAULT_MODEL = "claude-opus-4-7"
+DEFAULT_MAX_TOKENS = 1024
+DEFAULT_TIMEOUT_SECONDS = 30.0
+MAX_TIMEOUT_SECONDS = 120.0
+
+
+class AnthropicApiKeyAdapter(LlmAdapter):
+    connector_type = "anthropic_apikey"
+
+    def _extract_api_key(self) -> str:
+        return extract_api_key(self.connector.credentials or "")
+
+    def _client(self, *, timeout: float) -> AsyncAnthropic:
+        return AsyncAnthropic(api_key=self._extract_api_key(), timeout=timeout)
+
+    def _resolve_timeout(self, request: ChatRequest) -> float:
+        return min(
+            max(request.timeout_seconds or DEFAULT_TIMEOUT_SECONDS, 1.0),
+            MAX_TIMEOUT_SECONDS,
+        )
+
+    def _build_kwargs(self, request: ChatRequest) -> dict[str, Any]:
+        """Build the ``messages.create`` / ``messages.stream`` kwargs.
+
+        Shared by ``chat`` and ``stream`` so request translation never drifts
+        between the buffered and streamed paths.
+        """
+        model = request.model or self.connector.model_hint or DEFAULT_MODEL
+        max_tokens = request.max_tokens or DEFAULT_MAX_TOKENS
+
+        tools, choice = to_anthropic_tools(request.tools, request.force_tool)
+        kwargs: dict[str, Any] = {
+            "model": model,
+            "max_tokens": max_tokens,
+            "messages": to_anthropic_messages(request.messages),
+        }
+        if request.system:
+            kwargs["system"] = request.system
+        if request.temperature is not None:
+            kwargs["temperature"] = request.temperature
+        if tools:
+            kwargs["tools"] = tools
+        if choice is not None:
+            kwargs["tool_choice"] = choice
+        return kwargs
+
+    async def chat(self, request: ChatRequest) -> ChatResponse:
+        timeout = self._resolve_timeout(request)
+        kwargs = self._build_kwargs(request)
+
+        async with self._client(timeout=timeout) as client:
+            try:
+                message = await client.messages.create(**kwargs)
+            except APITimeoutError as exc:
+                raise ProviderUnavailable("Upstream timeout") from exc
+            except APIConnectionError as exc:
+                raise ProviderUnavailable("Upstream network error") from exc
+            except APIStatusError as exc:
+                self._raise_for_status(exc)
+            except APIError as exc:
+                raise ProviderUnavailable(f"Anthropic API error: {type(exc).__name__}") from exc
+
+        return parse_anthropic_response(message)
+
+    async def stream(self, request: ChatRequest) -> AsyncIterator[ChatResponseChunk]:
+        timeout = self._resolve_timeout(request)
+        kwargs = self._build_kwargs(request)
+
+        # Track whether any tool_use block appeared, plus the terminal
+        # stop_reason / output token count gathered from the message_delta event.
+        saw_tool_use = False
+        stop_reason: str | None = None
+        output_tokens: int | None = None
+
+        try:
+            async with self._client(timeout=timeout) as client:
+                async with client.messages.stream(**kwargs) as stream:
+                    async for event in stream:
+                        chunk, tool_seen, sr, ot = _translate_anthropic_event(event)
+                        saw_tool_use = saw_tool_use or tool_seen
+                        if sr is not None:
+                            stop_reason = sr
+                        if ot is not None:
+                            output_tokens = ot
+                        if chunk is not None:
+                            yield chunk
+        except APITimeoutError as exc:
+            raise ProviderUnavailable("Upstream timeout") from exc
+        except APIConnectionError as exc:
+            raise ProviderUnavailable("Upstream network error") from exc
+        except APIStatusError as exc:
+            self._raise_for_status(exc)
+        except APIError as exc:
+            raise ProviderUnavailable(f"Anthropic API error: {type(exc).__name__}") from exc
+
+        # Same canonicalisation as the buffered path (parse_anthropic_response),
+        # so stream and chat never diverge on pause_turn / refusal / unknowns.
+        canonical_stop = normalise_anthropic_stop_reason(stop_reason)
+        if saw_tool_use and canonical_stop != "tool_use":
+            canonical_stop = "tool_use"
+        # Anthropic streams output_tokens in message_delta but input_tokens only
+        # in message_start; for the counts-only call log the completion count is
+        # what matters, so prompt is recorded as 0 when unavailable.
+        final_usage = (
+            TokenUsage(prompt=0, completion=output_tokens) if output_tokens is not None else None
+        )
+        yield ChatResponseChunk(stop_reason=canonical_stop, usage=final_usage, done=True)
+
+    async def health_check(self) -> None:
+        # 1-token ping to validate the key + reach the API.
+        ping = ChatRequest(
+            messages=[Message(role="user", content="ping")],
+            max_tokens=1,
+            temperature=0.0,
+        )
+        await self.chat(ping)
+
+    @staticmethod
+    def _raise_for_status(exc: APIStatusError) -> None:
+        status = getattr(exc, "status_code", None)
+        if status in (401, 403):
+            raise AuthInvalid(f"Auth failed (HTTP {status})") from exc
+        if status == 402:
+            raise QuotaExceeded("Quota or billing failure (HTTP 402)") from exc
+        if status == 429:
+            retry_after = None
+            try:
+                resp_headers = getattr(exc.response, "headers", {}) or {}
+                retry_after_raw = resp_headers.get("retry-after") or resp_headers.get("Retry-After")
+                if retry_after_raw:
+                    retry_after = int(float(retry_after_raw))
+            except (TypeError, ValueError, AttributeError):
+                retry_after = None
+            raise RateLimited("Rate limited (HTTP 429)", retry_after_seconds=retry_after) from exc
+        if status is not None and 500 <= status < 600:
+            raise ProviderUnavailable(f"Upstream error (HTTP {status})") from exc
+        raise ToolTranslationError(f"Upstream rejected request (HTTP {status})") from exc
+
+
+def _field(obj: Any, name: str) -> Any:
+    """Read ``name`` from an SDK object (attribute) or a plain dict (key).
+
+    The Anthropic SDK yields typed event objects in production, but tests feed
+    plain dicts. Plain ``getattr`` returns ``None`` for dict keys, which would
+    silently drop every delta on a dict-backed event — so fall back to ``.get``.
+    """
+    if isinstance(obj, dict):
+        return obj.get(name)
+    return getattr(obj, name, None)
+
+
+def _translate_anthropic_event(
+    event: Any,
+) -> tuple[ChatResponseChunk | None, bool, str | None, int | None]:
+    """Translate one Anthropic SDK stream event into stream state.
+
+    Returns ``(chunk_or_None, saw_tool_use, stop_reason_or_None,
+    output_tokens_or_None)``. Mirrors the dual dict/object access style of
+    ``tool_translation.parse_anthropic_response`` so it tolerates either the
+    typed SDK events or plain dicts (used in tests).
+    """
+    etype = _field(event, "type")
+
+    if etype == "content_block_start":
+        block = _field(event, "content_block")
+        if _field(block, "type") == "tool_use":
+            idx = int(_field(event, "index") or 0)
+            chunk = ChatResponseChunk(
+                tool_call_deltas=[
+                    ToolCallDelta(
+                        index=idx,
+                        id=_field(block, "id"),
+                        name=_field(block, "name"),
+                    )
+                ]
+            )
+            return chunk, True, None, None
+        return None, False, None, None
+
+    if etype == "content_block_delta":
+        delta = _field(event, "delta")
+        dtype = _field(delta, "type")
+        if dtype == "text_delta":
+            return ChatResponseChunk(text_delta=_field(delta, "text") or ""), False, None, None
+        if dtype == "input_json_delta":
+            idx = int(_field(event, "index") or 0)
+            chunk = ChatResponseChunk(
+                tool_call_deltas=[
+                    ToolCallDelta(
+                        index=idx,
+                        input_json_fragment=_field(delta, "partial_json") or "",
+                    )
+                ]
+            )
+            return chunk, False, None, None
+        return None, False, None, None
+
+    if etype == "message_delta":
+        delta = _field(event, "delta")
+        stop_reason = _field(delta, "stop_reason")
+        usage = _field(event, "usage")
+        output_tokens = None
+        if usage is not None:
+            ot = _field(usage, "output_tokens")
+            if ot is not None:
+                output_tokens = int(ot)
+        return None, False, stop_reason, output_tokens
+
+    return None, False, None, None
+
+
+register_adapter("anthropic_apikey", AnthropicApiKeyAdapter)
diff --git a/server/app/services/llm/adapters/azure_openai.py b/server/app/services/llm/adapters/azure_openai.py
new file mode 100644
index 00000000..20a48de2
--- /dev/null
+++ b/server/app/services/llm/adapters/azure_openai.py
@@ -0,0 +1,165 @@
+"""Azure OpenAI adapter.
+
+Azure OpenAI exposes the same Chat Completions *body* as the OpenAI Platform
+API, but differs on two axes that prevent reusing the OpenAI-compatible code
+path directly:
+
+1. **URL** — per-deployment endpoint:
+   ``https://<resource>.openai.azure.com/openai/deployments/<deployment>/chat/completions?api-version=<ver>``
+2. **Auth header** — ``api-key: <key>`` (NOT ``Authorization: Bearer``).
+
+We therefore build the URL + headers ourselves and only share the request-body
+shaping (``_build_payload``) and response parsing (``parse_openai_response``)
+with the OpenAI helper, plus the HTTP status → typed-exception mapping.
+
+All configuration (resource name, deployment name, api version) **and** the
+api key live in the encrypted ``credentials`` blob — there are no dedicated
+columns. This lets admins rotate any of them via the existing
+``PUT /credentials`` route without recreating the connector.
+"""
+
+from __future__ import annotations
+
+import json
+import logging
+import re
+from typing import Any
+from urllib.parse import quote, urlencode
+
+import httpx
+
+from app.services.llm.adapters._httpx_openai import (
+    DEFAULT_TIMEOUT_SECONDS,
+    MAX_TIMEOUT_SECONDS,
+    _build_payload,
+    build_healthcheck_request,
+)
+from app.services.llm.adapters._shared import raise_for_status
+from app.services.llm.base import ChatRequest, ChatResponse, LlmAdapter
+from app.services.llm.exceptions import AuthInvalid, ProviderUnavailable, ToolTranslationError
+from app.services.llm.registry import register_adapter
+from app.services.llm.tool_translation import parse_openai_response
+
+logger = logging.getLogger(__name__)
+
+DEFAULT_MODEL = "gpt-4o-mini"
+
+# Azure naming rules: resource is a DNS host label (letters/digits/hyphen);
+# deployment + api-version are token-ish. These mirror the storage-layer
+# validators in connector_storage.py and provide defense-in-depth at the
+# URL-composition boundary against component injection (CLAUDE.md: validate at
+# system boundaries — never trust the credential blob implicitly).
+_RESOURCE_RE = re.compile(r"^[A-Za-z0-9-]+$")
+_DEPLOYMENT_RE = re.compile(r"^[A-Za-z0-9._-]+$")
+_API_VERSION_RE = re.compile(r"^[A-Za-z0-9._-]+$")
+
+
+def _build_azure_endpoint(resource_name: str, deployment_name: str, api_version: str) -> str:
+    """Compose the per-deployment Azure Chat Completions URL.
+
+    ``resource_name`` is the bare resource (e.g. ``my-co``), NOT a full host.
+
+    The three components are validated and the path/query parts URL-encoded so a
+    malformed credential blob cannot rewrite the authority/path/query and route
+    requests to an unintended endpoint.
+    """
+    resource_name = resource_name.strip()
+    deployment_name = deployment_name.strip()
+    api_version = api_version.strip()
+    if not _RESOURCE_RE.fullmatch(resource_name):
+        raise AuthInvalid("Invalid Azure resource name")
+    if not _DEPLOYMENT_RE.fullmatch(deployment_name):
+        raise AuthInvalid("Invalid Azure deployment name")
+    if not _API_VERSION_RE.fullmatch(api_version):
+        raise AuthInvalid("Invalid Azure API version")
+
+    deployment_segment = quote(deployment_name, safe="")
+    query = urlencode({"api-version": api_version})
+    return (
+        f"https://{resource_name}.openai.azure.com"
+        f"/openai/deployments/{deployment_segment}/chat/completions"
+        f"?{query}"
+    )
+
+
+class AzureOpenAIAdapter(LlmAdapter):
+    connector_type = "azure_openai"
+
+    def _extract_credentials(self) -> dict[str, str]:
+        """Return the validated config dict from the encrypted blob.
+
+        Keys: api_key, azure_resource_name, azure_deployment_name,
+        azure_api_version.
+        """
+        raw = self.connector.credentials or ""
+        try:
+            blob = json.loads(raw)
+        except (json.JSONDecodeError, TypeError) as exc:
+            raise AuthInvalid("Connector credentials are malformed") from exc
+        if not isinstance(blob, dict):
+            raise AuthInvalid("Connector credentials shape is invalid")
+
+        api_key = blob.get("api_key")
+        resource = blob.get("azure_resource_name")
+        deployment = blob.get("azure_deployment_name")
+        api_version = blob.get("azure_api_version")
+        if not (api_key and resource and deployment and api_version):
+            raise AuthInvalid("Connector is missing Azure OpenAI configuration")
+        return {
+            "api_key": str(api_key),
+            "azure_resource_name": str(resource),
+            "azure_deployment_name": str(deployment),
+            "azure_api_version": str(api_version),
+        }
+
+    async def _call(self, request: ChatRequest) -> ChatResponse:
+        creds = self._extract_credentials()
+        endpoint = _build_azure_endpoint(
+            creds["azure_resource_name"],
+            creds["azure_deployment_name"],
+            creds["azure_api_version"],
+        )
+
+        # Azure routes by deployment, so the body `model` is largely cosmetic,
+        # but the shared payload builder requires a non-None model. Default to
+        # the deployment name when no explicit model/hint is supplied.
+        model = request.model or self.connector.model_hint or creds["azure_deployment_name"]
+        # Azure serves the same OpenAI models, which reject the legacy `max_tokens`
+        # field on GPT-5 / o-series deployments — use `max_completion_tokens`.
+        payload = _build_payload(request, model, max_tokens_field="max_completion_tokens")
+
+        headers: dict[str, str] = {
+            "Content-Type": "application/json",
+            "Accept": "application/json",
+            "api-key": creds["api_key"],
+        }
+
+        timeout = request.timeout_seconds or DEFAULT_TIMEOUT_SECONDS
+        timeout = min(max(timeout, 1.0), MAX_TIMEOUT_SECONDS)
+
+        try:
+            async with httpx.AsyncClient(timeout=timeout) as client:
+                resp = await client.post(endpoint, json=payload, headers=headers)
+        except httpx.TimeoutException as exc:
+            raise ProviderUnavailable("Upstream timeout") from exc
+        except httpx.HTTPError as exc:
+            raise ProviderUnavailable("Upstream network error") from exc
+
+        raise_for_status(resp)
+
+        try:
+            body: Any = resp.json()
+        except (json.JSONDecodeError, ValueError) as exc:
+            raise ToolTranslationError("Upstream returned non-JSON body") from exc
+
+        return parse_openai_response(body)
+
+    async def chat(self, request: ChatRequest) -> ChatResponse:
+        return await self._call(request)
+
+    async def health_check(self) -> None:
+        # 1-token ping exercises the URL + api-key auth path.
+        await self._call(build_healthcheck_request())
+
+
+register_adapter("azure_openai", AzureOpenAIAdapter)
diff --git a/server/app/services/llm/adapters/bedrock.py b/server/app/services/llm/adapters/bedrock.py
new file mode 100644
index 00000000..0aa390b8
--- /dev/null
+++ b/server/app/services/llm/adapters/bedrock.py
@@ -0,0 +1,229 @@
+"""AWS Bedrock adapter — SigV4-signed ``InvokeModel`` over httpx (no boto3).
+
+Billing flows to the DJ's own AWS account. Auth is AWS Signature V4 (not a
+Bearer token), implemented manually in ``services/llm/sigv4.py`` so we add no
+new dependency.
+
+Per-family request/response handling, keyed off ``aws_model_id``:
+
+- ``anthropic.*`` (Claude on Bedrock) — uses the Anthropic Messages body
+  (``anthropic_version`` + ``messages`` + ``tools``), so it reuses the existing
+  Anthropic tool-schema translation and response parser.
+- ``meta.*`` / ``llama*`` (Llama on Bedrock) — uses the Llama prompt body.
+  Llama has no structured tool field, so tools are described in the system
+  prompt and tool calls are parsed out of the generated text.
+
+Other families are rejected with a ``ToolTranslationError`` (clear message)
+rather than guessing a body shape.
+"""
+
+from __future__ import annotations
+
+import json
+import logging
+from typing import Any
+
+import httpx
+
+from app.core.time import utcnow
+from app.services.llm.adapters._shared import raise_for_status
+from app.services.llm.base import ChatRequest, ChatResponse, LlmAdapter, Message
+from app.services.llm.exceptions import AuthInvalid, ProviderUnavailable, ToolTranslationError
+from app.services.llm.registry import register_adapter
+from app.services.llm.sigv4 import sign_request
+from app.services.llm.tool_translation import (
+    content_to_text,
+    parse_anthropic_response,
+    parse_llama_response,
+    render_llama_tool_instructions,
+    to_anthropic_messages,
+    to_anthropic_tools,
+)
+
+logger = logging.getLogger(__name__)
+
+ANTHROPIC_BEDROCK_VERSION = "bedrock-2023-05-31"
+DEFAULT_MAX_TOKENS = 1024
+DEFAULT_TIMEOUT_SECONDS = 30.0
+MAX_TIMEOUT_SECONDS = 120.0
+
+FAMILY_ANTHROPIC = "anthropic"
+FAMILY_LLAMA = "llama"
+
+
+def model_family(model_id: str) -> str:
+    """Map a Bedrock model id (or inference-profile id) to a request family."""
+    mid = (model_id or "").lower()
+    # Inference profiles prefix the region, e.g. "us.anthropic.claude-...".
+    if "anthropic." in mid:
+        return FAMILY_ANTHROPIC
+    if "meta." in mid or "llama" in mid:
+        return FAMILY_LLAMA
+    raise ToolTranslationError(f"Unsupported Bedrock model family for model_id={model_id!r}")
+
+
+class BedrockAdapter(LlmAdapter):
+    connector_type = "bedrock"
+
+    def _extract_credentials(self) -> dict[str, str]:
+        raw = self.connector.credentials or ""
+        try:
+            blob = json.loads(raw)
+        except (json.JSONDecodeError, TypeError) as exc:
+            raise AuthInvalid("Connector credentials are malformed") from exc
+        if not isinstance(blob, dict):
+            raise AuthInvalid("Connector credentials shape is invalid")
+        for field in ("aws_access_key_id", "aws_secret_access_key", "aws_region", "aws_model_id"):
+            if not blob.get(field):
+                raise AuthInvalid(f"Connector is missing {field}")
+        return {k: str(v) for k, v in blob.items()}
+
+    def _resolve_model_id(self, request: ChatRequest, creds: dict[str, str]) -> str:
+        # ChatRequest.model / model_hint override the stored aws_model_id.
+        return request.model or self.connector.model_hint or creds["aws_model_id"]
+
+    async def chat(self, request: ChatRequest) -> ChatResponse:
+        creds = self._extract_credentials()
+        model_id = self._resolve_model_id(request, creds)
+        family = model_family(model_id)
+
+        if family == FAMILY_ANTHROPIC:
+            body, tool_names = self._build_anthropic_body(request)
+        else:  # FAMILY_LLAMA
+            body, tool_names = self._build_llama_body(request)
+
+        payload = json.dumps(body).encode("utf-8")
+        timeout = min(
+            max(request.timeout_seconds or DEFAULT_TIMEOUT_SECONDS, 1.0),
+            MAX_TIMEOUT_SECONDS,
+        )
+
+        region = creds["aws_region"]
+        host = f"bedrock-runtime.{region}.amazonaws.com"
+        canonical_uri = f"/model/{model_id}/invoke"
+        url = f"https://{host}{canonical_uri}"
+
+        signed_headers = sign_request(
+            access_key_id=creds["aws_access_key_id"],
+            secret_access_key=creds["aws_secret_access_key"],
+            region=region,
+            host=host,
+            canonical_uri=canonical_uri,
+            body=payload,
+            now=utcnow(),
+            # Forward STS/temporary-credential session token when present so
+            # the SigV4 signature includes X-Amz-Security-Token.
+            session_token=creds.get("aws_session_token") or None,
+        )
+        headers = {
+            "Content-Type": "application/json",
+            "Accept": "application/json",
+            **signed_headers,
+        }
+
+        try:
+            async with httpx.AsyncClient(timeout=timeout) as client:
+                resp = await client.post(url, content=payload, headers=headers)
+        except httpx.TimeoutException as exc:
+            raise ProviderUnavailable("Upstream timeout") from exc
+        except httpx.HTTPError as exc:
+            raise ProviderUnavailable("Upstream network error") from exc
+
+        raise_for_status(resp, throttle_detector=_is_throttle)
+
+        try:
+            response_body = resp.json()
+        except (json.JSONDecodeError, ValueError) as exc:
+            raise ToolTranslationError("Upstream returned non-JSON body") from exc
+
+        if family == FAMILY_ANTHROPIC:
+            parsed = parse_anthropic_response(response_body)
+        else:
+            parsed = parse_llama_response(response_body, tool_names=tool_names)
+        # The Bedrock model id is the source of truth for telemetry — the
+        # InvokeModel body doesn't reliably echo the full id.
+        parsed.model = model_id
+        return parsed
+
+    async def health_check(self) -> None:
+        ping = ChatRequest(
+            messages=[Message(role="user", content="ping")],
+            max_tokens=1,
+            temperature=0.0,
+        )
+        await self.chat(ping)
+
+    # -- Per-family request bodies -----------------------------------------
+    def _build_anthropic_body(self, request: ChatRequest) -> tuple[dict, set[str] | None]:
+        tools, choice = to_anthropic_tools(request.tools, request.force_tool)
+        body: dict[str, Any] = {
+            "anthropic_version": ANTHROPIC_BEDROCK_VERSION,
+            "max_tokens": request.max_tokens or DEFAULT_MAX_TOKENS,
+            "messages": to_anthropic_messages(request.messages),
+        }
+        if request.system:
+            body["system"] = request.system
+        if request.temperature is not None:
+            body["temperature"] = request.temperature
+        if tools:
+            body["tools"] = tools
+        if choice is not None:
+            body["tool_choice"] = choice
+        return body, None
+
+    def _build_llama_body(self, request: ChatRequest) -> tuple[dict, set[str] | None]:
+        # When no tools are configured, pass an empty set (not None) so generated
+        # {"name","input"} JSON is never misclassified as a tool call.
+        tool_names = {t.name for t in request.tools} if request.tools else set()
+        tool_instructions = render_llama_tool_instructions(request.tools, request.force_tool)
+        prompt = _render_llama_prompt(request, tool_instructions)
+        body: dict[str, Any] = {"prompt": prompt}
+        if request.max_tokens is not None:
+            body["max_gen_len"] = request.max_tokens
+        if request.temperature is not None:
+            body["temperature"] = request.temperature
+        return body, tool_names
+
+
+def _render_llama_prompt(request: ChatRequest, tool_instructions: str | None) -> str:
+    """Render canonical messages into Llama 3's instruction-tuned chat format."""
+    parts: list[str] = ["<|begin_of_text|>"]
+
+    system_chunks: list[str] = []
+    if request.system:
+        system_chunks.append(request.system)
+    if tool_instructions:
+        system_chunks.append(tool_instructions)
+    for m in request.messages:
+        if m.role == "system":
+            system_chunks.append(content_to_text(m.content))
+    if system_chunks:
+        parts.append(
+            "<|start_header_id|>system<|end_header_id|>\n\n"
+            + "\n\n".join(system_chunks)
+            + "<|eot_id|>"
+        )
+
+    for m in request.messages:
+        if m.role == "system":
+            continue
+        role = "assistant" if m.role == "assistant" else "user"
+        parts.append(
+            f"<|start_header_id|>{role}<|end_header_id|>\n\n{content_to_text(m.content)}<|eot_id|>"
+        )
+
+    parts.append("<|start_header_id|>assistant<|end_header_id|>\n\n")
+    return "".join(parts)
+
+
+def _is_throttle(resp: httpx.Response) -> bool:
+    """Bedrock signals throttling via the ``ThrottlingException`` error type.
+
+    It can arrive as HTTP 429 or, on some paths, HTTP 400 with an
+    ``x-amzn-errortype`` header. Detect both so callers back off correctly.
+    """
+    err_type = resp.headers.get("x-amzn-errortype") or resp.headers.get("X-Amzn-ErrorType") or ""
+    return "throttl" in err_type.lower()
+
+
+register_adapter("bedrock", BedrockAdapter)
diff --git a/server/app/services/llm/adapters/gemini_apikey.py b/server/app/services/llm/adapters/gemini_apikey.py
new file mode 100644
index 00000000..e8afc089
--- /dev/null
+++ b/server/app/services/llm/adapters/gemini_apikey.py
@@ -0,0 +1,158 @@
+"""Google Gemini API-key adapter (native generativelanguage API).
+
+Gemini's native API is NOT OpenAI-compatible, so this adapter talks to
+``generativelanguage.googleapis.com`` directly via httpx rather than reusing
+the shared OpenAI caller. Key differences handled here:
+
+- Tools are nested ``function_declarations`` under a single ``tools`` entry
+  (see ``tool_translation.to_gemini_tools``).
+- Messages use ``contents`` with roles ``user`` / ``model`` and ``parts``.
+- The system prompt maps to ``systemInstruction``.
+- Auth is via the ``x-goog-api-key`` header (never the URL/query string, so the
+  key is not captured in proxy/access logs).
+"""
+
+from __future__ import annotations
+
+import json
+import logging
+from typing import Any
+
+import httpx
+
+from app.services.llm.adapters._shared import extract_api_key, raise_for_status
+from app.services.llm.base import ChatRequest, ChatResponse, LlmAdapter, Message
+from app.services.llm.exceptions import ProviderUnavailable, ToolTranslationError
+from app.services.llm.registry import register_adapter
+from app.services.llm.tool_translation import parse_gemini_response, to_gemini_tools
+
+logger = logging.getLogger(__name__)
+
+GEMINI_BASE_URL = "https://generativelanguage.googleapis.com/v1beta"
+DEFAULT_MODEL = "gemini-2.5-flash"
+DEFAULT_TIMEOUT_SECONDS = 30.0
+MAX_TIMEOUT_SECONDS = 120.0
+
+
+class GeminiApiKeyAdapter(LlmAdapter):
+    connector_type = "gemini_apikey"
+
+    def _extract_api_key(self) -> str:
+        return extract_api_key(self.connector.credentials or "")
+
+    async def chat(self, request: ChatRequest) -> ChatResponse:
+        api_key = self._extract_api_key()
+        model = request.model or self.connector.model_hint or DEFAULT_MODEL
+
+        payload = self._build_payload(request)
+        endpoint = f"{GEMINI_BASE_URL}/models/{model}:generateContent"
+        headers = {
+            "Content-Type": "application/json",
+            "Accept": "application/json",
+            # Header auth keeps the key out of URLs / access logs.
+            "x-goog-api-key": api_key,
+        }
+
+        timeout = min(
+            max(request.timeout_seconds or DEFAULT_TIMEOUT_SECONDS, 1.0),
+            MAX_TIMEOUT_SECONDS,
+        )
+
+        try:
+            async with httpx.AsyncClient(timeout=timeout) as client:
+                resp = await client.post(endpoint, json=payload, headers=headers)
+        except httpx.TimeoutException as exc:
+            raise ProviderUnavailable("Upstream timeout") from exc
+        except httpx.HTTPError as exc:
+            raise ProviderUnavailable("Upstream network error") from exc
+
+        raise_for_status(resp)
+
+        try:
+            body = resp.json()
+        except (json.JSONDecodeError, ValueError) as exc:
+            raise ToolTranslationError("Upstream returned non-JSON body") from exc
+
+        return parse_gemini_response(body)
+
+    async def health_check(self) -> None:
+        # 1-token ping to validate the key + reach the API.
+        ping = ChatRequest(
+            messages=[Message(role="user", content="ping")],
+            max_tokens=1,
+            temperature=0.0,
+        )
+        await self.chat(ping)
+
+    def _build_payload(self, request: ChatRequest) -> dict:
+        body: dict[str, Any] = {"contents": self._translate_messages(request.messages)}
+
+        if request.system:
+            body["systemInstruction"] = {"parts": [{"text": request.system}]}
+
+        generation_config: dict[str, Any] = {}
+        if request.max_tokens is not None:
+            generation_config["maxOutputTokens"] = request.max_tokens
+        if request.temperature is not None:
+            generation_config["temperature"] = request.temperature
+        if generation_config:
+            body["generationConfig"] = generation_config
+
+        tools, tool_config = to_gemini_tools(request.tools, request.force_tool)
+        if tools:
+            body["tools"] = tools
+        if tool_config is not None:
+            body["toolConfig"] = tool_config
+
+        return body
+
+    @staticmethod
+    def _translate_messages(messages: list[Message]) -> list[dict]:
+        """Translate canonical messages to Gemini ``contents``.
+
+        System messages are pulled out by the caller (``request.system``).
+        Assistant turns map to the Gemini ``model`` role; tool-result messages
+        map to a ``functionResponse`` part on a ``user`` turn.
+        """
+        out: list[dict] = []
+        for m in messages:
+            if m.role == "system":
+                # Surfaced via request.system; swallow here for legacy callers.
+                continue
+
+            content = m.content
+            if isinstance(content, list):
+                chunks: list[str] = []
+                for b in content:
+                    if isinstance(b, dict):
+                        chunks.append(str(b.get("text") or ""))
+                    else:
+                        chunks.append(str(getattr(b, "text", "") or ""))
+                text = "".join(chunks)
+            else:
+                text = content or ""
+
+            if m.role == "tool":
+                if not m.tool_call_id:
+                    raise ToolTranslationError("Tool message missing tool_call_id")
+                out.append(
+                    {
+                        "role": "user",
+                        "parts": [
+                            {
+                                "functionResponse": {
+                                    "name": m.tool_call_id,
+                                    "response": {"content": text},
+                                }
+                            }
+                        ],
+                    }
+                )
+                continue
+
+            role = "model" if m.role == "assistant" else "user"
+            out.append({"role": role, "parts": [{"text": text}]})
+        return out
+
+
+register_adapter("gemini_apikey", GeminiApiKeyAdapter)
diff --git a/server/app/services/llm/adapters/openai_apikey.py b/server/app/services/llm/adapters/openai_apikey.py
new file mode 100644
index 00000000..5950d1af
--- /dev/null
+++ b/server/app/services/llm/adapters/openai_apikey.py
@@ -0,0 +1,69 @@
+"""OpenAI Platform API-key adapter."""
+
+from __future__ import annotations
+
+import logging
+from collections.abc import AsyncIterator
+
+from app.services.llm.adapters._httpx_openai import (
+    build_healthcheck_request,
+    call_openai_chat,
+    stream_openai_chat,
+)
+from app.services.llm.adapters._shared import extract_api_key
+from app.services.llm.base import ChatRequest, ChatResponse, ChatResponseChunk, LlmAdapter
+from app.services.llm.registry import register_adapter
+
+logger = logging.getLogger(__name__)
+
+OPENAI_BASE_URL = "https://api.openai.com/v1"
+DEFAULT_MODEL = "gpt-5-mini"
+
+# OpenAI Platform's GPT-5 / o-series models reject the legacy ``max_tokens`` field
+# (HTTP 400 ``unsupported_parameter``) and require ``max_completion_tokens``, which
+# every current OpenAI Platform chat model also accepts. Third-party OpenAI-compatible
+# servers still speak ``max_tokens``, so this override is scoped to the Platform adapter.
+_MAX_TOKENS_FIELD = "max_completion_tokens"
+
+
+class OpenAIApiKeyAdapter(LlmAdapter):
+    connector_type = "openai_apikey"
+
+    def _extract_api_key(self) -> str:
+        return extract_api_key(self.connector.credentials or "")
+
+    async def chat(self, request: ChatRequest) -> ChatResponse:
+        api_key = self._extract_api_key()
+        return await call_openai_chat(
+            base_url=OPENAI_BASE_URL,
+            api_key=api_key,
+            request=request,
+            fallback_model=self.connector.model_hint or DEFAULT_MODEL,
+            max_tokens_field=_MAX_TOKENS_FIELD,
+        )
+
+    async def health_check(self) -> None:
+        api_key = self._extract_api_key()
+        ping = build_healthcheck_request()
+        # We just need to exercise the auth path — discard the response.
+        await call_openai_chat(
+            base_url=OPENAI_BASE_URL,
+            api_key=api_key,
+            request=ping,
+            fallback_model=self.connector.model_hint or DEFAULT_MODEL,
+            max_tokens_field=_MAX_TOKENS_FIELD,
+        )
+
+    async def stream(self, request: ChatRequest) -> AsyncIterator[ChatResponseChunk]:
+        api_key = self._extract_api_key()
+        async for chunk in stream_openai_chat(
+            base_url=OPENAI_BASE_URL,
+            api_key=api_key,
+            request=request,
+            fallback_model=self.connector.model_hint or DEFAULT_MODEL,
+            max_tokens_field=_MAX_TOKENS_FIELD,
+        ):
+            yield chunk
+
+
+register_adapter("openai_apikey", OpenAIApiKeyAdapter)
diff --git a/server/app/services/llm/adapters/openai_compatible.py b/server/app/services/llm/adapters/openai_compatible.py
new file mode 100644
index 00000000..13f311ad
--- /dev/null
+++ b/server/app/services/llm/adapters/openai_compatible.py
@@ -0,0 +1,82 @@
+"""OpenAI-compatible endpoint adapter (Hermes Agent / Ollama / LMStudio / vLLM)."""
+
+from __future__ import annotations
+
+import json
+import logging
+from collections.abc import AsyncIterator
+
+from app.services.llm.adapters._httpx_openai import (
+    build_healthcheck_request,
+    call_openai_chat,
+    stream_openai_chat,
+)
+from app.services.llm.base import ChatRequest, ChatResponse, ChatResponseChunk, LlmAdapter
+from app.services.llm.exceptions import AuthInvalid
+from app.services.llm.registry import register_adapter
+from app.services.llm.url_validator import InvalidBaseUrlError, validate_compatible_base_url
+
+logger = logging.getLogger(__name__)
+
+DEFAULT_MODEL = "gpt-5-mini"
+
+
+class OpenAICompatibleAdapter(LlmAdapter):
+    connector_type = "openai_compatible"
+
+    def _extract_credentials(self) -> tuple[str, str | None]:
+        """Return (base_url, bearer-or-None)."""
+        raw = self.connector.credentials or ""
+        try:
+            blob = json.loads(raw)
+        except (json.JSONDecodeError, TypeError) as exc:
+            raise AuthInvalid("Connector credentials are malformed") from exc
+        if not isinstance(blob, dict):
+            raise AuthInvalid("Connector credentials shape is invalid")
+        # Encrypted credentials are the sole source of truth for routing. base_url_plain
+        # is a display-only admin mirror — never send traffic to it, since it could be
+        # stale relative to the encrypted blob. Fail closed if the blob lacks the URL.
+        base_url = blob.get("base_url")
+        if not base_url:
+            raise AuthInvalid("Connector is missing a base_url")
+        # Final SSRF boundary check: re-validate at call time, since storage-time
+        # validation can be bypassed by stale rows or manual DB edits.
+        try:
+            base_url = validate_compatible_base_url(str(base_url))
+        except InvalidBaseUrlError as exc:
+            raise AuthInvalid("Connector base_url failed validation") from exc
+        bearer = blob.get("bearer")
+        # Empty-string bearer is treated as no bearer.
+        return base_url, (str(bearer) if bearer else None)
+
+    async def chat(self, request: ChatRequest) -> ChatResponse:
+        base_url, bearer = self._extract_credentials()
+        return await call_openai_chat(
+            base_url=base_url,
+            api_key=bearer,
+            request=request,
+            fallback_model=self.connector.model_hint or DEFAULT_MODEL,
+        )
+
+    async def health_check(self) -> None:
+        base_url, bearer = self._extract_credentials()
+        ping = build_healthcheck_request()
+        await call_openai_chat(
+            base_url=base_url,
+            api_key=bearer,
+            request=ping,
+            fallback_model=self.connector.model_hint or DEFAULT_MODEL,
+        )
+
+    async def stream(self, request: ChatRequest) -> AsyncIterator[ChatResponseChunk]:
+        base_url, bearer = self._extract_credentials()
+        async for chunk in stream_openai_chat(
+            base_url=base_url,
+            api_key=bearer,
+            request=request,
+            fallback_model=self.connector.model_hint or DEFAULT_MODEL,
+        ):
+            yield chunk
+
+
+register_adapter("openai_compatible", OpenAICompatibleAdapter)
diff --git a/server/app/services/llm/adapters/openrouter_apikey.py b/server/app/services/llm/adapters/openrouter_apikey.py
new file mode 100644
index 00000000..da97798e
--- /dev/null
+++ b/server/app/services/llm/adapters/openrouter_apikey.py
@@ -0,0 +1,73 @@
+"""OpenRouter API-key adapter.
+
+OpenRouter (https://openrouter.ai) exposes an OpenAI-compatible Chat
+Completions API at a fixed base URL and routes each request to one of many
+upstream models selected via the ``model`` field. A single OpenRouter API key
+therefore unlocks dozens of providers.
+
+This adapter subclasses :class:`OpenAICompatibleAdapter` to inherit the entire
+request/response + error-mapping pipeline. It differs only in:
+
+- a fixed ``base_url`` (``https://openrouter.ai/api/v1``) — never user-supplied
+- credentials stored as ``{"api_key": "sk-or-..."}`` (api-key shape), surfaced
+  to the shared OpenAI caller as the ``Authorization: Bearer`` token.
+"""
+
+from __future__ import annotations
+
+import logging
+
+from app.services.llm.adapters._httpx_openai import (
+    build_healthcheck_request,
+    call_openai_chat,
+)
+from app.services.llm.adapters._shared import extract_fixed_base_credentials
+from app.services.llm.adapters.openai_compatible import OpenAICompatibleAdapter
+from app.services.llm.base import ChatRequest, ChatResponse
+from app.services.llm.registry import register_adapter
+
+logger = logging.getLogger(__name__)
+
+OPENROUTER_BASE_URL = "https://openrouter.ai/api/v1"
+# OpenRouter model ids are namespaced ("provider/model"). This cheap, broadly
+# available default is only used when the connector has no model_hint.
+DEFAULT_MODEL = "openai/gpt-4o-mini"
+
+
+class OpenRouterApiKeyAdapter(OpenAICompatibleAdapter):
+    """OpenRouter connector — OpenAI-compatible with a fixed base URL."""
+
+    connector_type = "openrouter_apikey"
+
+    async def chat(self, request: ChatRequest) -> ChatResponse:
+        base_url, bearer = self._extract_credentials()
+        return await call_openai_chat(
+            base_url=base_url,
+            api_key=bearer,
+            request=request,
+            fallback_model=self.connector.model_hint or DEFAULT_MODEL,
+        )
+
+    async def health_check(self) -> None:
+        base_url, bearer = self._extract_credentials()
+        ping = build_healthcheck_request()
+        await call_openai_chat(
+            base_url=base_url,
+            api_key=bearer,
+            request=ping,
+            fallback_model=self.connector.model_hint or DEFAULT_MODEL,
+        )
+
+    def _extract_credentials(self) -> tuple[str, str | None]:
+        """Return (fixed base_url, api-key bearer).
+
+        OpenRouter stores credentials as ``{"api_key": "..."}`` (like the other
+        api-key connectors) rather than the ``{"base_url", "bearer"}`` shape
+        used by ``openai_compatible``. The base URL is always the fixed
+        OpenRouter endpoint — never user-supplied — which removes the SSRF
+        surface of arbitrary base URLs.
+        """
+        return extract_fixed_base_credentials(self.connector.credentials or "", OPENROUTER_BASE_URL)
+
+
+register_adapter("openrouter_apikey", OpenRouterApiKeyAdapter)
diff --git a/server/app/services/llm/adapters/xai_apikey.py b/server/app/services/llm/adapters/xai_apikey.py
new file mode 100644
index 00000000..dfa073f6
--- /dev/null
+++ b/server/app/services/llm/adapters/xai_apikey.py
@@ -0,0 +1,76 @@
+"""xAI Grok API-key adapter.
+
+xAI exposes an OpenAI-compatible Chat Completions surface at a fixed base URL
+(``https://api.x.ai/v1``). Rather than re-implement the OpenAI wire format we
+subclass :class:`OpenAICompatibleAdapter` and:
+
+- pin the base URL (it is NOT user-supplied — credentials only carry an api_key),
+- extract the api_key from the ``{"api_key": "..."}`` credential blob and pass it
+  through as the bearer token,
+- layer xAI-specific error context on top of the inherited error mapping.
+
+Tool-use mirrors OpenAI function-calling and is handled entirely by the inherited
+``call_openai_chat`` path (``to_openai_tools`` / ``parse_openai_response``).
+"""
+
+from __future__ import annotations
+
+import logging
+
+from app.services.llm.adapters._httpx_openai import (
+    build_healthcheck_request,
+    call_openai_chat,
+)
+from app.services.llm.adapters._shared import extract_fixed_base_credentials
+from app.services.llm.adapters.openai_compatible import OpenAICompatibleAdapter
+from app.services.llm.base import ChatRequest, ChatResponse
+from app.services.llm.exceptions import ProviderUnavailable
+from app.services.llm.registry import register_adapter
+
+logger = logging.getLogger(__name__)
+
+# Fixed xAI Chat Completions API root — never taken from user input.
+XAI_BASE_URL = "https://api.x.ai/v1"
+DEFAULT_MODEL = "grok-3-mini"
+
+
+class XaiApiKeyAdapter(OpenAICompatibleAdapter):
+    """xAI Grok adapter — fixed base URL, api_key credential, OpenAI-compatible wire."""
+
+    connector_type = "xai_apikey"
+
+    def _extract_credentials(self) -> tuple[str, str | None]:
+        """Return (fixed xAI base_url, api_key).
+
+        Unlike the parent ``openai_compatible`` adapter, xAI connectors store an
+        ``{"api_key": "..."}`` blob (the same shape as the other api-key
+        connectors) and the base URL is pinned — it is never user-supplied.
+        """
+        return extract_fixed_base_credentials(self.connector.credentials or "", XAI_BASE_URL)
+
+    async def chat(self, request: ChatRequest) -> ChatResponse:
+        base_url, api_key = self._extract_credentials()
+        try:
+            return await call_openai_chat(
+                base_url=base_url,
+                api_key=api_key,
+                request=request,
+                fallback_model=self.connector.model_hint or DEFAULT_MODEL,
+            )
+        except ProviderUnavailable as exc:
+            # Attach xAI context so telemetry/logs are unambiguous about which
+            # upstream failed. The error class (and gateway mapping) is unchanged.
+            raise ProviderUnavailable(f"xAI provider unavailable: {exc}") from exc
+
+    async def health_check(self) -> None:
+        base_url, api_key = self._extract_credentials()
+        ping = build_healthcheck_request()
+        await call_openai_chat(
+            base_url=base_url,
+            api_key=api_key,
+            request=ping,
+            fallback_model=self.connector.model_hint or DEFAULT_MODEL,
+        )
+
+
+register_adapter("xai_apikey", XaiApiKeyAdapter)
diff --git a/server/app/services/llm/base.py b/server/app/services/llm/base.py
new file mode 100644
index 00000000..124b3854
--- /dev/null
+++ b/server/app/services/llm/base.py
@@ -0,0 +1,173 @@
+"""Canonical request / response types + LlmAdapter ABC.
+
+Adapters convert between provider-native request/response shapes and these
+canonical models. See spec §4.4.
+"""
+
+from __future__ import annotations
+
+from abc import ABC, abstractmethod
+from collections.abc import AsyncIterator
+from typing import Literal
+
+from pydantic import BaseModel, ConfigDict, Field
+
+
+class ContentBlock(BaseModel):
+    """Optional multi-modal content block — text-only in MVP."""
+
+    type: Literal["text"] = "text"
+    text: str
+
+
+class Message(BaseModel):
+    role: Literal["system", "user", "assistant", "tool"]
+    content: str | list[ContentBlock]
+    tool_call_id: str | None = None
+    # When role == "assistant" and the message includes tool_use blocks,
+    # callers may serialise them as text + tool_calls separately. Adapters
+    # handle the per-provider shape; gateway callers just supply text/role.
+
+
+class ToolSpec(BaseModel):
+    """Canonical tool definition — JSON Schema shape carries the input schema."""
+
+    name: str
+    description: str
+    input_schema: dict
+
+
+class ToolCall(BaseModel):
+    """An LLM-issued call to a tool, parsed from the provider response."""
+
+    id: str
+    name: str
+    input: dict
+
+
+class TokenUsage(BaseModel):
+    prompt: int
+    completion: int
+
+
+class ChatRequest(BaseModel):
+    """Provider-agnostic chat request."""
+
+    model_config = ConfigDict(arbitrary_types_allowed=True)
+
+    messages: list[Message]
+    tools: list[ToolSpec] | None = None
+    force_tool: str | None = None
+    max_tokens: int | None = None
+    temperature: float | None = None
+    # Overrides the connector's model_hint when present.
+    model: str | None = None
+    # Per-call timeout in seconds; adapters may clamp to a max.
+    timeout_seconds: float | None = None
+    # Optional system prompt — adapters surface this as the provider's native
+    # system role (Anthropic top-level system; OpenAI as the first system msg).
+    system: str | None = None
+    # Automatic-fallback behaviour when the resolved connector fails with a
+    # transient/credential error (rate-limited, auth-expired, provider-down,
+    # quota-exceeded). Default "none" preserves the original fail-fast behaviour.
+    #   - "none": never fall back; surface the original error.
+    #   - "org_default": on a fallback-eligible error, retry once on the
+    #     org-default connector (if different from the one that failed).
+    #   - "retry_then_org_default": first retry once on the SAME connector, then
+    #     fall back to the org-default connector. Retries are bounded — at most
+    #     one same-connector retry and one org-default attempt; never loops.
+    fallback_policy: Literal["none", "org_default", "retry_then_org_default"] = "none"
+
+
+class ChatResponse(BaseModel):
+    """Provider-agnostic chat response."""
+
+    text: str = ""
+    tool_calls: list[ToolCall] = Field(default_factory=list)
+    stop_reason: Literal["end_turn", "tool_use", "max_tokens", "error"]
+    usage: TokenUsage | None = None
+    # The provider model id that actually produced the response (for telemetry).
+    model: str | None = None
+
+
+class ToolCallDelta(BaseModel):
+    """A fragment of a streamed tool call.
+
+    Providers emit tool-call arguments incrementally. ``index`` groups fragments
+    belonging to the same call (OpenAI sends an array index; Anthropic uses the
+    content-block index). ``id`` / ``name`` arrive once at the start of a call;
+    ``input_json_fragment`` carries the raw, possibly-partial argument JSON text.
+    Consumers concatenate fragments per ``index`` and JSON-parse the result when
+    the stream completes.
+    """
+
+    index: int
+    id: str | None = None
+    name: str | None = None
+    input_json_fragment: str = ""
+
+
+class ChatResponseChunk(BaseModel):
+    """One incremental chunk of a streamed chat response.
+
+    Non-final chunks carry ``text_delta`` and/or ``tool_call_deltas``. The final
+    chunk sets ``done=True`` and carries the canonical ``stop_reason`` plus
+    ``usage`` (when the provider reports it). ``stop_reason`` / ``usage`` are
+    ``None`` on every non-final chunk.
+    """
+
+    text_delta: str = ""
+    tool_call_deltas: list[ToolCallDelta] = Field(default_factory=list)
+    stop_reason: Literal["end_turn", "tool_use", "max_tokens", "error"] | None = None
+    usage: TokenUsage | None = None
+    done: bool = False
+
+
+class LlmAdapter(ABC):
+    """Adapter interface — one per connector_type.
+
+    Adapters are instantiated per call, given the resolved ``LlmConnector`` row.
+    They must read credentials lazily (the row's ``credentials`` column is an
+    ``EncryptedText`` column; accessing the attribute auto-decrypts).
+    """
+
+    #: connector_type identifier — set on the subclass.
+    connector_type: str = ""
+
+    def __init__(self, connector) -> None:  # noqa: ANN001 — LlmConnector type
+        self.connector = connector
+
+    @abstractmethod
+    async def chat(self, request: ChatRequest) -> ChatResponse:
+        """Dispatch a chat request, returning a canonical response.
+
+        Must raise one of:
+        - AuthInvalid (401/403)
+        - RateLimited (429, with retry_after_seconds if provided)
+        - QuotaExceeded (402 / billing failure)
+        - ProviderUnavailable (5xx / network / timeout)
+        - ToolTranslationError (couldn't translate input or parse output)
+        """
+
+    @abstractmethod
+    async def health_check(self) -> None:
+        """Validate the credential against the provider.
+
+        Raises the same typed exceptions as ``chat()``. Returns ``None`` on
+        success.
+        """
+
+    async def stream(self, request: ChatRequest) -> AsyncIterator[ChatResponseChunk]:
+        """Stream a chat response as incremental chunks.
+
+        Default raises :class:`StreamingUnsupported`. Adapters that support
+        provider-native streaming override this. The trailing ``yield`` is
+        unreachable but makes this method an async generator for type-checkers
+        and for callers that iterate before the first ``await``.
+        """
+        from app.services.llm.exceptions import StreamingUnsupported
+
+        raise StreamingUnsupported(
+            f"connector_type={self.connector_type!r} does not support streaming"
+        )
+        yield  # pragma: no cover  (makes this an async generator)
diff --git a/server/app/services/llm/connector_storage.py b/server/app/services/llm/connector_storage.py
new file mode 100644
index 00000000..30fcf50f
--- /dev/null
+++ b/server/app/services/llm/connector_storage.py
@@ -0,0 +1,815 @@
+"""SQLAlchemy CRUD helpers for LlmConnector + audit/call logging."""
+
+from __future__ import annotations
+
+import json
+import logging
+from datetime import datetime
+from typing import Any
+
+from sqlalchemy import case, delete, func, select
+from sqlalchemy.dialects.postgresql import insert as pg_insert
+from sqlalchemy.dialects.sqlite import insert as sqlite_insert
+from sqlalchemy.orm import Session
+
+from app.models.llm_connector import (
+    AUDIT_AUTH_INVALID_OBSERVED,
+    AUDIT_CREATED,
+    AUDIT_CREDENTIALS_ROTATED,
+    AUDIT_DEFAULT_SET,
+    AUDIT_DEFAULT_UNSET,
+    AUDIT_DELETED,
+    AUDIT_HEALTH_CHECK,
+    AUDIT_POLICY_CHANGED,
+    AUDIT_REVOKED_BY_ADMIN,
+    CONNECTOR_TYPE_ANTHROPIC_APIKEY,
+    CONNECTOR_TYPE_AZURE_OPENAI,
+    CONNECTOR_TYPE_BEDROCK,
+    CONNECTOR_TYPE_GEMINI_APIKEY,
+    CONNECTOR_TYPE_OPENAI_APIKEY,
+    CONNECTOR_TYPE_OPENAI_COMPATIBLE,
+    CONNECTOR_TYPE_OPENROUTER_APIKEY,
+    CONNECTOR_TYPE_XAI_APIKEY,
+    STATUS_ACTIVE,
+    STATUS_AUTH_INVALID,
+    STATUS_DISABLED,
+    VALID_CONNECTOR_TYPES,
+    LlmAuditEvent,
+    LlmCallLog,
+    LlmConnector,
+)
+from app.models.llm_feature_preference import LlmFeaturePreference
+from app.models.user import User
+from app.services.llm.url_validator import (
+    InvalidBaseUrlError,
+    validate_compatible_base_url,
+)
+
+logger = logging.getLogger(__name__)
+
+
+def list_connectors_for_user(db: Session, user_id: int) -> list[LlmConnector]:
+    return (
+        db.query(LlmConnector)
+        .filter(LlmConnector.user_id == user_id)
+        .order_by(LlmConnector.created_at.desc())
+        .all()
+    )
+
+
+def list_all_connectors(db: Session) -> list[LlmConnector]:
+    return (
+        db.query(LlmConnector)
+        .order_by(LlmConnector.user_id.asc(), LlmConnector.created_at.desc())
+        .all()
+    )
+
+
+def get_connector_for_user(db: Session, connector_id: int, user_id: int) -> LlmConnector | None:
+    return (
+        db.query(LlmConnector)
+        .filter(LlmConnector.id == connector_id, LlmConnector.user_id == user_id)
+        .one_or_none()
+    )
+
+
+def get_connector(db: Session, connector_id: int) -> LlmConnector | None:
+    return db.get(LlmConnector, connector_id)
+
+
+# API-key connector types (shared by the create + rotate validation dispatch).
+_APIKEY_CONNECTOR_TYPES = (
+    CONNECTOR_TYPE_OPENAI_APIKEY,
+    CONNECTOR_TYPE_ANTHROPIC_APIKEY,
+    CONNECTOR_TYPE_OPENROUTER_APIKEY,
+    CONNECTOR_TYPE_XAI_APIKEY,
+    CONNECTOR_TYPE_GEMINI_APIKEY,
+)
+
+
+def _normalise_model_hint(value: str | None, *, invalid_msg: str) -> str | None:
+    """Strip + validate a model_hint (≤80 chars, safe charset). ``invalid_msg``
+    stays caller-supplied so create vs update keep their distinct error text."""
+    if value is None:
+        return None
+    value = value.strip() or None
+    if value is not None:
+        if len(value) > 80:
+            raise ValueError("model_hint must be 80 characters or fewer")
+        if not _is_safe_model_hint(value):
+            raise ValueError(invalid_msg)
+    return value
+
+
+def _validate_api_key_blob(connector_type: str, api_key: str | None, *, required_msg: str) -> dict:
+    """Validate + assemble an ``{"api_key": ...}`` blob. ``required_msg`` differs
+    between create and rotate, so it stays caller-supplied."""
+    if not api_key:
+        raise ValueError(required_msg)
+    api_key = api_key.strip()
+    if not _looks_like_api_key(connector_type, api_key):
+        raise ValueError("api_key format is invalid")
+    return {"api_key": api_key}
+
+
+class CreateConnectorPayload:
+    """Validated creation payload — see :func:`create_connector`."""
+
+    __slots__ = ("connector_type", "display_name", "credentials", "base_url_plain", "model_hint")
+
+    def __init__(
+        self,
+        *,
+        connector_type: str,
+        display_name: str,
+        credentials: dict,
+        base_url_plain: str | None = None,
+        model_hint: str | None = None,
+    ) -> None:
+        self.connector_type = connector_type
+        self.display_name = display_name
+        self.credentials = credentials
+        self.base_url_plain = base_url_plain
+        self.model_hint = model_hint
+
+
+def build_create_payload(
+    *,
+    connector_type: str,
+    display_name: str,
+    api_key: str | None = None,
+    base_url: str | None = None,
+    bearer: str | None = None,
+    model_hint: str | None = None,
+    aws_access_key_id: str | None = None,
+    aws_secret_access_key: str | None = None,
+    aws_region: str | None = None,
+    aws_model_id: str | None = None,
+    azure_resource_name: str | None = None,
+    azure_deployment_name: str | None = None,
+    azure_api_version: str | None = None,
+) -> CreateConnectorPayload:
+    """Translate request fields into a validated ``CreateConnectorPayload``.
+
+    Raises :class:`ValueError` on validation errors. The caller is responsible
+    for returning a 400 to the client.
+    """
+    if connector_type not in VALID_CONNECTOR_TYPES:
+        raise ValueError(f"Unknown connector_type: {connector_type!r}")
+
+    display_name = (display_name or "").strip()
+    if not display_name:
+        raise ValueError("display_name is required")
+    if len(display_name) > 80:
+        raise ValueError("display_name must be 80 characters or fewer")
+    if any(ord(c) < 0x20 for c in display_name):
+        raise ValueError("display_name must not contain control characters")
+
+    model_hint = _normalise_model_hint(
+        model_hint,
+        invalid_msg=(
+            "model_hint may only contain letters, digits, dot, underscore, hyphen, or slash"
+        ),
+    )
+
+    creds: dict[str, Any]
+    plain_base_url: str | None = None
+
+    if connector_type in _APIKEY_CONNECTOR_TYPES:
+        creds = _validate_api_key_blob(connector_type, api_key, required_msg="api_key is required")
+    elif connector_type == CONNECTOR_TYPE_OPENAI_COMPATIBLE:
+        if not base_url:
+            raise ValueError("base_url is required")
+        try:
+            plain_base_url = validate_compatible_base_url(base_url)
+        except InvalidBaseUrlError as exc:
+            raise ValueError(str(exc)) from exc
+        creds = {"base_url": plain_base_url, "bearer": bearer or None}
+    elif connector_type == CONNECTOR_TYPE_BEDROCK:
+        creds = _build_bedrock_creds(
+            aws_access_key_id=aws_access_key_id,
+            aws_secret_access_key=aws_secret_access_key,
+            aws_region=aws_region,
+            aws_model_id=aws_model_id,
+        )
+    elif connector_type == CONNECTOR_TYPE_AZURE_OPENAI:
+        if not api_key:
+            raise ValueError("api_key is required")
+        api_key = api_key.strip()
+        creds = _build_azure_creds(
+            api_key=api_key,
+            azure_resource_name=azure_resource_name,
+            azure_deployment_name=azure_deployment_name,
+            azure_api_version=azure_api_version,
+        )
+    else:  # pragma: no cover — guarded by the membership check above
+        raise ValueError(f"Unsupported connector_type: {connector_type!r}")
+
+    return CreateConnectorPayload(
+        connector_type=connector_type,
+        display_name=display_name,
+        credentials=creds,
+        base_url_plain=plain_base_url,
+        model_hint=model_hint,
+    )
+
+
+_OPENAI_KEY_PREFIXES = ("sk-",)
+_ANTHROPIC_KEY_PREFIX = "sk-ant-"
+_OPENROUTER_KEY_PREFIX = "sk-or-"
+_XAI_KEY_PREFIX = "xai-"
+# Google AI Studio (Gemini) keys are "AIza" + 35 url-safe chars = 39 total.
+_GEMINI_KEY_PREFIX = "AIza"
+_GEMINI_KEY_LENGTH = 39
+_SAFE_CHARS = set("abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ0123456789-_.")
+# Slash is permitted so namespaced model ids (e.g. OpenRouter's
+# "provider/model") validate. The hint is only ever sent as the request-body
+# "model" field — never used to build a filesystem/URL path.
+_SAFE_MODEL_CHARS = set("abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ0123456789-_./")
+
+
+def _is_safe_model_hint(s: str) -> bool:
+    return all(c in _SAFE_MODEL_CHARS for c in s)
+
+
+# AWS region tokens are lowercase alnum + hyphen (e.g. us-east-1, eu-central-1).
+_AWS_REGION_CHARS = set("abcdefghijklmnopqrstuvwxyz0123456789-")
+# Bedrock model ids look like "anthropic.claude-3-5-sonnet-20241022-v2:0" or
+# "meta.llama3-70b-instruct-v1:0" — allow the inference-profile/ARN-ish chars.
+_AWS_MODEL_ID_CHARS = set("abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ0123456789-_.:/")
+
+
+def _build_bedrock_creds(
+    *,
+    aws_access_key_id: str | None,
+    aws_secret_access_key: str | None,
+    aws_region: str | None,
+    aws_model_id: str | None,
+) -> dict[str, str]:
+    """Validate + assemble the bedrock credentials blob.
+
+    Raises :class:`ValueError` (→ HTTP 400) on any malformed field. No AWS
+    dependency: the access key id / secret are opaque strings; we only sanity
+    check shape and reject obviously-bad input before persisting.
+    """
+    access_key = (aws_access_key_id or "").strip()
+    secret_key = (aws_secret_access_key or "").strip()
+    region = (aws_region or "").strip()
+    model_id = (aws_model_id or "").strip()
+
+    if not access_key:
+        raise ValueError("aws_access_key_id is required")
+    if not secret_key:
+        raise ValueError("aws_secret_access_key is required")
+    if not region:
+        raise ValueError("aws_region is required")
+    if not model_id:
+        raise ValueError("aws_model_id is required")
+
+    if " " in access_key or "\n" in access_key or not all(c in _SAFE_CHARS for c in access_key):
+        raise ValueError("aws_access_key_id format is invalid")
+    if " " in secret_key or "\n" in secret_key:
+        raise ValueError("aws_secret_access_key format is invalid")
+    if not all(c in _AWS_REGION_CHARS for c in region):
+        raise ValueError("aws_region format is invalid")
+    if not all(c in _AWS_MODEL_ID_CHARS for c in model_id):
+        raise ValueError("aws_model_id format is invalid")
+
+    return {
+        "aws_access_key_id": access_key,
+        "aws_secret_access_key": secret_key,
+        "aws_region": region,
+        "aws_model_id": model_id,
+    }
+
+
+def _looks_like_api_key(connector_type: str, key: str) -> bool:
+    """Cheap shape check — full validation is on the upstream API at health-check time."""
+    if not key or " " in key or "\n" in key:
+        return False
+    if not all(c in _SAFE_CHARS for c in key):
+        return False
+    if connector_type == CONNECTOR_TYPE_ANTHROPIC_APIKEY:
+        return key.startswith(_ANTHROPIC_KEY_PREFIX) and len(key) >= len(_ANTHROPIC_KEY_PREFIX) + 30
+    if connector_type == CONNECTOR_TYPE_OPENROUTER_APIKEY:
+        min_len = len(_OPENROUTER_KEY_PREFIX) + 20
+        return key.startswith(_OPENROUTER_KEY_PREFIX) and len(key) >= min_len
+    if connector_type == CONNECTOR_TYPE_OPENAI_APIKEY:
+        return any(key.startswith(p) for p in _OPENAI_KEY_PREFIXES) and len(key) >= 20
+    if connector_type == CONNECTOR_TYPE_XAI_APIKEY:
+        return key.startswith(_XAI_KEY_PREFIX) and len(key) >= len(_XAI_KEY_PREFIX) + 20
+    if connector_type == CONNECTOR_TYPE_GEMINI_APIKEY:
+        # Google "AIza…" keys are a fixed 39-char url-safe string.
+        return key.startswith(_GEMINI_KEY_PREFIX) and len(key) == _GEMINI_KEY_LENGTH
+    return False
+
+
+# Azure resource/deployment names: letters, digits, hyphen (Azure naming rules).
+_AZURE_NAME_CHARS = set("abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ0123456789-")
+# api-version is a date-ish token, optionally with a -preview suffix.
+_AZURE_VERSION_CHARS = set("abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ0123456789-.")
+
+
+def _validate_azure_field(name: str, value: str | None, allowed: set[str], max_len: int) -> str:
+    if not value:
+        raise ValueError(f"{name} is required")
+    value = value.strip()
+    if not value:
+        raise ValueError(f"{name} is required")
+    if len(value) > max_len:
+        raise ValueError(f"{name} must be {max_len} characters or fewer")
+    if not all(c in allowed for c in value):
+        raise ValueError(f"{name} contains invalid characters")
+    return value
+
+
+def _build_azure_creds(
+    *,
+    api_key: str | None,
+    azure_resource_name: str | None,
+    azure_deployment_name: str | None,
+    azure_api_version: str | None,
+) -> dict[str, Any]:
+    """Validate + assemble the Azure OpenAI credential blob.
+
+    All four fields (api_key + the three azure_* config values) are stored in
+    the encrypted blob — there are no dedicated DB columns.
+    """
+    if not api_key or not api_key.strip():
+        raise ValueError("api_key is required")
+    return {
+        "api_key": api_key.strip(),
+        "azure_resource_name": _validate_azure_field(
+            "azure_resource_name", azure_resource_name, _AZURE_NAME_CHARS, 120
+        ),
+        "azure_deployment_name": _validate_azure_field(
+            "azure_deployment_name", azure_deployment_name, _AZURE_NAME_CHARS, 120
+        ),
+        "azure_api_version": _validate_azure_field(
+            "azure_api_version", azure_api_version, _AZURE_VERSION_CHARS, 40
+        ),
+    }
+
+
+def _load_existing_blob(connector: LlmConnector) -> dict[str, Any]:
+    """Decode the connector's current credential blob (best-effort).
+
+    Returns an empty dict when the blob is missing or malformed so callers can
+    treat absent values as "no prior value" during partial rotation.
+    """
+    raw = connector.credentials or ""
+    try:
+        blob = json.loads(raw)
+    except (json.JSONDecodeError, TypeError):
+        return {}
+    return blob if isinstance(blob, dict) else {}
+
+
+def create_connector(db: Session, *, user_id: int, payload: CreateConnectorPayload) -> LlmConnector:
+    """Persist a new connector. Caller is responsible for audit event + commit."""
+    row = LlmConnector(
+        user_id=user_id,
+        connector_type=payload.connector_type,
+        display_name=payload.display_name,
+        status=STATUS_ACTIVE,
+        credentials=json.dumps(payload.credentials),
+        base_url_plain=payload.base_url_plain,
+        model_hint=payload.model_hint,
+    )
+    db.add(row)
+    db.flush()
+    db.refresh(row)
+    return row
+
+
+def rotate_credentials(
+    db: Session,
+    *,
+    connector: LlmConnector,
+    api_key: str | None = None,
+    base_url: str | None = None,
+    bearer: str | None = None,
+    aws_access_key_id: str | None = None,
+    aws_secret_access_key: str | None = None,
+    aws_region: str | None = None,
+    aws_model_id: str | None = None,
+    azure_resource_name: str | None = None,
+    azure_deployment_name: str | None = None,
+    azure_api_version: str | None = None,
+) -> LlmConnector:
+    """Rotate the credential blob in-place. Caller commits."""
+    blob: dict[str, Any]
+    if connector.connector_type in _APIKEY_CONNECTOR_TYPES:
+        blob = _validate_api_key_blob(
+            connector.connector_type, api_key, required_msg="api_key is required for rotation"
+        )
+    elif connector.connector_type == CONNECTOR_TYPE_OPENAI_COMPATIBLE:
+        if not base_url:
+            raise ValueError("base_url is required for rotation")
+        try:
+            base_url = validate_compatible_base_url(base_url)
+        except InvalidBaseUrlError as exc:
+            raise ValueError(str(exc)) from exc
+        blob = {"base_url": base_url, "bearer": bearer or None}
+        connector.base_url_plain = base_url
+    elif connector.connector_type == CONNECTOR_TYPE_BEDROCK:
+        # Partial rotation: keep existing fields when a new value isn't supplied.
+        existing: dict[str, Any] = {}
+        try:
+            parsed = json.loads(connector.credentials or "{}")
+            if isinstance(parsed, dict):
+                existing = parsed
+        except (json.JSONDecodeError, TypeError):
+            existing = {}
+        blob = _build_bedrock_creds(
+            aws_access_key_id=aws_access_key_id or existing.get("aws_access_key_id"),
+            aws_secret_access_key=(aws_secret_access_key or existing.get("aws_secret_access_key")),
+            aws_region=aws_region or existing.get("aws_region"),
+            aws_model_id=aws_model_id or existing.get("aws_model_id"),
+        )
+    elif connector.connector_type == CONNECTOR_TYPE_AZURE_OPENAI:
+        # Partial rotation: any omitted field keeps its current value, so an
+        # admin can swap just the resource/deployment/version (or just the key)
+        # without recreating the connector.
+        # Only None means "field omitted, keep current value". An explicit ""
+        # is passed through to _build_azure_creds() so it is rejected rather
+        # than silently preserving the old value.
+        current = _load_existing_blob(connector)
+        new_api_key = current.get("api_key") if api_key is None else api_key.strip()
+        blob = _build_azure_creds(
+            api_key=new_api_key,
+            azure_resource_name=(
+                current.get("azure_resource_name")
+                if azure_resource_name is None
+                else azure_resource_name
+            ),
+            azure_deployment_name=(
+                current.get("azure_deployment_name")
+                if azure_deployment_name is None
+                else azure_deployment_name
+            ),
+            azure_api_version=(
+                current.get("azure_api_version") if azure_api_version is None else azure_api_version
+            ),
+        )
+    else:  # pragma: no cover
+        raise ValueError(f"Unsupported connector_type: {connector.connector_type!r}")
+
+    connector.credentials = json.dumps(blob)
+    # Clear status/last_error on successful rotation — caller may run a fresh health check.
+    if connector.status == STATUS_AUTH_INVALID:
+        connector.status = STATUS_ACTIVE
+        connector.last_error = None
+    return connector
+
+
+def update_metadata(
+    connector: LlmConnector,
+    *,
+    display_name: str | None = None,
+    model_hint: str | None = None,
+) -> LlmConnector:
+    if display_name is not None:
+        display_name = display_name.strip()
+        if not display_name:
+            raise ValueError("display_name is required")
+        if len(display_name) > 80:
+            raise ValueError("display_name must be 80 characters or fewer")
+        if any(ord(c) < 0x20 for c in display_name):
+            raise ValueError("display_name must not contain control characters")
+        connector.display_name = display_name
+    if model_hint is not None:
+        connector.model_hint = _normalise_model_hint(
+            model_hint, invalid_msg="model_hint contains invalid characters"
+        )
+    return connector
+
+
+def delete_connector(db: Session, connector: LlmConnector) -> None:
+    db.delete(connector)
+
+
+def set_default_for_user(db: Session, *, connector: LlmConnector) -> LlmConnector:
+    """Mark ``connector`` as the DJ's default and clear any sibling defaults.
+
+    Atomic clear-then-set: all other rows for ``connector.user_id`` are flipped
+    to ``is_default = False`` in a single UPDATE before the target row is
+    flipped to True. This sidesteps the partial unique index race that would
+    otherwise occur if two SET requests landed concurrently — the worst case
+    is the second request overwriting the first, which is the user's intent.
+    The caller commits and writes the audit event.
+
+    No-ops gracefully when ``connector.is_default`` is already True (the
+    sibling clear still runs to fix any drift, e.g. a stale row left behind
+    by an aborted migration backfill).
+    """
+    db.query(LlmConnector).filter(
+        LlmConnector.user_id == connector.user_id,
+        LlmConnector.id != connector.id,
+        LlmConnector.is_default == True,  # noqa: E712
+    ).update({LlmConnector.is_default: False}, synchronize_session=False)
+    connector.is_default = True
+    db.flush()
+    return connector
+
+
+def unset_default_for_user(db: Session, *, connector: LlmConnector) -> LlmConnector:
+    """Clear the explicit-default flag. Caller commits + audits."""
+    connector.is_default = False
+    db.flush()
+    return connector
+
+
+def revoke_connector(connector: LlmConnector) -> LlmConnector:
+    """Admin-only: mark a connector disabled. Caller commits + audits."""
+    connector.status = STATUS_DISABLED
+    return connector
+
+
+def get_feature_preferences_for_user(db: Session, user_id: int) -> list[LlmFeaturePreference]:
+    """Return all of a DJ's per-feature connector pins (issue #337)."""
+    return (
+        db.query(LlmFeaturePreference)
+        .filter(LlmFeaturePreference.user_id == user_id)
+        .order_by(LlmFeaturePreference.feature.asc())
+        .all()
+    )
+
+
+def get_feature_preference(
+    db: Session, *, user_id: int, feature: str
+) -> LlmFeaturePreference | None:
+    """Return the DJ's pin for ``feature``, or ``None`` if unset."""
+    return (
+        db.query(LlmFeaturePreference)
+        .filter(
+            LlmFeaturePreference.user_id == user_id,
+            LlmFeaturePreference.feature == feature,
+        )
+        .one_or_none()
+    )
+
+
+def set_feature_preference(
+    db: Session, *, user_id: int, feature: str, connector_id: int
+) -> LlmFeaturePreference:
+    """Upsert the DJ's pin for ``feature`` → ``connector_id``. Caller commits.
+
+    Replace-in-place when a row already exists so the UNIQUE constraint on
+    ``(user_id, feature)`` is never violated.
+
+    Concurrency-safe via a DB-native ``ON CONFLICT … DO UPDATE`` upsert keyed on
+    ``(user_id, feature)``. Two requests racing to pin the same feature resolve
+    deterministically (last writer wins) in a single atomic statement, instead
+    of one of them tripping ``uq_llm_feature_pref_user_feature`` and bubbling a
+    500. Works on both Postgres (prod) and SQLite (tests).
+    """
+    table = LlmFeaturePreference.__table__
+    dialect = db.bind.dialect.name if db.bind is not None else ""
+    insert_fn = pg_insert if dialect == "postgresql" else sqlite_insert
+    stmt = insert_fn(table).values(user_id=user_id, feature=feature, connector_id=connector_id)
+    stmt = stmt.on_conflict_do_update(
+        index_elements=[table.c.user_id, table.c.feature],
+        set_={"connector_id": connector_id},
+    )
+    db.execute(stmt)
+    db.flush()
+    row = get_feature_preference(db, user_id=user_id, feature=feature)
+    if row is None:  # pragma: no cover - the upsert guarantees the row exists
+        raise RuntimeError("feature preference upsert did not persist a row")
+    # ON CONFLICT DO UPDATE bypasses the ORM, so an already-loaded row may hold a
+    # stale connector_id — refresh just this instance, not the whole session.
+    db.refresh(row)
+    return row
+
+
+def clear_feature_preference(db: Session, *, user_id: int, feature: str) -> bool:
+    """Delete the DJ's pin for ``feature``. Returns True iff a row was removed.
+
+    Caller commits.
+    """
+    existing = get_feature_preference(db, user_id=user_id, feature=feature)
+    if existing is None:
+        return False
+    db.delete(existing)
+    db.flush()
+    return True
+
+
+def audit_event(
+    db: Session,
+    *,
+    actor_user_id: int,
+    target_connector_id: int | None,
+    event_type: str,
+) -> LlmAuditEvent:
+    row = LlmAuditEvent(
+        actor_user_id=actor_user_id,
+        target_connector_id=target_connector_id,
+        event_type=event_type,
+    )
+    db.add(row)
+    db.flush()
+    return row
+
+
+def log_call(
+    db: Session,
+    *,
+    connector_id: int,
+    purpose: str,
+    status: str,
+    latency_ms: int,
+    tokens_in: int | None = None,
+    tokens_out: int | None = None,
+    error_code: str | None = None,
+) -> LlmCallLog:
+    row = LlmCallLog(
+        connector_id=connector_id,
+        purpose=purpose,
+        status=status,
+        latency_ms=latency_ms,
+        tokens_in=tokens_in,
+        tokens_out=tokens_out,
+        error_code=error_code,
+    )
+    db.add(row)
+    db.flush()
+    return row
+
+
+def purge_call_log_older_than(db: Session, *, retention_days: int) -> int:
+    """Delete llm_call_log rows older than ``retention_days``.
+
+    Returns the number of rows deleted. The caller owns the transaction
+    (commits). ``retention_days`` is supplied by the caller (which reads it
+    from system settings each run) so the retention window stays configurable
+    without a hardcoded constant.
+    """
+    from datetime import timedelta
+
+    from app.core.time import utcnow
+
+    # Fail closed on out-of-bounds windows. A non-positive value would push the
+    # cutoff to now/future and delete nearly all history; an oversized value is
+    # equally suspect. The admin UI/schema clamp to 7-365, so a value outside
+    # that range means a corrupt or tampered persisted setting — refuse rather
+    # than over-delete. The daily cleanup loop catches this and retries next pass.
+    if not 7 <= retention_days <= 365:
+        raise ValueError("retention_days must be between 7 and 365")
+
+    cutoff = utcnow() - timedelta(days=retention_days)
+    result = db.execute(delete(LlmCallLog).where(LlmCallLog.created_at < cutoff))
+    return result.rowcount or 0
+
+
+def get_user_label(db: Session, user_id: int) -> str:
+    user = db.get(User, user_id)
+    return user.username if user else f"user#{user_id}"
+
+
+def get_usage_stats(db: Session, *, days: int = 30) -> list[dict]:
+    """Aggregate per-connector telemetry for the admin Usage card.
+
+    Returns a list of dicts with: connector_id, total_calls, total_tokens_in,
+    total_tokens_out, error_count. The caller joins back to LlmConnector for
+    display labels.
+    """
+    from datetime import timedelta
+
+    from app.core.time import utcnow
+
+    cutoff = utcnow() - timedelta(days=days)
+
+    stmt = (
+        select(
+            LlmCallLog.connector_id,
+            func.count(LlmCallLog.id).label("total_calls"),
+            func.coalesce(func.sum(LlmCallLog.tokens_in), 0).label("total_tokens_in"),
+            func.coalesce(func.sum(LlmCallLog.tokens_out), 0).label("total_tokens_out"),
+            func.sum(case((LlmCallLog.status != "ok", 1), else_=0)).label("error_count"),
+        )
+        .where(LlmCallLog.created_at >= cutoff)
+        .group_by(LlmCallLog.connector_id)
+    )
+    rows = db.execute(stmt).all()
+    return [
+        {
+            "connector_id": int(r.connector_id),
+            "total_calls": int(r.total_calls or 0),
+            "total_tokens_in": int(r.total_tokens_in or 0),
+            "total_tokens_out": int(r.total_tokens_out or 0),
+            "error_count": int(r.error_count or 0),
+        }
+        for r in rows
+    ]
+
+
+def _calendar_month_start() -> datetime:
+    """First instant (UTC, naive) of the current calendar month."""
+    from app.core.time import utcnow
+
+    now = utcnow()
+    return now.replace(day=1, hour=0, minute=0, second=0, microsecond=0)
+
+
+def current_month_token_usage(db: Session, connector_id: int) -> int:
+    """Sum tokens_in + tokens_out for ``connector_id`` in the current month.
+
+    Direct aggregation against the indexed ``llm_call_log.created_at`` column.
+    NULL token counts are coalesced to 0. Returns 0 when there are no rows.
+    Used by the gateway pre-flight cap check + the admin usage-vs-cap display
+    (issue #339).
+    """
+    month_start = _calendar_month_start()
+    total = db.execute(
+        select(
+            func.coalesce(func.sum(LlmCallLog.tokens_in), 0)
+            + func.coalesce(func.sum(LlmCallLog.tokens_out), 0)
+        ).where(
+            LlmCallLog.connector_id == connector_id,
+            LlmCallLog.created_at >= month_start,
+        )
+    ).scalar_one()
+    return int(total or 0)
+
+
+def current_month_token_usage_bulk(db: Session, connector_ids: list[int]) -> dict[int, int]:
+    """Sum current-month tokens (tokens_in + tokens_out) for many connectors.
+
+    Single grouped aggregate over the indexed ``llm_call_log.created_at`` column
+    — avoids the N+1 of calling :func:`current_month_token_usage` per connector
+    in the admin list endpoint. Returns a ``{connector_id: total}`` map;
+    connectors with no rows this month are simply absent (callers default to 0).
+    Returns an empty dict when ``connector_ids`` is empty.
+    """
+    if not connector_ids:
+        return {}
+    month_start = _calendar_month_start()
+    rows = db.execute(
+        select(
+            LlmCallLog.connector_id,
+            (
+                func.coalesce(func.sum(LlmCallLog.tokens_in), 0)
+                + func.coalesce(func.sum(LlmCallLog.tokens_out), 0)
+            ).label("total"),
+        )
+        .where(
+            LlmCallLog.connector_id.in_(connector_ids),
+            LlmCallLog.created_at >= month_start,
+        )
+        .group_by(LlmCallLog.connector_id)
+    ).all()
+    return {int(r.connector_id): int(r.total or 0) for r in rows}
+
+
+def set_monthly_cap(connector: LlmConnector, cap: int | None) -> LlmConnector:
+    """Set (or clear) the connector's monthly token cap. Caller commits.
+
+    ``cap=None`` clears the cap (unlimited). A non-None cap must be a
+    non-negative integer; negative values are rejected with ``ValueError``
+    (→ HTTP 400 at the API boundary).
+    """
+    if cap is not None and cap < 0:
+        raise ValueError("monthly_token_cap must be a non-negative integer or null")
+    connector.monthly_token_cap = cap
+    return connector
+
+
+# Re-export audit event constants for callers
+__all__ = [
+    "AUDIT_AUTH_INVALID_OBSERVED",
+    "AUDIT_CREATED",
+    "AUDIT_CREDENTIALS_ROTATED",
+    "AUDIT_DEFAULT_SET",
+    "AUDIT_DEFAULT_UNSET",
+    "AUDIT_DELETED",
+    "AUDIT_HEALTH_CHECK",
+    "AUDIT_POLICY_CHANGED",
+    "AUDIT_REVOKED_BY_ADMIN",
+    "CreateConnectorPayload",
+    "audit_event",
+    "build_create_payload",
+    "clear_feature_preference",
+    "create_connector",
+    "current_month_token_usage",
+    "current_month_token_usage_bulk",
+    "delete_connector",
+    "get_connector",
+    "get_connector_for_user",
+    "get_feature_preference",
+    "get_feature_preferences_for_user",
+    "get_usage_stats",
+    "get_user_label",
+    "list_all_connectors",
+    "list_connectors_for_user",
+    "log_call",
+    "purge_call_log_older_than",
+    "revoke_connector",
+    "rotate_credentials",
+    "set_default_for_user",
+    "set_feature_preference",
+    "set_monthly_cap",
+    "unset_default_for_user",
+    "update_metadata",
+]
diff --git a/server/app/services/llm/exceptions.py b/server/app/services/llm/exceptions.py
new file mode 100644
index 00000000..53166091
--- /dev/null
+++ b/server/app/services/llm/exceptions.py
@@ -0,0 +1,54 @@
+"""Typed exceptions for the LLM gateway.
+
+Adapters raise these specific types; the gateway never re-raises a provider's
+native exception or HTTP error body to callers — that prevents bearer-token /
+credential leakage in error messages.
+"""
+
+from __future__ import annotations
+
+
+class LlmError(Exception):
+    """Base class for all gateway-raised LLM errors."""
+
+
+class NoLlmConfigured(LlmError):
+    """No active connector for the actor and no system default connector."""
+
+
+class AuthInvalid(LlmError):
+    """The provider returned 401 / 403 — connector marked auth_invalid."""
+
+
+class RateLimited(LlmError):
+    """The provider returned 429 — caller should back off and try later."""
+
+    def __init__(self, message: str = "Rate limited", retry_after_seconds: int | None = None):
+        super().__init__(message)
+        self.retry_after_seconds = retry_after_seconds
+
+
+class QuotaExceeded(LlmError):
+    """Billing / quota failure (402 or provider-specific quota error)."""
+
+
+class QuotaCapReached(LlmError):
+    """The DJ's admin-set monthly token cap for this connector is reached.
+
+    Distinct from :class:`QuotaExceeded` (a provider-side billing/quota error):
+    this is a WrzDJ-internal pre-flight refusal raised *before* any provider
+    call, so no tokens are spent. The DJ-facing message is fixed and contains
+    no internal details — see the gateway pre-flight check (issue #339).
+    """
+
+
+class ProviderUnavailable(LlmError):
+    """Transient upstream failure — 5xx, network error, or timeout."""
+
+
+class ToolTranslationError(LlmError):
+    """Canonical ToolSpec couldn't be translated or the response couldn't be parsed."""
+
+
+class StreamingUnsupported(LlmError):
+    """The resolved adapter does not implement provider-native streaming."""
diff --git a/server/app/services/llm/gateway.py b/server/app/services/llm/gateway.py
index 0f39e9f0..0fad73d4 100644
--- a/server/app/services/llm/gateway.py
+++ b/server/app/services/llm/gateway.py
@@ -1,118 +1,492 @@
-"""Provider-agnostic LLM gateway (Phase 0 interface stub).
-
-This is the single call surface WrzDJSet codes against. The real gateway
-(OAuth multi-provider dispatch) ships in a parallel worktree; until it merges
-this stub delegates to the existing Anthropic path in
-``services/recommendation/llm_client.py``. Per exec-summary 6/9 ("slip
-insurance"), WrzDJSet is NOT blocked on the gateway merge.
-
-CRITICAL: no provider SDK is imported here. Model identifiers are plain
-strings resolved from a ``model_hint``. The actual provider call is isolated in
-``_raw_provider_call``, which delegates to the existing recommendation LLM
-client; the ``anthropic`` import lives only in that client module, never here.
+"""Gateway entrypoint — resolves a connector and dispatches to the adapter.
+
+See spec §4.3.
+
+Resolution order:
+1. If ``actor`` is not ``None``:
+   a. The DJ's per-feature pin for ``purpose`` if set and the pinned connector
+      is active (``LlmFeaturePreference`` — issue #337). Skipped gracefully when
+      the pinned connector was deleted or is no longer active.
+   b. Else: the DJ's explicit default active connector if one is pinned
+      (``LlmConnector.is_default = True``) — issue #336.
+   c. Else: most-recently-used active connector for the DJ.
+2. Else: ``SystemSettings.llm_default_connector_id`` if set and active.
+3. Else: raise :class:`NoLlmConfigured`.
+
+Auto-fallback (issue #338):
+When ``ChatRequest.fallback_policy`` is not ``"none"`` and the resolved
+connector fails with a transient / credential error (rate-limited, auth
+expired, provider unavailable, quota exceeded), the gateway optionally falls
+back to the org-default connector. Retries are explicitly bounded — at most one
+same-connector retry (for ``retry_then_org_default``) plus one org-default
+attempt; the chain never loops.
 """
 
-from dataclasses import dataclass, field
-from typing import Any, Literal
+from __future__ import annotations
+
+import logging
+from collections.abc import AsyncIterator
+from time import monotonic
+
+from sqlalchemy import desc, nulls_last
+from sqlalchemy.orm import Session
+
+from app.core.time import utcnow
+from app.models.llm_connector import (
+    AUDIT_AUTH_INVALID_OBSERVED,
+    STATUS_ACTIVE,
+    STATUS_AUTH_INVALID,
+    LlmConnector,
+)
+from app.models.system_settings import SystemSettings
+from app.models.user import User
+from app.services.llm.base import ChatRequest, ChatResponse, ChatResponseChunk
+from app.services.llm.connector_storage import (
+    audit_event,
+    current_month_token_usage,
+    get_feature_preference,
+    log_call,
+)
+from app.services.llm.exceptions import (
+    AuthInvalid,
+    LlmError,
+    NoLlmConfigured,
+    ProviderUnavailable,
+    QuotaCapReached,
+    QuotaExceeded,
+    RateLimited,
+    ToolTranslationError,
+)
+from app.services.llm.registry import get_adapter_class
 
-ModelHint = Literal["fast", "strong"]
-MODEL_HINTS: tuple[str, ...] = ("fast", "strong")
+logger = logging.getLogger(__name__)
 
+# Audit event type prefix for auto-fallback. The trigger reason is appended
+# (e.g. ``fallback_triggered:rate_limited``) so it fits the existing
+# ``llm_audit_event.event_type`` String(60) column without a migration. The
+# audit row's ``target_connector_id`` points at the fallback connector.
+AUDIT_FALLBACK_TRIGGERED = "fallback_triggered"
 
-@dataclass
-class GatewayResponse:
-    """Normalized LLM response: tool calls + free text, provider-agnostic."""
+# Maps fallback-eligible exception types → the trigger token recorded in the
+# audit event. Errors NOT in this map (ToolTranslationError, generic LlmError)
+# are never fallback-eligible: a different connector would hit the same problem.
+_FALLBACK_TRIGGERS: dict[type[LlmError], str] = {
+    RateLimited: "rate_limited",
+    AuthInvalid: "auth_invalid",
+    ProviderUnavailable: "provider_unavailable",
+    QuotaExceeded: "quota_exceeded",
+}
 
-    tool_calls: list[dict[str, Any]] = field(default_factory=list)
-    text: str = ""
 
+def _fallback_trigger(exc: LlmError) -> str | None:
+    """Return the trigger token for a fallback-eligible error, else ``None``."""
+    for exc_type, token in _FALLBACK_TRIGGERS.items():
+        if isinstance(exc, exc_type):
+            return token
+    return None
 
-def _resolve_model(model_hint: ModelHint) -> str:
-    """Map a coarse capability hint to a concrete model string.
 
-    Reads the configured Anthropic model for the temporary delegating impl.
-    When the OAuth gateway lands this becomes a provider-aware lookup driven
-    by SystemSettings; the hint contract ("fast" vs "strong") stays stable.
+def _enforce_monthly_cap(db: Session, connector: LlmConnector) -> None:
+    """Pre-flight: refuse dispatch when the connector's monthly cap is reached.
+
+    No-op when the connector has no cap (``monthly_token_cap is None``).
+    Compares the current calendar month's summed token usage against the cap;
+    refuses when usage already meets or exceeds it. Raised BEFORE any provider
+    call, so no tokens are spent and editing the cap never disrupts an
+    already-dispatched (in-flight) call (issue #339).
+
+    The error message is fixed and leaks no internals (usage totals, cap value,
+    connector id) — see the issue's security note.
     """
-    from app.core.config import get_settings
+    cap = connector.monthly_token_cap
+    if cap is None:
+        return
+    used = current_month_token_usage(db, connector.id)
+    if used >= cap:
+        raise QuotaCapReached("Your monthly token cap is reached. Contact your admin to raise it.")
+
+
+class Gateway:
+    """Single dispatch entrypoint."""
+
+    @staticmethod
+    async def dispatch(
+        db: Session,
+        actor: User | None,
+        request: ChatRequest,
+        *,
+        purpose: str,
+    ) -> ChatResponse:
+        primary = _resolve_connector(db, actor, purpose=purpose)
+        actor_id = actor.id if actor else _system_actor_id(db, primary)
+
+        # Pre-flight: refuse if the resolved connector's monthly cap is reached
+        # (issue #339). Raised before any provider call — no tokens spent, and
+        # a cap edit never disrupts an in-flight call. QuotaCapReached is not in
+        # _FALLBACK_TRIGGERS, so it short-circuits to the caller (a cap is not a
+        # transient/credential error a different connector would dodge).
+        _enforce_monthly_cap(db, primary)
+
+        # Attempt 1: primary connector.
+        try:
+            return await _attempt(db, primary, request, purpose=purpose, actor_id=actor_id)
+        except LlmError as exc:
+            trigger = _fallback_trigger(exc)
+            policy = request.fallback_policy
+            if policy == "none" or trigger is None:
+                raise
+
+            # Attempt 2 (retry_then_org_default only): one bounded retry on the
+            # SAME connector before falling back.
+            if policy == "retry_then_org_default":
+                try:
+                    return await _attempt(db, primary, request, purpose=purpose, actor_id=actor_id)
+                except LlmError as retry_exc:
+                    retry_trigger = _fallback_trigger(retry_exc)
+                    if retry_trigger is None:
+                        raise
+                    # Carry the retry's trigger forward to the fallback step.
+                    exc, trigger = retry_exc, retry_trigger
+
+            # Attempt 3: org-default fallback (one bounded attempt).
+            fallback = _resolve_org_default(db)
+            if fallback is None or fallback.id == primary.id:
+                # No distinct org default to fall back to — surface the original.
+                raise
+
+            # The fallback connector may itself be capped — refuse rather than
+            # silently spending another DJ's budget (issue #339).
+            _enforce_monthly_cap(db, fallback)
+
+            logger.info(
+                "llm fallback: primary connector %s failed (%s); "
+                "falling back to org-default connector %s",
+                primary.id,
+                trigger,
+                fallback.id,
+            )
+            # Record the fallback before attempting it, referencing the fallback
+            # connector + the trigger. Reuses the existing audit-write path.
+            audit_event(
+                db,
+                actor_user_id=actor_id,
+                target_connector_id=fallback.id,
+                event_type=f"{AUDIT_FALLBACK_TRIGGERED}:{trigger}",
+            )
+            db.commit()
+            # A failure here surfaces the fallback's own error (no further retry).
+            return await _attempt(db, fallback, request, purpose=purpose, actor_id=actor_id)
+
+    @staticmethod
+    async def stream(
+        db: Session,
+        actor: User | None,
+        request: ChatRequest,
+        *,
+        purpose: str,
+    ) -> AsyncIterator[ChatResponseChunk]:
+        """Stream a chat response, mirroring ``dispatch`` resolution + logging.
+
+        Connector resolution is identical to ``dispatch`` (per-feature pin → per-DJ
+        default → MRU → org default). Logging differs only in timing: a single counts-only
+        ``llm_call_log`` row is written when the stream finishes (success),
+        errors, or is cancelled by the consumer. Consumer cancellation (e.g. an
+        SSE client disconnect closing the generator) raises ``GeneratorExit``
+        into ``_attempt_stream``, whose ``finally`` writes the log and lets the
+        adapter's own ``async with`` cleanup close the upstream connection.
 
-    settings = get_settings()
-    # Phase 0: single-provider delegation. Both hints resolve to the
-    # configured model; the gateway epic differentiates fast/strong tiers.
-    return settings.anthropic_model
+        Auto-fallback (``ChatRequest.fallback_policy``) is intentionally NOT
+        applied to streaming: chunks have already been delivered to the consumer
+        by the time a mid-stream error surfaces, so transparently restarting on
+        another connector would corrupt the output. Streaming always fails fast.
+        """
+        primary = _resolve_connector(db, actor, purpose=purpose)
+        actor_id = actor.id if actor else _system_actor_id(db, primary)
+        inner = _attempt_stream(db, primary, request, purpose=purpose, actor_id=actor_id)
+        try:
+            async for chunk in inner:
+                yield chunk
+        finally:
+            # Closing the outer generator (e.g. SSE client disconnect) must
+            # synchronously close the inner one so ``_attempt_stream``'s finally
+            # fires now — writing the call log + closing the upstream connection —
+            # rather than waiting for garbage collection.
+            await inner.aclose()
 
 
-async def _raw_provider_call(
+async def _attempt(
+    db: Session,
+    connector: LlmConnector,
+    request: ChatRequest,
     *,
-    model: str,
-    system: str,
-    tools: list[dict[str, Any]],
-    tool_choice: dict[str, Any] | None,
-    messages: list[dict[str, Any]],
-    max_tokens: int,
-) -> Any:
-    """Isolated provider call. Delegates to the existing recommendation client.
-
-    The provider SDK import lives ONLY in services/recommendation/llm_client.py.
-    This module never imports a provider SDK (enforced by test).
+    purpose: str,
+    actor_id: int,
+) -> ChatResponse:
+    """Run a single adapter call against ``connector``, logging the outcome.
+
+    Raises the same typed exceptions the adapter raises after logging the call
+    (and, for auth failures, marking the connector + writing an audit event).
     """
-    from app.services.recommendation import llm_client
-
-    return await llm_client.raw_messages_create(
-        model=model,
-        system=system,
-        tools=tools,
-        tool_choice=tool_choice,
-        messages=messages,
-        max_tokens=max_tokens,
+    adapter_cls = get_adapter_class(connector.connector_type)
+    adapter = adapter_cls(connector)
+
+    started = monotonic()
+    try:
+        response = await adapter.chat(request)
+    except AuthInvalid:
+        connector.status = STATUS_AUTH_INVALID
+        connector.last_error = "auth_invalid"
+        db.commit()
+        log_call(
+            db,
+            connector_id=connector.id,
+            purpose=purpose,
+            status="auth_invalid",
+            latency_ms=int((monotonic() - started) * 1000),
+            error_code="401",
+        )
+        audit_event(
+            db,
+            actor_user_id=actor_id,
+            target_connector_id=connector.id,
+            event_type=AUDIT_AUTH_INVALID_OBSERVED,
+        )
+        db.commit()
+        raise
+    except RateLimited as exc:
+        log_call(
+            db,
+            connector_id=connector.id,
+            purpose=purpose,
+            status="rate_limited",
+            latency_ms=int((monotonic() - started) * 1000),
+            error_code=str(exc.retry_after_seconds or ""),
+        )
+        db.commit()
+        raise
+    except QuotaExceeded:
+        log_call(
+            db,
+            connector_id=connector.id,
+            purpose=purpose,
+            status="quota_exceeded",
+            latency_ms=int((monotonic() - started) * 1000),
+            error_code="402",
+        )
+        db.commit()
+        raise
+    except ProviderUnavailable as exc:
+        log_call(
+            db,
+            connector_id=connector.id,
+            purpose=purpose,
+            status="provider_unavailable",
+            latency_ms=int((monotonic() - started) * 1000),
+            error_code=type(exc).__name__,
+        )
+        db.commit()
+        raise
+    except ToolTranslationError:
+        log_call(
+            db,
+            connector_id=connector.id,
+            purpose=purpose,
+            status="tool_translation_error",
+            latency_ms=int((monotonic() - started) * 1000),
+            error_code="translation",
+        )
+        db.commit()
+        raise
+    except LlmError:
+        log_call(
+            db,
+            connector_id=connector.id,
+            purpose=purpose,
+            status="error",
+            latency_ms=int((monotonic() - started) * 1000),
+            error_code="llm_error",
+        )
+        db.commit()
+        raise
+
+    # success path
+    connector.last_used_at = utcnow()
+    connector.last_error = None
+    latency_ms = int((monotonic() - started) * 1000)
+    tokens_in = response.usage.prompt if response.usage else None
+    tokens_out = response.usage.completion if response.usage else None
+    log_call(
+        db,
+        connector_id=connector.id,
+        purpose=purpose,
+        status="ok",
+        latency_ms=latency_ms,
+        tokens_in=tokens_in,
+        tokens_out=tokens_out,
     )
+    db.commit()
+    return response
 
 
-def _normalize(response: Any) -> GatewayResponse:
-    """Translate a provider response into the normalized GatewayResponse."""
-    text = ""
-    tool_calls: list[dict[str, Any]] = []
-    for block in getattr(response, "content", []) or []:
-        btype = getattr(block, "type", None)
-        if btype == "text":
-            text += getattr(block, "text", "")
-        elif btype == "tool_use":
-            tool_calls.append(
-                {"name": getattr(block, "name", ""), "input": getattr(block, "input", {})}
+async def _attempt_stream(
+    db: Session,
+    connector: LlmConnector,
+    request: ChatRequest,
+    *,
+    purpose: str,
+    actor_id: int,
+) -> AsyncIterator[ChatResponseChunk]:
+    """Run a single adapter stream, logging exactly one outcome row.
+
+    The call log is written in a ``finally`` so it fires on success, on a typed
+    error, AND on consumer cancellation (``GeneratorExit`` raised into the
+    generator when the SSE client disconnects). The status reflects which path
+    fired; token counts come only from a terminal chunk's ``usage`` (never
+    prompt/completion content). Auth failures additionally mark the connector
+    ``auth_invalid`` and write an audit row, mirroring the non-stream ``_attempt``.
+    """
+    adapter_cls = get_adapter_class(connector.connector_type)
+    adapter = adapter_cls(connector)
+
+    started = monotonic()
+    status = "ok"
+    error_code: str | None = None
+    tokens_in: int | None = None
+    tokens_out: int | None = None
+    auth_failed = False
+
+    try:
+        async for chunk in adapter.stream(request):
+            if chunk.usage is not None:
+                tokens_in = chunk.usage.prompt
+                tokens_out = chunk.usage.completion
+            yield chunk
+    except GeneratorExit:
+        # Consumer disconnected — record as cancelled and re-raise so the
+        # adapter's own context-manager cleanup closes the upstream connection.
+        status = "cancelled"
+        error_code = "client_disconnect"
+        raise
+    except AuthInvalid:
+        status = "auth_invalid"
+        error_code = "401"
+        auth_failed = True
+        raise
+    except RateLimited as exc:
+        status = "rate_limited"
+        error_code = str(exc.retry_after_seconds or "")
+        raise
+    except QuotaExceeded:
+        status = "quota_exceeded"
+        error_code = "402"
+        raise
+    except ProviderUnavailable as exc:
+        status = "provider_unavailable"
+        error_code = type(exc).__name__
+        raise
+    except ToolTranslationError:
+        status = "tool_translation_error"
+        error_code = "translation"
+        raise
+    except LlmError:
+        status = "error"
+        error_code = "llm_error"
+        raise
+    finally:
+        latency_ms = int((monotonic() - started) * 1000)
+        if status == "ok":
+            connector.last_used_at = utcnow()
+            connector.last_error = None
+        if auth_failed:
+            connector.status = STATUS_AUTH_INVALID
+            connector.last_error = "auth_invalid"
+        log_call(
+            db,
+            connector_id=connector.id,
+            purpose=purpose,
+            status=status,
+            latency_ms=latency_ms,
+            tokens_in=tokens_in if status == "ok" else None,
+            tokens_out=tokens_out if status == "ok" else None,
+            error_code=error_code,
+        )
+        if auth_failed:
+            audit_event(
+                db,
+                actor_user_id=actor_id,
+                target_connector_id=connector.id,
+                event_type=AUDIT_AUTH_INVALID_OBSERVED,
             )
-    return GatewayResponse(tool_calls=tool_calls, text=text)
+        db.commit()
 
 
-async def dispatch(
-    *,
-    messages: list[dict[str, Any]],
-    tool: dict[str, Any] | None = None,
-    system: str = "",
-    model_hint: ModelHint = "fast",
-    max_tokens: int = 2048,
-) -> GatewayResponse:
-    """Dispatch a single LLM turn and return a normalized response.
-
-    Args:
-        messages: provider-agnostic message list ([{"role", "content"}]).
-        tool: a single JSONSchema tool spec ({"name", "input_schema"});
-            when provided, the gateway forces tool use.
-        system: optional system prompt.
-        model_hint: "fast" (batch/chat) or "strong" (critique/grading).
-        max_tokens: response token cap.
-
-    Returns:
-        GatewayResponse with ``tool_calls`` and ``text``.
+def _resolve_connector(db: Session, actor: User | None, *, purpose: str) -> LlmConnector:
+    if actor is not None:
+        # 0. Per-feature pin (issue #337) takes precedence over the per-DJ
+        #    default and MRU. Skipped gracefully when the pinned connector was
+        #    deleted (FK row gone) or is no longer active, so a stale/broken
+        #    pin never silently breaks the DJ — resolution falls through to the
+        #    per-DJ default / MRU / org-default chain below.
+        pref = get_feature_preference(db, user_id=actor.id, feature=purpose)
+        if pref is not None:
+            pinned_feature = db.get(LlmConnector, pref.connector_id)
+            if (
+                pinned_feature is not None
+                and pinned_feature.user_id == actor.id
+                and pinned_feature.status == STATUS_ACTIVE
+            ):
+                return pinned_feature
+
+        # Per-DJ explicit default takes precedence over MRU (issue #336).
+        # Falls through to MRU if the DJ hasn't pinned a default or the pinned
+        # connector is no longer active (so DJs aren't silently broken when
+        # their default's status flips to ``auth_invalid`` / ``disabled``).
+        pinned = (
+            db.query(LlmConnector)
+            .filter(
+                LlmConnector.user_id == actor.id,
+                LlmConnector.status == STATUS_ACTIVE,
+                LlmConnector.is_default == True,  # noqa: E712 (SQLAlchemy comparison)
+            )
+            .first()
+        )
+        if pinned is not None:
+            return pinned
+
+        row = (
+            db.query(LlmConnector)
+            .filter(
+                LlmConnector.user_id == actor.id,
+                LlmConnector.status == STATUS_ACTIVE,
+            )
+            .order_by(nulls_last(desc(LlmConnector.last_used_at)), desc(LlmConnector.id))
+            .first()
+        )
+        if row is not None:
+            return row
+
+    default = _resolve_org_default(db)
+    if default is not None:
+        return default
+
+    raise NoLlmConfigured("No active LLM connector for this DJ and no system default configured")
+
+
+def _resolve_org_default(db: Session) -> LlmConnector | None:
+    """Return the active org-default connector, or ``None`` if unset/inactive."""
+    settings = db.query(SystemSettings).first()
+    if settings and settings.llm_default_connector_id:
+        default = db.get(LlmConnector, settings.llm_default_connector_id)
+        if default is not None and default.status == STATUS_ACTIVE:
+            return default
+    return None
+
+
+def _system_actor_id(db: Session, connector: LlmConnector) -> int:
+    """Best-effort actor id for system-context audit rows.
+
+    When the gateway is called with ``actor=None`` (system context), audit
+    events should still record an actor; fall back to the connector's owner so
+    the trail is traceable.
     """
-    model = _resolve_model(model_hint)
-    tools = [tool] if tool else []
-    tool_choice = {"type": "tool", "name": tool["name"]} if tool else None
-    response = await _raw_provider_call(
-        model=model,
-        system=system,
-        tools=tools,
-        tool_choice=tool_choice,
-        messages=messages,
-        max_tokens=max_tokens,
-    )
-    return _normalize(response)
+    return connector.user_id
diff --git a/server/app/services/llm/health_check.py b/server/app/services/llm/health_check.py
new file mode 100644
index 00000000..b4d5eda7
--- /dev/null
+++ b/server/app/services/llm/health_check.py
@@ -0,0 +1,173 @@
+"""Shared connector health-check helper.
+
+Used by:
+- ``POST /api/llm/connectors/{id}/test`` (DJ-triggered manual test)
+- ``connector_health_monitor`` background task (issue #340)
+
+Every invocation:
+1. Stamps ``last_health_check_at = utcnow()`` and the outcome on
+   ``last_health_check_status`` (see :data:`HEALTH_CHECK_*` constants).
+2. On auth failure, flips ``status`` to ``auth_invalid`` and writes a
+   ``connector_health_check_failed`` audit row alongside the existing
+   ``connector_health_check`` audit row.
+3. Never raises — always returns the outcome. The caller decides whether to
+   surface the error.
+
+The helper does NOT commit. The caller owns the transaction so it can roll
+back or combine with other writes (e.g. the background loop commits in a
+single transaction per connector).
+"""
+
+from __future__ import annotations
+
+import logging
+from dataclasses import dataclass
+
+from sqlalchemy.orm import Session
+
+from app.core.time import utcnow
+from app.models.llm_connector import (
+    AUDIT_AUTH_INVALID_OBSERVED,
+    AUDIT_HEALTH_CHECK,
+    AUDIT_HEALTH_CHECK_FAILED,
+    HEALTH_CHECK_AUTH_INVALID,
+    HEALTH_CHECK_ERROR,
+    HEALTH_CHECK_OK,
+    HEALTH_CHECK_PROVIDER_UNAVAILABLE,
+    HEALTH_CHECK_QUOTA_EXCEEDED,
+    HEALTH_CHECK_RATE_LIMITED,
+    STATUS_ACTIVE,
+    STATUS_AUTH_INVALID,
+    STATUS_DISABLED,
+    LlmConnector,
+)
+from app.services.llm.connector_storage import audit_event
+from app.services.llm.exceptions import (
+    AuthInvalid,
+    ProviderUnavailable,
+    QuotaExceeded,
+    RateLimited,
+)
+from app.services.llm.registry import get_adapter_class
+
+logger = logging.getLogger(__name__)
+
+
+@dataclass(frozen=True)
+class HealthCheckOutcome:
+    """Result of a single connector health-check invocation."""
+
+    ok: bool
+    status: str
+    """One of the HEALTH_CHECK_* constants."""
+    error_code: str | None = None
+    """Sanitised provider-class label; never includes a credential or upstream body."""
+    status_flipped_to_auth_invalid: bool = False
+    """True iff this call flipped the connector from ``active`` to ``auth_invalid``.
+
+    The background monitor uses this to decide whether to notify the DJ —
+    sending a notification on every periodic check would be noisy when the
+    connector was already broken on the prior pass.
+    """
+
+
+async def run_health_check(
+    db: Session,
+    connector: LlmConnector,
+    *,
+    actor_user_id: int,
+) -> HealthCheckOutcome:
+    """Run ``adapter.health_check()`` against ``connector`` and record the outcome.
+
+    Writes (caller commits):
+    - ``connector.last_health_check_at`` (always)
+    - ``connector.last_health_check_status`` (always)
+    - One ``llm_audit_event`` row of type ``connector_health_check`` (always)
+    - If auth failed: flips ``connector.status`` to ``auth_invalid`` (unless
+      already disabled), sets ``last_error``, and writes a second audit row
+      of type ``auth_invalid_observed``.
+    - If the auth failure was a transition (was active, now auth_invalid),
+      writes a third ``connector_health_check_failed`` audit row so admins can
+      filter on "the moment this connector broke".
+
+    Never raises.
+    """
+    # Always write the AUDIT_HEALTH_CHECK row before the call so we have a
+    # record even if the worker crashes mid-flight.
+    audit_event(
+        db,
+        actor_user_id=actor_user_id,
+        target_connector_id=connector.id,
+        event_type=AUDIT_HEALTH_CHECK,
+    )
+
+    adapter_cls = get_adapter_class(connector.connector_type)
+    adapter = adapter_cls(connector)
+
+    now = utcnow()
+    connector.last_health_check_at = now
+
+    was_active = connector.status == STATUS_ACTIVE
+
+    try:
+        await adapter.health_check()
+    except AuthInvalid:
+        connector.last_health_check_status = HEALTH_CHECK_AUTH_INVALID
+        flipped = False
+        if connector.status != STATUS_DISABLED:
+            if was_active:
+                flipped = True
+            connector.status = STATUS_AUTH_INVALID
+            connector.last_error = "auth_invalid"
+        audit_event(
+            db,
+            actor_user_id=actor_user_id,
+            target_connector_id=connector.id,
+            event_type=AUDIT_AUTH_INVALID_OBSERVED,
+        )
+        if flipped:
+            # Distinct event so admins can filter "monitor caught a break"
+            # separately from the "every check fires AUDIT_HEALTH_CHECK" noise.
+            audit_event(
+                db,
+                actor_user_id=actor_user_id,
+                target_connector_id=connector.id,
+                event_type=AUDIT_HEALTH_CHECK_FAILED,
+            )
+        return HealthCheckOutcome(
+            ok=False,
+            status=HEALTH_CHECK_AUTH_INVALID,
+            error_code="auth_invalid",
+            status_flipped_to_auth_invalid=flipped,
+        )
+    except RateLimited:
+        # Transient — don't flip status. Record the outcome and move on.
+        connector.last_health_check_status = HEALTH_CHECK_RATE_LIMITED
+        return HealthCheckOutcome(
+            ok=False, status=HEALTH_CHECK_RATE_LIMITED, error_code="rate_limited"
+        )
+    except QuotaExceeded:
+        connector.last_health_check_status = HEALTH_CHECK_QUOTA_EXCEEDED
+        return HealthCheckOutcome(
+            ok=False, status=HEALTH_CHECK_QUOTA_EXCEEDED, error_code="quota_exceeded"
+        )
+    except ProviderUnavailable:
+        connector.last_health_check_status = HEALTH_CHECK_PROVIDER_UNAVAILABLE
+        return HealthCheckOutcome(
+            ok=False,
+            status=HEALTH_CHECK_PROVIDER_UNAVAILABLE,
+            error_code="provider_unavailable",
+        )
+    except Exception:  # noqa: BLE001 — adapter contract is broad; sanitised below
+        # Don't leak the upstream exception text — it may include API keys.
+        logger.exception("Connector health check failed unexpectedly")
+        connector.last_health_check_status = HEALTH_CHECK_ERROR
+        return HealthCheckOutcome(ok=False, status=HEALTH_CHECK_ERROR, error_code="unknown")
+
+    # Success path
+    connector.last_health_check_status = HEALTH_CHECK_OK
+    connector.last_error = None
+    # Clear auth_invalid on a successful check (mirrors test_connector behavior).
+    if connector.status == STATUS_AUTH_INVALID:
+        connector.status = STATUS_ACTIVE
+    return HealthCheckOutcome(ok=True, status=HEALTH_CHECK_OK)
diff --git a/server/app/services/llm/health_monitor.py b/server/app/services/llm/health_monitor.py
new file mode 100644
index 00000000..b802ae7d
--- /dev/null
+++ b/server/app/services/llm/health_monitor.py
@@ -0,0 +1,261 @@
+"""Background connector health monitor (issue #340).
+
+Scheduled task that periodically runs ``health_check`` on every
+``status="active"`` connector to catch expired / revoked credentials before
+a DJ tries to use one mid-event.
+
+Design:
+- Loop wakes every ``HEALTH_MONITOR_SCAN_INTERVAL_SECONDS`` (5 min).
+- For each active connector whose ``last_health_check_at`` is older than
+  ``effective_interval_seconds(connector)`` ago, run a check.
+- Per-connector jitter (±30%) staggers checks so a fleet of N connectors
+  doesn't all hit one provider at once (avoid a thundering-herd 429).
+- Sequential within a pass: one connector at a time, with a small sleep
+  between calls, so we respect per-provider rate limits even when all DJs
+  share a single upstream account.
+- On a transition active → auth_invalid, notify the DJ:
+    1. Email via Resend if configured AND the user has an email.
+    2. Otherwise, log a warning.
+  The flipped status itself is the in-app banner (the DJ's /settings/ai page
+  surfaces ``status`` per connector, and the recommendation engine raises
+  ``NoLlmConfigured`` when no active connector exists).
+"""
+
+from __future__ import annotations
+
+import asyncio
+import contextlib
+import hashlib
+import logging
+import os
+
+from sqlalchemy.orm import Session
+
+from app.core.time import utcnow
+from app.models.llm_connector import STATUS_ACTIVE, LlmConnector
+from app.models.user import User
+from app.services.llm.health_check import HealthCheckOutcome, run_health_check
+
+logger = logging.getLogger(__name__)
+
+# Default check interval in hours; overridable via env var
+# ``LLM_HEALTH_CHECK_INTERVAL_HOURS``. Six hours = four checks per day, which
+# is well under any provider's per-key rate limit but still catches breakage
+# inside a single working day.
+_DEFAULT_INTERVAL_HOURS = 6
+_HEALTH_CHECK_INTERVAL_HOURS_ENV = "LLM_HEALTH_CHECK_INTERVAL_HOURS"
+
+# How often the loop wakes to look for due connectors. Shorter than the
+# interval so jitter is smooth; the cost is one tiny SELECT per scan.
+HEALTH_MONITOR_SCAN_INTERVAL_SECONDS = 300
+
+# Sleep between consecutive health-check calls within a single scan pass.
+# Spreads load across the upstream providers and limits the per-DJ impact of
+# the monitor when many connectors are due at once.
+_PER_CHECK_SLEEP_SECONDS = 1.0
+
+
+def _get_interval_seconds() -> int:
+    """Read the configured interval from the env, clamped to safe bounds.
+
+    A non-positive or absurdly large value falls back to the default so a
+    misconfigured ``.env`` can never disable the monitor or DoS providers.
+    """
+    raw = os.environ.get(_HEALTH_CHECK_INTERVAL_HOURS_ENV)
+    if not raw:
+        hours = _DEFAULT_INTERVAL_HOURS
+    else:
+        try:
+            hours = int(raw)
+        except ValueError:
+            logger.warning(
+                "Invalid %s=%r; falling back to %s",
+                _HEALTH_CHECK_INTERVAL_HOURS_ENV,
+                raw,
+                _DEFAULT_INTERVAL_HOURS,
+            )
+            hours = _DEFAULT_INTERVAL_HOURS
+    # Floor: 1 hour (faster = wastes upstream rate limit).
+    # Ceiling: 168 hours / 7 days (slower = defeats the purpose).
+    hours = max(1, min(168, hours))
+    return hours * 3600
+
+
+def _jitter_factor(connector_id: int) -> float:
+    """Per-connector deterministic jitter in [0.7, 1.3].
+
+    Deterministic-by-id so successive scans don't reshuffle the schedule on
+    every wake (which would mean some connectors get hit far more often than
+    intended). The hash spreads connectors uniformly across the 30% band.
+    """
+    # SHA-256 is overkill cryptographically, but it's already in the stdlib
+    # and gives a clean uniform distribution. The first 4 bytes are plenty.
+    h = hashlib.sha256(str(connector_id).encode("ascii")).digest()
+    n = int.from_bytes(h[:4], "big")
+    # Map [0, 2**32) → [0, 1)
+    frac = n / float(1 << 32)
+    # Map [0, 1) → [0.7, 1.3)
+    return 0.7 + (frac * 0.6)
+
+
+def effective_interval_seconds(connector: LlmConnector) -> int:
+    """Effective check interval for ``connector`` (base × per-connector jitter)."""
+    return int(_get_interval_seconds() * _jitter_factor(connector.id))
+
+
+def _is_due(connector: LlmConnector) -> bool:
+    """True iff ``connector`` is overdue for a periodic health check."""
+    if connector.last_health_check_at is None:
+        return True
+    elapsed = (utcnow() - connector.last_health_check_at).total_seconds()
+    return elapsed >= effective_interval_seconds(connector)
+
+
+def _select_due_connectors(db: Session) -> list[LlmConnector]:
+    """Return active connectors whose last check is older than their effective interval.
+
+    Filtering ``status == STATUS_ACTIVE`` cheaply in SQL avoids reading
+    disabled rows. The per-row jitter calculation is done in Python because
+    SQLite (used in tests) lacks a stable hash function.
+    """
+    active = (
+        db.query(LlmConnector)
+        .filter(LlmConnector.status == STATUS_ACTIVE)
+        .order_by(LlmConnector.last_health_check_at.asc().nulls_first())
+        .all()
+    )
+    return [c for c in active if _is_due(c)]
+
+
+def _notify_dj_auth_invalid(db: Session, connector: LlmConnector) -> None:
+    """Best-effort email notification when the monitor flips a connector to auth_invalid.
+
+    Channels tried (in order):
+    1. Email via Resend, if the user has a non-empty ``email`` AND Resend is
+       configured (the sender raises ``EmailNotConfiguredError`` otherwise).
+    2. Logs at WARNING. The connector's flipped status itself surfaces in
+       the DJ's settings UI on next login.
+
+    Never raises — notification failures must not block subsequent health
+    checks in the same pass.
+    """
+    try:
+        user = db.get(User, connector.user_id)
+    except Exception:  # noqa: BLE001 — defensive: DB hiccup must not kill the loop
+        logger.exception("health monitor: failed to load user for connector %s", connector.id)
+        user = None
+
+    if user is None or not user.email:
+        logger.warning(
+            "health monitor: connector %s (user_id=%s) flipped to auth_invalid; "
+            "no email on file — DJ will see the banner on next login.",
+            connector.id,
+            connector.user_id,
+        )
+        return
+
+    try:
+        from app.services.email_sender import (
+            EmailNotConfiguredError,
+            EmailSendError,
+            send_connector_auth_invalid_notification,
+        )
+
+        send_connector_auth_invalid_notification(
+            to_address=user.email,
+            display_name=connector.display_name,
+            connector_type=connector.connector_type,
+        )
+    except EmailNotConfiguredError:
+        logger.warning(
+            "health monitor: connector %s flipped to auth_invalid; "
+            "email not configured — DJ will see the banner on next login.",
+            connector.id,
+        )
+    except EmailSendError:
+        logger.exception(
+            "health monitor: failed to send auth_invalid email for connector %s",
+            connector.id,
+        )
+    except Exception:  # noqa: BLE001
+        logger.exception(
+            "health monitor: unexpected error notifying DJ of connector %s",
+            connector.id,
+        )
+
+
+async def _check_one(db: Session, connector: LlmConnector) -> HealthCheckOutcome:
+    """Run a health check on ``connector``, commit, and notify if it just broke.
+
+    The audit row is written with ``actor_user_id = connector.user_id``
+    because the periodic check is *on behalf of* the DJ (vs the manual test
+    button, where the actor is whoever clicked it). This keeps the audit
+    trail attributable.
+    """
+    outcome = await run_health_check(db, connector, actor_user_id=connector.user_id)
+    db.commit()
+    if outcome.status_flipped_to_auth_invalid:
+        _notify_dj_auth_invalid(db, connector)
+    return outcome
+
+
+async def run_monitor_pass(db: Session) -> int:
+    """Run one full pass of the monitor: check every due connector.
+
+    Returns the number of connectors checked. Exposed for tests and for the
+    background loop. Sequential — see module docstring.
+    """
+    due = _select_due_connectors(db)
+    if not due:
+        return 0
+
+    checked = 0
+    for connector in due:
+        try:
+            await _check_one(db, connector)
+        except Exception:  # noqa: BLE001 — keep the loop alive
+            logger.exception("health monitor: error checking connector %s", connector.id)
+            # Defensive: rollback any half-applied state from the failed check
+            # so the next connector starts on a clean session.
+            with contextlib.suppress(Exception):
+                db.rollback()
+        checked += 1
+        if _PER_CHECK_SLEEP_SECONDS > 0 and checked < len(due):
+            await asyncio.sleep(_PER_CHECK_SLEEP_SECONDS)
+    return checked
+
+
+def _run_monitor_pass_sync() -> int:
+    """Synchronous wrapper for ``run_monitor_pass`` used by the background loop.
+
+    Each pass opens its own ``SessionLocal`` so the loop doesn't hold a
+    long-lived connection between scans. ``asyncio.run`` is fine here
+    because this function is executed in ``asyncio.to_thread`` from the
+    main event loop, not on the loop thread itself.
+    """
+    from app.db.session import SessionLocal
+
+    db = SessionLocal()
+    try:
+        return asyncio.run(run_monitor_pass(db))
+    finally:
+        db.close()
+
+
+async def health_monitor_loop() -> None:
+    """Background task — runs forever, scanning every ``HEALTH_MONITOR_SCAN_INTERVAL_SECONDS``.
+
+    Wrapped in a try/except so a single bug doesn't kill the loop; logs the
+    exception and sleeps before retrying.
+    """
+    # First sleep before first pass so startup isn't blocked by N upstream
+    # round-trips on cold boot.
+    await asyncio.sleep(HEALTH_MONITOR_SCAN_INTERVAL_SECONDS)
+    while True:
+        try:
+            checked = await asyncio.to_thread(_run_monitor_pass_sync)
+            if checked:
+                logger.info("llm health monitor pass: checked %s connectors", checked)
+        except Exception:  # noqa: BLE001 — loop must survive any error
+            logger.exception("llm health monitor loop error")
+        await asyncio.sleep(HEALTH_MONITOR_SCAN_INTERVAL_SECONDS)
diff --git a/server/app/services/llm/openrouter_models.py b/server/app/services/llm/openrouter_models.py
new file mode 100644
index 00000000..271e79b9
--- /dev/null
+++ b/server/app/services/llm/openrouter_models.py
@@ -0,0 +1,99 @@
+"""OpenRouter model catalogue fetcher with an in-memory TTL cache.
+
+OpenRouter publishes its full model catalogue at ``GET /api/v1/models`` (a
+public, unauthenticated endpoint). The DJ "AI providers" page surfaces this as
+a model-hint dropdown so DJs pick a valid namespaced model id ("provider/model")
+instead of free-typing.
+
+The catalogue changes rarely, so we cache it process-wide for one hour. The
+cache is best-effort: on any fetch failure (network, timeout, malformed body)
+we return the last good cache if present, otherwise an empty list. Callers
+treat an empty list as "dropdown unavailable, fall back to free-text input".
+
+No credentials are involved — the endpoint is public.
+"""
+
+from __future__ import annotations
+
+import logging
+import time
+
+import httpx
+
+from app.schemas.ai_settings import AIModelInfo
+
+logger = logging.getLogger(__name__)
+
+OPENROUTER_MODELS_URL = "https://openrouter.ai/api/v1/models"
+CACHE_TTL_SECONDS = 3600.0  # refresh hourly
+_FETCH_TIMEOUT_SECONDS = 10.0
+
+# Process-wide cache: (fetched_at_monotonic, models)
+_cache: tuple[float, list[AIModelInfo]] | None = None
+
+
+def _now() -> float:
+    return time.monotonic()
+
+
+def _parse_models(body: object) -> list[AIModelInfo]:
+    """Translate the OpenRouter /models payload into our AIModelInfo list.
+
+    The payload shape is ``{"data": [{"id": "provider/model", "name": "..."}]}``.
+    We defensively skip entries missing an ``id``.
+    """
+    if not isinstance(body, dict):
+        return []
+    data = body.get("data")
+    if not isinstance(data, list):
+        return []
+    out: list[AIModelInfo] = []
+    for entry in data:
+        if not isinstance(entry, dict):
+            continue
+        model_id = entry.get("id")
+        if not model_id or not isinstance(model_id, str):
+            continue
+        name = entry.get("name")
+        display = name if isinstance(name, str) and name else model_id
+        out.append(AIModelInfo(id=model_id, name=display))
+    return out
+
+
+async def get_openrouter_models(*, force_refresh: bool = False) -> list[AIModelInfo]:
+    """Return the OpenRouter model catalogue, served from cache when fresh.
+
+    On fetch failure, returns the last good cache (even if stale) or an empty
+    list. Never raises — the dropdown is a convenience, not a hard dependency.
+    """
+    global _cache
+
+    if not force_refresh and _cache is not None:
+        fetched_at, models = _cache
+        if _now() - fetched_at < CACHE_TTL_SECONDS:
+            return models
+
+    try:
+        async with httpx.AsyncClient(timeout=_FETCH_TIMEOUT_SECONDS) as client:
+            resp = await client.get(OPENROUTER_MODELS_URL)
+        resp.raise_for_status()
+        body = resp.json()
+    except Exception:  # noqa: BLE001 — best-effort, fall back to stale/empty
+        logger.warning("Failed to fetch OpenRouter model catalogue")
+        if _cache is not None:
+            return _cache[1]
+        return []
+
+    models = _parse_models(body)
+    if models:
+        _cache = (_now(), models)
+    elif _cache is not None:
+        # Empty parse but we had a prior good list — keep serving it.
+        return _cache[1]
+    return models
+
+
+def _reset_cache_for_tests() -> None:
+    """Clear the module cache. Test-only helper."""
+    global _cache
+    _cache = None
diff --git a/server/app/services/llm/plugin_loader.py b/server/app/services/llm/plugin_loader.py
new file mode 100644
index 00000000..edaacd83
--- /dev/null
+++ b/server/app/services/llm/plugin_loader.py
@@ -0,0 +1,122 @@
+"""Optional filesystem loader for third-party LLM adapter plug-ins.
+
+When the ``LLM_PLUGIN_DIR`` environment variable is set to a directory path,
+:func:`load_plugins_from_env` imports every ``.py`` file (non-recursive,
+excluding files whose names start with ``_``) from that directory at startup.
+
+Each imported plug-in is responsible for calling
+:func:`app.services.llm.registry.register_adapter` at module load time — same
+contract the built-in adapters use. The loader simply triggers the import; it
+performs no monkey-patching, manifest parsing, or sandbox.
+
+Security posture
+----------------
+Loading a plug-in is equivalent to giving the loaded code the full privileges
+of the backend process — same as installing a Python package. There is no
+sandbox. Operators must therefore:
+
+- Treat ``LLM_PLUGIN_DIR`` as a privileged path. Only the same user that owns
+  ``server/`` and its venv should have write access to it.
+- Audit each plug-in's source the same way they would audit a third-party
+  ``pip install``. The skeleton at ``docs/examples/echo_adapter.py`` is
+  reviewed; everything else must be reviewed by whoever sets up the
+  environment.
+- Never set ``LLM_PLUGIN_DIR`` to a world-writable or shared-tenancy path.
+
+In production we recommend leaving ``LLM_PLUGIN_DIR`` unset and packaging
+trusted plug-ins as ordinary Python modules imported from a controlled
+location. The env-var loader exists to make local experimentation and forks
+ergonomic.
+"""
+
+from __future__ import annotations
+
+import importlib.util
+import logging
+import os
+import sys
+import traceback
+from pathlib import Path
+
+logger = logging.getLogger(__name__)
+
+ENV_VAR = "LLM_PLUGIN_DIR"
+
+
+def load_plugins_from_env() -> list[str]:
+    """Load adapters from the directory named by ``LLM_PLUGIN_DIR``.
+
+    Returns the list of module names that were successfully imported (their
+    side-effectful ``register_adapter`` calls will have run by then).
+
+    The loader is intentionally permissive: a single broken plug-in must not
+    prevent the rest of the directory — or the backend process itself — from
+    starting. Each import error is logged with a full stack trace and the
+    plug-in name, then skipped.
+    """
+    dir_path = os.environ.get(ENV_VAR)
+    if not dir_path:
+        return []
+    return load_plugins_from_dir(dir_path)
+
+
+def load_plugins_from_dir(dir_path: str | os.PathLike[str]) -> list[str]:
+    """Same as :func:`load_plugins_from_env` but with an explicit path."""
+    root = Path(dir_path)
+    if not root.is_dir():
+        logger.warning(
+            "%s=%s does not exist or is not a directory; skipping plug-in load",
+            ENV_VAR,
+            dir_path,
+        )
+        return []
+
+    loaded: list[str] = []
+    # Sort for stable load order — useful when one plug-in depends on another
+    # being registered first (the registry rejects double-registration so the
+    # *first* import of any given connector_type wins).
+    for entry in sorted(root.iterdir()):
+        if not _is_loadable(entry):
+            continue
+        # Synthesise a stable, namespaced module name to avoid colliding with
+        # any installed package. We deliberately do NOT add the plug-in dir to
+        # ``sys.path`` — that would also expose every other file in the dir as
+        # an importable module from elsewhere in the codebase.
+        module_name = f"llm_plugins.{entry.stem}"
+        try:
+            spec = importlib.util.spec_from_file_location(module_name, entry)
+            if spec is None or spec.loader is None:
+                logger.warning("Could not build import spec for plug-in %s", entry)
+                continue
+            module = importlib.util.module_from_spec(spec)
+            sys.modules[module_name] = module
+            spec.loader.exec_module(module)
+        except Exception:
+            # ``traceback.format_exc()`` is logged so operators can debug
+            # plug-in import errors without crashing the backend. We pop the
+            # half-imported module out of ``sys.modules`` so a later retry
+            # (e.g. uvicorn --reload) re-runs the spec from scratch.
+            sys.modules.pop(module_name, None)
+            logger.error(
+                "Failed to load LLM plug-in %s (module=%s):\n%s",
+                entry.name,
+                module_name,
+                traceback.format_exc(),
+            )
+            continue
+        logger.info("Loaded LLM plug-in %s (module=%s)", entry.name, module_name)
+        loaded.append(module_name)
+    return loaded
+
+
+def _is_loadable(entry: Path) -> bool:
+    """Filter the directory listing to plain ``*.py`` source files."""
+    if not entry.is_file():
+        return False
+    if entry.suffix != ".py":
+        return False
+    if entry.name.startswith("_"):
+        # Skip ``__init__.py`` and any conventional "private" leading-underscore
+        # helpers — they are usually shared utilities, not plug-ins.
+        return False
+    return True
diff --git a/server/app/services/llm/registry.py b/server/app/services/llm/registry.py
new file mode 100644
index 00000000..ae4bc020
--- /dev/null
+++ b/server/app/services/llm/registry.py
@@ -0,0 +1,78 @@
+"""Adapter registry — maps connector_type strings to adapter classes.
+
+Importing the adapters package via ``from app.services.llm.adapters import *``
+auto-registers each adapter via ``register_adapter``.
+"""
+
+from __future__ import annotations
+
+from app.services.llm.base import LlmAdapter
+
+_REGISTRY: dict[str, type[LlmAdapter]] = {}
+
+
+def register_adapter(connector_type: str, cls: type[LlmAdapter]) -> None:
+    """Register an adapter class for a connector_type.
+
+    Re-registering the *same* class is a no-op (safe for re-imports during
+    tests). Registering a *different* class for an already-bound
+    ``connector_type`` raises :class:`ValueError` — silently overwriting
+    adapters would make behavior depend on import order and hide collisions.
+    """
+    if not connector_type:
+        raise ValueError("connector_type must be non-empty")
+    if not issubclass(cls, LlmAdapter):
+        raise TypeError("Adapter must subclass LlmAdapter")
+    existing = _REGISTRY.get(connector_type)
+    if existing is not None and existing is not cls:
+        raise ValueError(
+            f"connector_type {connector_type!r} already registered by "
+            f"{existing.__name__}; refusing to overwrite with {cls.__name__}"
+        )
+    _REGISTRY[connector_type] = cls
+
+
+def get_adapter_class(connector_type: str) -> type[LlmAdapter]:
+    """Return the adapter class for a connector_type or raise KeyError."""
+    if connector_type not in _REGISTRY:
+        raise KeyError(f"No adapter registered for connector_type={connector_type!r}")
+    return _REGISTRY[connector_type]
+
+
+def list_connector_types() -> list[str]:
+    """Return all registered connector_type names (sorted, stable order)."""
+    return sorted(_REGISTRY.keys())
+
+
+def is_registered(connector_type: str) -> bool:
+    """Cheap membership check, used by callers that wish to soft-validate."""
+    return connector_type in _REGISTRY
+
+
+# Eagerly import adapters to populate the registry. This avoids callers needing
+# to remember an explicit "register" step.
+def _bootstrap() -> None:
+    # Local imports keep the registry module dependency-free at import time.
+    from app.services.llm.adapters import (  # noqa: F401
+        anthropic_apikey,
+        azure_openai,
+        bedrock,
+        gemini_apikey,
+        openai_apikey,
+        openai_compatible,
+        openrouter_apikey,
+        xai_apikey,
+    )
+
+    # Optional third-party plug-in load: if LLM_PLUGIN_DIR is set, import every
+    # .py file in that directory. Built-in adapters are loaded first so a
+    # plug-in can never shadow a built-in (the registry refuses
+    # double-registration, surfacing a clear startup error instead of silently
+    # overriding the production adapter). Plug-in load failures are logged but
+    # never crash the backend — see app.services.llm.plugin_loader.
+    from app.services.llm.plugin_loader import load_plugins_from_env
+
+    load_plugins_from_env()
+
+
+_bootstrap()
diff --git a/server/app/services/llm/sigv4.py b/server/app/services/llm/sigv4.py
new file mode 100644
index 00000000..d6be38d5
--- /dev/null
+++ b/server/app/services/llm/sigv4.py
@@ -0,0 +1,141 @@
+"""Minimal AWS Signature Version 4 (SigV4) signing — dependency-free.
+
+We deliberately avoid ``boto3``/``botocore`` (per the CLAUDE.md CVE/dependency
+rule) and implement just enough of SigV4 to sign a single ``POST`` request to
+the Bedrock runtime ``InvokeModel`` endpoint over the existing ``httpx`` client.
+
+Reference: https://docs.aws.amazon.com/general/latest/gr/sigv4-create-canonical-request.html
+
+This module is pure stdlib (``hashlib`` / ``hmac`` / ``datetime`` / ``urllib``)
+so it adds no new third-party surface area. It only signs the request shape the
+Bedrock adapter produces — it is not a general-purpose AWS signer.
+"""
+
+from __future__ import annotations
+
+import hashlib
+import hmac
+from datetime import datetime
+from urllib.parse import quote
+
+_ALGORITHM = "AWS4-HMAC-SHA256"
+_SERVICE = "bedrock"
+
+
+def _sha256_hex(data: bytes) -> str:
+    return hashlib.sha256(data).hexdigest()
+
+
+def _hmac_sha256(key: bytes, msg: str) -> bytes:
+    return hmac.new(key, msg.encode("utf-8"), hashlib.sha256).digest()
+
+
+def _signing_key(secret_key: str, date_stamp: str, region: str, service: str) -> bytes:
+    """Derive the SigV4 signing key (the chained-HMAC ``kSigning``)."""
+    k_date = _hmac_sha256(("AWS4" + secret_key).encode("utf-8"), date_stamp)
+    k_region = _hmac_sha256(k_date, region)
+    k_service = _hmac_sha256(k_region, service)
+    return _hmac_sha256(k_service, "aws4_request")
+
+
+def sign_request(
+    *,
+    access_key_id: str,
+    secret_access_key: str,
+    region: str,
+    host: str,
+    canonical_uri: str,
+    body: bytes,
+    now: datetime,
+    service: str = _SERVICE,
+    content_type: str = "application/json",
+    session_token: str | None = None,
+) -> dict[str, str]:
+    """Return the headers required to authenticate a signed ``POST`` request.
+
+    ``canonical_uri`` is the request path (already percent-encoded as needed,
+    e.g. ``/model/anthropic.claude-3-5-sonnet-20241022-v2:0/invoke``). The
+    caller supplies the request ``body`` bytes; we hash and sign them.
+
+    The returned dict includes ``Authorization``, ``X-Amz-Date``,
+    ``X-Amz-Content-Sha256`` (and ``X-Amz-Security-Token`` when a session token
+    is provided). Callers merge these with ``Content-Type``/``Accept``.
+    """
+    amz_date = now.strftime("%Y%m%dT%H%M%SZ")
+    date_stamp = now.strftime("%Y%m%d")
+
+    payload_hash = _sha256_hex(body)
+
+    # --- Canonical request -------------------------------------------------
+    # Headers must be sorted by lowercased name and trimmed. We sign the
+    # minimal set: host, content-type, x-amz-content-sha256, x-amz-date
+    # (+ x-amz-security-token when present).
+    canonical_headers_map = {
+        "content-type": content_type,
+        "host": host,
+        "x-amz-content-sha256": payload_hash,
+        "x-amz-date": amz_date,
+    }
+    if session_token:
+        canonical_headers_map["x-amz-security-token"] = session_token
+
+    signed_headers = ";".join(sorted(canonical_headers_map))
+    canonical_headers = "".join(
+        f"{name}:{canonical_headers_map[name]}\n" for name in sorted(canonical_headers_map)
+    )
+
+    canonical_request = "\n".join(
+        [
+            "POST",
+            _canonicalize_uri(canonical_uri),
+            "",  # no query string
+            canonical_headers,
+            signed_headers,
+            payload_hash,
+        ]
+    )
+
+    # --- String to sign ----------------------------------------------------
+    credential_scope = f"{date_stamp}/{region}/{service}/aws4_request"
+    string_to_sign = "\n".join(
+        [
+            _ALGORITHM,
+            amz_date,
+            credential_scope,
+            _sha256_hex(canonical_request.encode("utf-8")),
+        ]
+    )
+
+    # --- Signature ---------------------------------------------------------
+    signing_key = _signing_key(secret_access_key, date_stamp, region, service)
+    signature = hmac.new(signing_key, string_to_sign.encode("utf-8"), hashlib.sha256).hexdigest()
+
+    authorization = (
+        f"{_ALGORITHM} "
+        f"Credential={access_key_id}/{credential_scope}, "
+        f"SignedHeaders={signed_headers}, "
+        f"Signature={signature}"
+    )
+
+    headers = {
+        "Authorization": authorization,
+        "X-Amz-Date": amz_date,
+        "X-Amz-Content-Sha256": payload_hash,
+    }
+    if session_token:
+        headers["X-Amz-Security-Token"] = session_token
+    return headers
+
+
+def _canonicalize_uri(path: str) -> str:
+    """Percent-encode each path segment per SigV4 rules (keeps ``/`` separators).
+
+    Bedrock model ids contain characters like ``:`` (e.g. ``...-v2:0``) which
+    must be encoded in the canonical URI even though they are valid in the URL.
+    """
+    if not path:
+        return "/"
+    segments = path.split("/")
+    # quote() leaves unreserved chars + nothing in safe=""; encode ':' too.
+    encoded = [quote(seg, safe="") for seg in segments]
+    return "/".join(encoded)
diff --git a/server/app/services/llm/streaming.py b/server/app/services/llm/streaming.py
new file mode 100644
index 00000000..88f99c6d
--- /dev/null
+++ b/server/app/services/llm/streaming.py
@@ -0,0 +1,98 @@
+"""Shared streaming primitives for LLM adapters.
+
+Holds SSE-line parsing helpers reused by the OpenAI-wire adapters (Platform +
+custom OpenAI-compatible). The chunk / delta models themselves live in
+``base.py`` alongside ``ChatResponse``.
+"""
+
+from __future__ import annotations
+
+from typing import Literal
+
+from app.services.llm.base import ChatResponseChunk, TokenUsage, ToolCallDelta
+
+CanonicalStopReason = Literal["end_turn", "tool_use", "max_tokens", "error"]
+
+
+def _as_int(value: object, default: int = 0) -> int:
+    """Coerce an external (provider-supplied) field to ``int``, tolerantly.
+
+    Streaming payloads come straight off the wire; a non-conforming provider can
+    send ``null`` or a non-numeric value for ``index`` / token counts. We never
+    want a malformed field to raise and abort an otherwise-usable stream, so fall
+    back to ``default`` instead of letting ``int()`` raise.
+    """
+    try:
+        return int(value)  # type: ignore[arg-type]
+    except (TypeError, ValueError):
+        return default
+
+
+# OpenAI streaming finish_reason → canonical stop_reason. Mirrors the
+# non-streaming mapping in ``tool_translation._FINISH_REASON_OPENAI``; kept local
+# so this module owns no private cross-module imports. Any reason absent from the
+# table maps to "error".
+_FINISH_REASON_OPENAI: dict[str, CanonicalStopReason] = {
+    "stop": "end_turn",
+    "tool_calls": "tool_use",
+    "function_call": "tool_use",
+    "length": "max_tokens",
+}
+
+
+def parse_openai_stream_event(payload: dict) -> ChatResponseChunk | None:
+    """Translate one parsed OpenAI streaming JSON object into a chunk.
+
+    Returns ``None`` for payloads carrying no usable signal (e.g. the initial
+    role-only delta). The terminal event (``finish_reason`` set) returns a chunk
+    with ``done=True``, the mapped ``stop_reason`` and (when present) token usage.
+    """
+    choices = payload.get("choices") or []
+    choice = choices[0] if choices else {}
+    delta = choice.get("delta") or {}
+
+    text_delta = delta.get("content") or ""
+
+    tool_call_deltas: list[ToolCallDelta] = []
+    for tc in delta.get("tool_calls") or []:
+        if not isinstance(tc, dict):
+            continue
+        fn = tc.get("function") if isinstance(tc.get("function"), dict) else {}
+        tool_call_deltas.append(
+            ToolCallDelta(
+                index=_as_int(tc.get("index", 0)),
+                id=tc.get("id"),
+                name=fn.get("name"),
+                input_json_fragment=fn.get("arguments") or "",
+            )
+        )
+
+    finish_reason = choice.get("finish_reason")
+    done = finish_reason is not None
+
+    stop_reason: CanonicalStopReason | None = None
+    if done:
+        stop_reason = _FINISH_REASON_OPENAI.get(finish_reason, "error")
+
+    # Usage can arrive on a *separate* terminal frame that carries no text/tool
+    # delta and no finish_reason: OpenAI's ``stream_options.include_usage`` emits a
+    # final ``choices: []`` event whose only payload is ``usage``. Compute it
+    # unconditionally (not just when ``done``) so token accounting survives.
+    usage: TokenUsage | None = None
+    usage_payload = payload.get("usage") or {}
+    if usage_payload:
+        usage = TokenUsage(
+            prompt=_as_int(usage_payload.get("prompt_tokens", 0)),
+            completion=_as_int(usage_payload.get("completion_tokens", 0)),
+        )
+
+    if not text_delta and not tool_call_deltas and not done and usage is None:
+        return None
+
+    return ChatResponseChunk(
+        text_delta=text_delta,
+        tool_call_deltas=tool_call_deltas,
+        stop_reason=stop_reason,
+        usage=usage,
+        done=done,
+    )
diff --git a/server/app/services/llm/tool_translation.py b/server/app/services/llm/tool_translation.py
new file mode 100644
index 00000000..cd0b0805
--- /dev/null
+++ b/server/app/services/llm/tool_translation.py
@@ -0,0 +1,511 @@
+"""Translate canonical ``ToolSpec`` → per-provider tool/function shape.
+
+Each translation helper returns a tuple ``(tools_list, tool_choice_or_none)``
+ready to drop into the provider's request body.
+
+Also exposes response parsers that convert provider-native message shapes
+back into canonical ``ChatResponse`` (with ``tool_calls``).
+"""
+
+from __future__ import annotations
+
+import json
+import logging
+from typing import Any, Literal
+
+from app.services.llm.base import ChatResponse, Message, TokenUsage, ToolCall, ToolSpec
+from app.services.llm.exceptions import ToolTranslationError
+
+logger = logging.getLogger(__name__)
+
+CanonicalStopReason = Literal["end_turn", "tool_use", "max_tokens", "error"]
+
+# Per-provider native-finish-reason → canonical mapping. ``None`` always means
+# "end_turn"; any reason absent from a table maps to "error".
+_FINISH_REASON_OPENAI = {
+    "stop": "end_turn",
+    "tool_calls": "tool_use",
+    "function_call": "tool_use",
+    "length": "max_tokens",
+}
+_FINISH_REASON_ANTHROPIC = {
+    "end_turn": "end_turn",
+    "stop_sequence": "end_turn",
+    "tool_use": "tool_use",
+    "max_tokens": "max_tokens",
+}
+_FINISH_REASON_GEMINI = {"STOP": "end_turn", "MAX_TOKENS": "max_tokens"}
+_FINISH_REASON_LLAMA = {"stop": "end_turn", "length": "max_tokens"}
+
+
+def _normalise_finish_reason(reason: str | None, mapping: dict[str, str]) -> CanonicalStopReason:
+    if reason is None:
+        return "end_turn"
+    return mapping.get(reason, "error")  # type: ignore[return-value]
+
+
+def normalise_anthropic_stop_reason(reason: str | None) -> CanonicalStopReason:
+    """Canonicalise an Anthropic ``stop_reason`` (shared by chat + streaming).
+
+    Single source of truth so the buffered (``parse_anthropic_response``) and
+    streamed (``AnthropicApiKeyAdapter.stream``) paths can never diverge. ``None``
+    → ``end_turn``; values Anthropic may emit but we don't model canonically
+    (``pause_turn``, ``refusal``) fall through to ``error``, matching the
+    non-stream path.
+    """
+    return _normalise_finish_reason(reason, _FINISH_REASON_ANTHROPIC)
+
+
+def _validate_force(tools: list[ToolSpec], force: str | None) -> None:
+    """Raise if ``force`` names a tool not present in ``tools`` (no-op when None)."""
+    if force is not None and not any(t.name == force for t in tools):
+        raise ToolTranslationError(f"force_tool={force!r} not in tools list")
+
+
+def content_to_text(content: str | list | None) -> str:
+    """Flatten a ``Message.content`` (str or list of text blocks) to plain text.
+
+    Blocks may be dicts (``{"type": "text", "text": "..."}``) or objects with a
+    ``.text`` attr. Shared by the OpenAI, Anthropic and Bedrock translators.
+    """
+    if isinstance(content, list):
+        parts: list[str] = []
+        for b in content:
+            if isinstance(b, dict):
+                parts.append(b.get("text") or "")
+            else:
+                parts.append(getattr(b, "text", "") or "")
+        return "".join(parts)
+    return content or ""
+
+
+def to_anthropic_messages(messages: list[Message]) -> list[dict]:
+    """Translate canonical messages to Anthropic's user/assistant shape.
+
+    System messages are pulled out by the caller (``request.system``).
+    Tool-result messages map to ``role=user`` with a ``tool_result`` block.
+    Shared by the Anthropic SDK adapter and the Bedrock anthropic-family path.
+    """
+    out: list[dict] = []
+    for m in messages:
+        if m.role == "system":
+            continue
+        text = content_to_text(m.content)
+        if m.role == "tool":
+            if not m.tool_call_id:
+                raise ToolTranslationError("Tool message missing tool_call_id")
+            out.append(
+                {
+                    "role": "user",
+                    "content": [
+                        {
+                            "type": "tool_result",
+                            "tool_use_id": m.tool_call_id,
+                            "content": text,
+                        }
+                    ],
+                }
+            )
+            continue
+        role = "assistant" if m.role == "assistant" else "user"
+        out.append({"role": role, "content": text})
+    return out
+
+
+# ---------------------------------------------------------------------------
+# OpenAI
+# ---------------------------------------------------------------------------
+def to_openai_tools(
+    tools: list[ToolSpec] | None, force: str | None
+) -> tuple[list[dict] | None, Any]:
+    if not tools:
+        return None, None
+    fns = [
+        {
+            "type": "function",
+            "function": {
+                "name": t.name,
+                "description": t.description,
+                "parameters": t.input_schema,
+            },
+        }
+        for t in tools
+    ]
+    _validate_force(tools, force)
+    choice: Any = None
+    if force is not None:
+        choice = {"type": "function", "function": {"name": force}}
+    return fns, choice
+
+
+def parse_openai_response(payload: dict) -> ChatResponse:
+    """Parse an OpenAI chat-completions response body."""
+    try:
+        choice = payload["choices"][0]
+        msg = choice["message"]
+    except (KeyError, IndexError, TypeError) as exc:
+        raise ToolTranslationError("OpenAI response missing choices/message") from exc
+
+    text = msg.get("content") or ""
+
+    tool_calls: list[ToolCall] = []
+    raw_tool_calls = msg.get("tool_calls") or []
+    if not isinstance(raw_tool_calls, list):
+        raise ToolTranslationError("OpenAI tool_calls must be a list")
+    for tc in raw_tool_calls:
+        if not isinstance(tc, dict):
+            raise ToolTranslationError("OpenAI tool_call entry must be an object")
+        fn = tc.get("function") or {}
+        if not isinstance(fn, dict):
+            raise ToolTranslationError("OpenAI tool_call function must be an object")
+        name = fn.get("name") or tc.get("name") or ""
+        raw_args = fn.get("arguments")
+        # Only None (and empty-string, which some compatible servers send for
+        # no-arg calls) falls back to {}. Other falsy non-objects ([], False, 0)
+        # must NOT be coerced to {} — they fall through to the isinstance check
+        # below and raise, rather than silently running a tool with empty input.
+        try:
+            if raw_args is None:
+                input_obj = {}
+            elif isinstance(raw_args, str):
+                input_obj = json.loads(raw_args) if raw_args else {}
+            else:
+                input_obj = raw_args
+        except (json.JSONDecodeError, TypeError) as exc:
+            raise ToolTranslationError("OpenAI tool_call arguments are not valid JSON") from exc
+        if not isinstance(input_obj, dict):
+            raise ToolTranslationError("OpenAI tool_call arguments must be an object")
+        tool_calls.append(ToolCall(id=str(tc.get("id") or name), name=name, input=input_obj))
+
+    stop_reason = _normalise_finish_reason(choice.get("finish_reason"), _FINISH_REASON_OPENAI)
+    usage_payload = payload.get("usage") or {}
+    usage = None
+    if usage_payload:
+        usage = TokenUsage(
+            prompt=int(usage_payload.get("prompt_tokens", 0)),
+            completion=int(usage_payload.get("completion_tokens", 0)),
+        )
+
+    # If the model used tool_calls, force-set stop_reason to tool_use even if
+    # finish_reason reported "stop" (some compatible servers do).
+    if tool_calls and stop_reason != "tool_use":
+        stop_reason = "tool_use"
+
+    return ChatResponse(
+        text=text,
+        tool_calls=tool_calls,
+        stop_reason=stop_reason,
+        usage=usage,
+        model=payload.get("model"),
+    )
+
+
+# ---------------------------------------------------------------------------
+# Anthropic
+# ---------------------------------------------------------------------------
+def to_anthropic_tools(
+    tools: list[ToolSpec] | None, force: str | None
+) -> tuple[list[dict] | None, Any]:
+    if not tools:
+        return None, None
+    anthropic_tools = [
+        {
+            "name": t.name,
+            "description": t.description,
+            "input_schema": t.input_schema,
+        }
+        for t in tools
+    ]
+    _validate_force(tools, force)
+    choice: Any = None
+    if force is not None:
+        choice = {"type": "tool", "name": force}
+    return anthropic_tools, choice
+
+
+def parse_anthropic_response(message: Any) -> ChatResponse:
+    """Parse the official ``anthropic`` SDK Message object."""
+    text_parts: list[str] = []
+    tool_calls: list[ToolCall] = []
+
+    if isinstance(message, dict):
+        content_blocks = message.get("content") or []
+    else:
+        content_blocks = getattr(message, "content", None) or []
+    for block in content_blocks:
+        if isinstance(block, dict):
+            btype = block.get("type")
+        else:
+            btype = getattr(block, "type", None)
+        if btype == "text":
+            if isinstance(block, dict):
+                text = block.get("text") or ""
+            else:
+                text = getattr(block, "text", "") or ""
+            text_parts.append(text)
+        elif btype == "tool_use":
+            if isinstance(block, dict):
+                name = block.get("name")
+                tool_id = block.get("id") or name
+                input_obj = block.get("input")
+            else:
+                name = getattr(block, "name", None)
+                tool_id = getattr(block, "id", None) or name
+                input_obj = getattr(block, "input", None)
+            if not name or not tool_id:
+                raise ToolTranslationError("Anthropic tool_use block missing id/name")
+            tool_calls.append(
+                ToolCall(id=str(tool_id), name=str(name), input=dict(input_obj or {}))
+            )
+
+    stop_raw = getattr(message, "stop_reason", None) or (
+        message.get("stop_reason") if isinstance(message, dict) else None
+    )
+    stop_reason = _normalise_finish_reason(stop_raw, _FINISH_REASON_ANTHROPIC)
+    if tool_calls and stop_reason != "tool_use":
+        stop_reason = "tool_use"
+
+    usage_obj = getattr(message, "usage", None) or (
+        message.get("usage") if isinstance(message, dict) else None
+    )
+    usage = None
+    if usage_obj is not None:
+        prompt = (
+            getattr(usage_obj, "input_tokens", None)
+            if not isinstance(usage_obj, dict)
+            else usage_obj.get("input_tokens")
+        )
+        completion = (
+            getattr(usage_obj, "output_tokens", None)
+            if not isinstance(usage_obj, dict)
+            else usage_obj.get("output_tokens")
+        )
+        if prompt is not None and completion is not None:
+            usage = TokenUsage(prompt=int(prompt), completion=int(completion))
+
+    model = getattr(message, "model", None) or (
+        message.get("model") if isinstance(message, dict) else None
+    )
+
+    return ChatResponse(
+        text="".join(text_parts),
+        tool_calls=tool_calls,
+        stop_reason=stop_reason,
+        usage=usage,
+        model=model,
+    )
+
+
+# ---------------------------------------------------------------------------
+# Google Gemini (native generativelanguage API)
+# ---------------------------------------------------------------------------
+def to_gemini_tools(
+    tools: list[ToolSpec] | None, force: str | None
+) -> tuple[list[dict] | None, Any]:
+    """Translate canonical tools → Gemini ``function_declarations`` + toolConfig.
+
+    Returns ``(tools_list, tool_config_or_none)``. Gemini nests every function
+    declaration under a single ``tools`` entry, distinct from OpenAI ``functions``
+    and Anthropic ``tools``.
+    """
+    if not tools:
+        return None, None
+    declarations = [
+        {
+            "name": t.name,
+            "description": t.description,
+            "parameters": t.input_schema,
+        }
+        for t in tools
+    ]
+    gemini_tools = [{"function_declarations": declarations}]
+    _validate_force(tools, force)
+    tool_config: Any = None
+    if force is not None:
+        tool_config = {
+            "function_calling_config": {
+                "mode": "ANY",
+                "allowed_function_names": [force],
+            }
+        }
+    return gemini_tools, tool_config
+
+
+def parse_gemini_response(payload: dict) -> ChatResponse:
+    """Parse a Gemini ``generateContent`` response body."""
+    try:
+        candidates = payload["candidates"]
+        candidate = candidates[0]
+    except (KeyError, IndexError, TypeError) as exc:
+        # Empty candidates (safety block) or missing key — surface as a
+        # translation error so the gateway logs/handles it consistently.
+        raise ToolTranslationError("Gemini response missing candidates") from exc
+
+    content = candidate.get("content") or {}
+    parts = content.get("parts") or []
+
+    text_parts: list[str] = []
+    tool_calls: list[ToolCall] = []
+    for part in parts:
+        if not isinstance(part, dict):
+            continue
+        if "functionCall" in part:
+            raw_fn = part.get("functionCall")
+            if raw_fn is None:
+                fn: dict = {}
+            elif isinstance(raw_fn, dict):
+                fn = raw_fn
+            else:
+                raise ToolTranslationError("Gemini functionCall must be an object")
+            name = fn.get("name")
+            if not name:
+                raise ToolTranslationError("Gemini functionCall missing name")
+            args = fn.get("args")
+            if args is None:
+                input_obj: dict = {}
+            elif isinstance(args, dict):
+                input_obj = args
+            else:
+                raise ToolTranslationError("Gemini functionCall args must be an object")
+            tool_calls.append(ToolCall(id=str(name), name=str(name), input=input_obj))
+        elif "text" in part:
+            text_parts.append(part.get("text") or "")
+
+    stop_reason = _normalise_finish_reason(candidate.get("finishReason"), _FINISH_REASON_GEMINI)
+    if tool_calls and stop_reason != "tool_use":
+        stop_reason = "tool_use"
+
+    usage_payload = payload.get("usageMetadata") or {}
+    usage = None
+    if usage_payload:
+        usage = TokenUsage(
+            prompt=int(usage_payload.get("promptTokenCount", 0)),
+            completion=int(usage_payload.get("candidatesTokenCount", 0)),
+        )
+
+    return ChatResponse(
+        text="".join(text_parts),
+        tool_calls=tool_calls,
+        stop_reason=stop_reason,
+        usage=usage,
+        model=payload.get("modelVersion"),
+    )
+
+
+# ---------------------------------------------------------------------------
+# Bedrock — Llama family
+#
+# Llama models on Bedrock (meta.llama*) have no structured tool/function field
+# in the InvokeModel request. The convention (matching Meta's tool-use prompt
+# format) is to describe the available tools inside the system prompt and ask
+# the model to emit a single JSON object as its reply. We then parse that JSON
+# back into a canonical ``ToolCall``.
+# ---------------------------------------------------------------------------
+def render_llama_tool_instructions(tools: list[ToolSpec] | None, force: str | None) -> str | None:
+    """Build a system-prompt fragment describing the available tools.
+
+    Returns ``None`` when there are no tools. When ``force`` is set, the
+    fragment instructs the model to call exactly that tool.
+    """
+    if not tools:
+        return None
+    _validate_force(tools, force)
+
+    lines = [
+        "You have access to the following tools. To call a tool, respond with "
+        "ONLY a single JSON object and no other text, of the form: "
+        '{"name": "<tool_name>", "input": {<arguments>}}.',
+    ]
+    for t in tools:
+        lines.append(
+            f"- {t.name}: {t.description} "
+            f"(input JSON schema: {json.dumps(t.input_schema, sort_keys=True)})"
+        )
+    if force is not None:
+        lines.append(f"You MUST call the tool named {force!r}.")
+    return "\n".join(lines)
+
+
+def parse_llama_response(payload: dict, tool_names: set[str] | None = None) -> ChatResponse:
+    """Parse a Bedrock Llama InvokeModel response body.
+
+    Bedrock Llama returns ``{"generation": "...", "stop_reason": "stop|length",
+    "prompt_token_count": int, "generation_token_count": int}``. When the
+    generated text is a tool-call JSON object whose ``name`` is one of the
+    expected tools, surface it as a ``ToolCall``.
+    """
+    if not isinstance(payload, dict):
+        raise ToolTranslationError("Bedrock Llama response is not a JSON object")
+
+    generation = payload.get("generation")
+    if generation is None:
+        raise ToolTranslationError("Bedrock Llama response missing 'generation'")
+    text = str(generation)
+
+    stop_reason = _normalise_finish_reason(payload.get("stop_reason"), _FINISH_REASON_LLAMA)
+
+    usage = None
+    prompt_tokens = payload.get("prompt_token_count")
+    completion_tokens = payload.get("generation_token_count")
+    if prompt_tokens is not None and completion_tokens is not None:
+        usage = TokenUsage(prompt=int(prompt_tokens), completion=int(completion_tokens))
+
+    tool_calls: list[ToolCall] = []
+    parsed = _try_parse_tool_json(text)
+    if parsed is not None:
+        name = parsed.get("name")
+        tool_input = parsed.get("input")
+        if (
+            isinstance(name, str)
+            and name
+            and isinstance(tool_input, dict)
+            and (tool_names is None or name in tool_names)
+        ):
+            tool_calls.append(ToolCall(id=name, name=name, input=tool_input))
+            stop_reason = "tool_use"
+            text = ""
+
+    return ChatResponse(
+        text=text,
+        tool_calls=tool_calls,
+        stop_reason=stop_reason,
+        usage=usage,
+        model=None,
+    )
+
+
+def _try_parse_tool_json(text: str) -> dict | None:
+    """Best-effort extraction of a single ``{"name":..., "input":...}`` object.
+
+    Llama sometimes wraps the JSON in prose or code fences; we extract the first
+    balanced ``{...}`` span and attempt to decode it.
+    """
+    candidate = text.strip()
+    if not candidate:
+        return None
+    # Strip ``` fences if present.
+    if candidate.startswith("```"):
+        candidate = candidate.strip("`")
+        # drop a leading "json" language tag
+        if candidate.lower().startswith("json"):
+            candidate = candidate[4:]
+        candidate = candidate.strip()
+
+    start = candidate.find("{")
+    if start == -1:
+        return None
+    depth = 0
+    for i in range(start, len(candidate)):
+        ch = candidate[i]
+        if ch == "{":
+            depth += 1
+        elif ch == "}":
+            depth -= 1
+            if depth == 0:
+                blob = candidate[start : i + 1]
+                try:
+                    obj = json.loads(blob)
+                except json.JSONDecodeError:
+                    return None
+                return obj if isinstance(obj, dict) else None
+    return None
diff --git a/server/app/services/llm/url_validator.py b/server/app/services/llm/url_validator.py
new file mode 100644
index 00000000..081ff107
--- /dev/null
+++ b/server/app/services/llm/url_validator.py
@@ -0,0 +1,96 @@
+"""Validate custom OpenAI-compatible base URLs.
+
+Rules (spec §4.7, §6.2):
+- Scheme: only ``http`` or ``https``
+- ``http``: only loopback (127.0.0.1, ::1, localhost) and RFC1918 private ranges
+  (10.0.0.0/8, 172.16.0.0/12, 192.168.0.0/16)
+- ``https``: any host
+- Reject embedded credentials in the URL (``user:pass@host``)
+- Accept optional path prefix (e.g., ``/v1``) — preserved
+- Reject query strings and fragments
+"""
+
+from __future__ import annotations
+
+import ipaddress
+from urllib.parse import urlsplit, urlunsplit
+
+# Private network blocks acceptable for plain HTTP base URLs.
+_PRIVATE_NETWORKS = (
+    ipaddress.ip_network("10.0.0.0/8"),
+    ipaddress.ip_network("172.16.0.0/12"),
+    ipaddress.ip_network("192.168.0.0/16"),
+    ipaddress.ip_network("127.0.0.0/8"),
+    ipaddress.ip_network("::1/128"),
+    ipaddress.ip_network("fc00::/7"),  # IPv6 unique local
+    ipaddress.ip_network("fe80::/10"),  # IPv6 link-local
+)
+
+
+class InvalidBaseUrlError(ValueError):
+    """Raised when a base URL fails validation."""
+
+
+def validate_compatible_base_url(raw: str) -> str:
+    """Validate and normalise a custom OpenAI-compatible base URL.
+
+    Returns the normalised URL (scheme + host + optional path, no trailing /).
+    Raises :class:`InvalidBaseUrlError` on failure.
+    """
+    if not raw or not isinstance(raw, str):
+        raise InvalidBaseUrlError("base_url is required")
+    raw = raw.strip()
+    if not raw:
+        raise InvalidBaseUrlError("base_url is empty")
+
+    try:
+        parts = urlsplit(raw)
+    except ValueError as exc:
+        raise InvalidBaseUrlError("base_url is malformed") from exc
+
+    scheme = parts.scheme.lower()
+    if scheme not in ("http", "https"):
+        raise InvalidBaseUrlError("base_url scheme must be 'http' or 'https'")
+
+    if not parts.netloc:
+        raise InvalidBaseUrlError("base_url is missing a host")
+
+    if parts.username or parts.password:
+        raise InvalidBaseUrlError(
+            "base_url must not embed credentials — provide a bearer separately"
+        )
+
+    if parts.query or parts.fragment:
+        raise InvalidBaseUrlError("base_url must not include a query string or fragment")
+
+    hostname = (parts.hostname or "").lower()
+    if not hostname:
+        raise InvalidBaseUrlError("base_url has an empty hostname")
+
+    if scheme == "http":
+        if hostname == "localhost":
+            pass
+        else:
+            try:
+                addr = ipaddress.ip_address(hostname)
+            except ValueError as exc:
+                raise InvalidBaseUrlError(
+                    "http:// base_url must be loopback or a private (RFC1918) IP"
+                ) from exc
+            if not any(addr in net for net in _PRIVATE_NETWORKS):
+                raise InvalidBaseUrlError(
+                    "http:// base_url must be loopback or a private (RFC1918) IP"
+                )
+
+    # Preserve path but drop trailing slash for stable storage. Empty path is OK.
+    path = (parts.path or "").rstrip("/")
+
+    # Rebuild without credentials / query / fragment.
+    # Use the netloc minus any user-info (urlsplit accepts these in raw form;
+    # we've already rejected those above, so netloc is host[:port]).
+    netloc = parts.netloc
+    if "@" in netloc:
+        netloc = netloc.rsplit("@", 1)[-1]
+
+    normalised = urlunsplit((scheme, netloc, path, "", ""))
+    return normalised
diff --git a/server/app/services/recommendation/llm_client.py b/server/app/services/recommendation/llm_client.py
index e9d2c735..7ccb040c 100644
--- a/server/app/services/recommendation/llm_client.py
+++ b/server/app/services/recommendation/llm_client.py
@@ -1,21 +1,33 @@
-"""LLM client for generating recommendation search queries via Claude Haiku.
+"""LLM client for generating recommendation search queries via the Gateway.
 
-Sends the event's musical profile and the DJ's prompt to Claude,
-which returns structured search queries (with target BPM/key/genre)
-that feed into the existing Tidal/Beatport search pipeline.
+The recommendation engine no longer talks directly to Anthropic — instead it
+calls ``Gateway.dispatch(...)``, which routes to the actor DJ's connector (or
+the org default). The forced tool_use semantics are preserved across providers
+via ``services/llm/tool_translation.py``.
+
+See ``docs/superpowers/specs/2026-05-24-admin-ai-oauth-design.md`` §7.
 """
 
+from __future__ import annotations
+
 import json
 import logging
 
-from anthropic import AsyncAnthropic
+from sqlalchemy.orm import Session
 
-from app.core.config import get_settings
+from app.models.user import User
+from app.services.llm.base import ChatRequest, Message, ToolSpec
+from app.services.llm.gateway import Gateway
 from app.services.recommendation.llm_hooks import LLMSuggestionQuery, LLMSuggestionResult
 from app.services.recommendation.scorer import EventProfile, TrackProfile
 
 logger = logging.getLogger(__name__)
 
+# Default max output tokens for query generation. Was previously sourced from
+# the ``ANTHROPIC_MAX_TOKENS`` env var via settings; that legacy env-var path was
+# removed in #343 now that the connector system is the source of truth.
+DEFAULT_MAX_TOKENS = 1024
+
 SYSTEM_PROMPT = """\
 You are a DJ assistant helping curate song suggestions for a live event.
 
@@ -76,8 +88,11 @@
 
 Include brief reasoning explaining why you chose each query."""
 
+# Tool name kept stable so any cached tool_use traces remain decodable.
+SEARCH_QUERIES_TOOL_NAME = "search_queries"
+
 SEARCH_QUERIES_TOOL = {
-    "name": "search_queries",
+    "name": SEARCH_QUERIES_TOOL_NAME,
     "description": (
         "Return structured search queries for finding tracks that match the DJ's intent."
     ),
@@ -191,28 +206,73 @@ def build_user_prompt(
     return "\n".join(parts)
 
 
-def _parse_tool_response(response) -> LLMSuggestionResult:
-    """Parse the Claude API response into an LLMSuggestionResult."""
+def _parse_query_items(items: object) -> list[LLMSuggestionQuery]:
+    """Defensively convert a tool payload ``queries`` array into query objects.
+
+    The tool output comes from an external LLM provider — including custom
+    OpenAI-compatible endpoints (Ollama, vLLM) that may not enforce the
+    forced-tool JSON schema. Skip any malformed item rather than letting one bad
+    entry crash the whole recommendation flow.
+    """
+    if not isinstance(items, list):
+        return []
+    parsed: list[LLMSuggestionQuery] = []
+    for q in items:
+        if not isinstance(q, dict):
+            continue
+        search_query = q.get("search_query")
+        if not isinstance(search_query, str) or not search_query.strip():
+            continue
+        parsed.append(
+            LLMSuggestionQuery(
+                search_query=search_query,
+                target_bpm=q.get("target_bpm"),
+                target_key=q.get("target_key"),
+                target_genre=q.get("target_genre"),
+                reasoning=q.get("reasoning", "") if isinstance(q.get("reasoning"), str) else "",
+            )
+        )
+    return parsed
+
+
+def _parse_tool_response(response) -> LLMSuggestionResult:  # noqa: ANN001 — dual-shape input
+    """Parse a gateway ``ChatResponse`` into an ``LLMSuggestionResult``.
+
+    The gateway is the only producer of responses (the legacy direct-Anthropic
+    path was removed in #343). A defensive second path also handles an
+    Anthropic-SDK ``Message``-like object (``.content`` blocks) so any cached
+    ``tool_use`` traces or hand-constructed fixtures remain decodable.
+    """
+    from app.services.llm.base import ChatResponse
+
     raw_text = ""
     queries: list[LLMSuggestionQuery] = []
 
-    for block in response.content:
-        if block.type == "text":
-            raw_text += block.text
-        elif block.type == "tool_use" and block.name == "search_queries":
-            raw_text += json.dumps(block.input)
-            for q in block.input.get("queries", []):
-                queries.append(
-                    LLMSuggestionQuery(
-                        search_query=q["search_query"],
-                        target_bpm=q.get("target_bpm"),
-                        target_key=q.get("target_key"),
-                        target_genre=q.get("target_genre"),
-                        reasoning=q.get("reasoning", ""),
-                    )
-                )
-
-    return LLMSuggestionResult(queries=queries, raw_response=raw_text)
+    # Path 1 — canonical ChatResponse (isinstance, not ducktype, so MagicMocks
+    # in legacy tests fall through to path 2 instead of matching here).
+    if isinstance(response, ChatResponse):
+        if response.text:
+            raw_text += response.text
+        for tc in response.tool_calls or []:
+            if tc.name == SEARCH_QUERIES_TOOL_NAME:
+                payload = tc.input if isinstance(tc.input, dict) else {}
+                raw_text += json.dumps(payload)
+                queries.extend(_parse_query_items(payload.get("queries", [])))
+        return LLMSuggestionResult(queries=queries, raw_response=raw_text, model=response.model)
+
+    # Path 2 — legacy Anthropic SDK Message-like object.
+    for block in getattr(response, "content", []) or []:
+        btype = getattr(block, "type", None)
+        if btype == "text":
+            raw_text += getattr(block, "text", "")
+        elif btype == "tool_use" and getattr(block, "name", "") == SEARCH_QUERIES_TOOL_NAME:
+            block_input = block.input if isinstance(block.input, dict) else {}
+            raw_text += json.dumps(block_input)
+            queries.extend(_parse_query_items(block_input.get("queries", [])))
+
+    return LLMSuggestionResult(
+        queries=queries, raw_response=raw_text, model=getattr(response, "model", None)
+    )
 
 
 async def call_llm(
@@ -222,18 +282,23 @@ async def call_llm(
     tracks: list[TrackProfile] | None = None,
     rejected_tracks: list[tuple[str, str]] | None = None,
     currently_playing: tuple[str, str, float | None] | None = None,
+    *,
+    db: Session | None = None,
+    actor: User | None = None,
 ) -> LLMSuggestionResult:
-    """Call Claude Haiku to generate search queries from a DJ prompt.
+    """Generate structured search queries via the LLM gateway.
 
-    Returns an LLMSuggestionResult with 1-max_queries structured queries.
-    Raises on API failure (caller should handle).
-    """
-    settings = get_settings()
+    Routes through ``Gateway.dispatch`` so credentials come from the actor DJ's
+    connector (or the org default). ``db`` is required; the legacy
+    direct-Anthropic env-var fallback was removed in #343 now that the connector
+    system is the sole source of truth.
 
-    client = AsyncAnthropic(
-        api_key=settings.anthropic_api_key,
-        timeout=settings.anthropic_timeout_seconds,
-    )
+    Returns at most ``max_queries`` queries.
+    """
+    if db is None:
+        raise ValueError(
+            "call_llm requires a db session — the connector system is the source of truth"
+        )
 
     user_message = build_user_prompt(
         profile,
@@ -243,22 +308,28 @@ async def call_llm(
         currently_playing=currently_playing,
     )
 
-    response = await client.messages.create(
-        model=settings.anthropic_model,
-        max_tokens=settings.anthropic_max_tokens,
+    chat_request = ChatRequest(
+        messages=[Message(role="user", content=user_message)],
         system=SYSTEM_PROMPT,
-        tools=[SEARCH_QUERIES_TOOL],
-        tool_choice={"type": "tool", "name": "search_queries"},
-        messages=[{"role": "user", "content": user_message}],
+        tools=[
+            ToolSpec(
+                name=SEARCH_QUERIES_TOOL_NAME,
+                description=SEARCH_QUERIES_TOOL["description"],
+                input_schema=SEARCH_QUERIES_TOOL["input_schema"],
+            )
+        ],
+        force_tool=SEARCH_QUERIES_TOOL_NAME,
+        max_tokens=DEFAULT_MAX_TOKENS,
+        temperature=None,
     )
-
+    response = await Gateway.dispatch(db, actor, chat_request, purpose="recommendation")
     result = _parse_tool_response(response)
 
-    # Trim to max_queries
     if len(result.queries) > max_queries:
         result = LLMSuggestionResult(
             queries=result.queries[:max_queries],
             raw_response=result.raw_response,
+            model=result.model,
         )
 
     logger.info(
@@ -268,33 +339,3 @@ async def call_llm(
     )
 
     return result
-
-
-async def raw_messages_create(
-    *,
-    model: str,
-    system: str,
-    tools: list[dict] | None,
-    tool_choice: dict | None,
-    messages: list[dict],
-    max_tokens: int,
-):
-    """Low-level Anthropic messages.create passthrough.
-
-    Exists so the provider-agnostic LLM gateway (``app.services.llm.gateway``)
-    can delegate here without importing a provider SDK itself. The ``anthropic``
-    import stays confined to this module.
-    """
-    settings = get_settings()
-    client = AsyncAnthropic(
-        api_key=settings.anthropic_api_key,
-        timeout=settings.anthropic_timeout_seconds,
-    )
-    kwargs: dict = {"model": model, "max_tokens": max_tokens, "messages": messages}
-    if system:
-        kwargs["system"] = system
-    if tools:
-        kwargs["tools"] = tools
-    if tool_choice:
-        kwargs["tool_choice"] = tool_choice
-    return await client.messages.create(**kwargs)
diff --git a/server/app/services/recommendation/llm_hooks.py b/server/app/services/recommendation/llm_hooks.py
index 271cdc66..d74efd74 100644
--- a/server/app/services/recommendation/llm_hooks.py
+++ b/server/app/services/recommendation/llm_hooks.py
@@ -30,6 +30,7 @@ class LLMSuggestionResult:
 
     queries: list[LLMSuggestionQuery]
     raw_response: str  # Full LLM response for debugging
+    model: str | None = None  # Provider model that actually produced the response
 
 
 async def generate_llm_suggestions(
@@ -39,12 +40,15 @@ async def generate_llm_suggestions(
     tracks: list[TrackProfile] | None = None,
     rejected_tracks: list[tuple[str, str]] | None = None,
     currently_playing: tuple[str, str, float | None] | None = None,
+    *,
+    db=None,
+    actor=None,
 ) -> LLMSuggestionResult:
-    """Generate search queries via LLM (Claude Haiku).
+    """Generate search queries via the LLM gateway.
 
-    Calls Claude to interpret the DJ's prompt in context of the event's
-    musical profile and track list, returning structured search queries
-    that feed into the existing search + scoring pipeline.
+    The gateway routes to the actor DJ's connector (or org default). ``db`` is
+    required by ``call_llm`` — the legacy direct-Anthropic env-var path was
+    removed in #343 now that the connector system is the source of truth.
     """
     from app.services.recommendation.llm_client import call_llm
 
@@ -55,24 +59,55 @@ async def generate_llm_suggestions(
         tracks=tracks,
         rejected_tracks=rejected_tracks,
         currently_playing=currently_playing,
+        db=db,
+        actor=actor,
     )
 
 
-def is_llm_available(db=None) -> bool:
+def is_llm_available(db=None, actor=None) -> bool:
     """Check if LLM recommendations are configured and available.
 
-    When db is provided, also checks the DB-backed llm_enabled toggle.
-    """
-    from app.core.config import get_settings
+    Mirrors :func:`app.services.llm.gateway._resolve_connector` semantics so the
+    "feature available" signal aligns with whether dispatch will actually
+    succeed:
+
+    - If ``actor`` is provided: returns True when the actor owns an active
+      connector (matches the per-DJ MRU lookup).
+    - Otherwise (no actor or no actor-owned active connector): returns True
+      when an active system-default connector is configured.
 
-    if not get_settings().anthropic_api_key:
+    Connector-backed only. Without ``db`` no connector can be resolved, so it
+    returns ``False`` — the legacy Anthropic env-var fallback was removed in #343.
+    """
+    if db is None:
         return False
 
-    if db is not None:
-        from app.services.system_settings import get_system_settings
+    from app.models.llm_connector import STATUS_ACTIVE, LlmConnector
+    from app.models.system_settings import SystemSettings
+    from app.services.system_settings import get_system_settings
 
-        settings = get_system_settings(db)
-        if not settings.llm_enabled:
-            return False
+    settings = get_system_settings(db)
+    if not settings.llm_enabled:
+        return False
 
-    return True
+    # Per-DJ active connector — matches gateway resolver step 1.
+    if actor is not None:
+        actor_active = (
+            db.query(LlmConnector.id)
+            .filter(
+                LlmConnector.user_id == actor.id,
+                LlmConnector.status == STATUS_ACTIVE,
+            )
+            .first()
+        )
+        if actor_active is not None:
+            return True
+
+    # System default fallback — matches gateway resolver step 2.
+    sys_settings = db.query(SystemSettings).first()
+    if sys_settings and sys_settings.llm_default_connector_id:
+        default = db.get(LlmConnector, sys_settings.llm_default_connector_id)
+        if default is not None and default.status == STATUS_ACTIVE:
+            return True
+
+    return False
diff --git a/server/app/services/recommendation/service.py b/server/app/services/recommendation/service.py
index 8a5d0c30..74df2ca0 100644
--- a/server/app/services/recommendation/service.py
+++ b/server/app/services/recommendation/service.py
@@ -811,6 +811,7 @@ class LLMRecommendationResult:
     total_candidates_searched: int
     services_used: list[str]
     llm_queries: list  # list of LLMSuggestionQuery
+    llm_model: str | None = None  # Provider model that produced the queries
     mb_verified: dict[str, bool] = None  # type: ignore[assignment]
 
     def __post_init__(self):
@@ -848,13 +849,16 @@ async def generate_recommendations_from_llm(
         (playing.artist, playing.song_title, getattr(playing, "bpm", None)) if playing else None
     )
 
-    # Step 2: Call LLM (pass enriched tracks + rejected + currently playing)
+    # Step 2: Call LLM (pass enriched tracks + rejected + currently playing).
+    # Route via the gateway by supplying db + actor (the event owner).
     llm_result = await generate_llm_suggestions(
         profile,
         prompt,
         tracks=enriched or None,
         rejected_tracks=rejected_names or None,
         currently_playing=currently_playing,
+        db=db,
+        actor=user,
     )
 
     if not llm_result.queries:
@@ -865,6 +869,7 @@ async def generate_recommendations_from_llm(
             total_candidates_searched=0,
             services_used=[],
             llm_queries=[],
+            llm_model=llm_result.model,
         )
 
     # Step 3: Use LLM query strings as search queries
@@ -915,6 +920,7 @@ async def generate_recommendations_from_llm(
         total_candidates_searched=total_searched,
         services_used=services_used,
         llm_queries=llm_result.queries,
+        llm_model=llm_result.model,
         mb_verified=mb_verified,
     )
 
diff --git a/server/app/services/system_settings.py b/server/app/services/system_settings.py
index 68109fc0..97d9f815 100644
--- a/server/app/services/system_settings.py
+++ b/server/app/services/system_settings.py
@@ -2,6 +2,11 @@
 
 from app.models.system_settings import SystemSettings
 
+# Sentinel for "field intentionally not provided" — distinguishes from explicit
+# None (which means "clear the FK"). update_system_settings uses this for the
+# llm_default_connector_id field which accepts None as a valid value.
+_UNSET: object = object()
+
 
 def get_system_settings(db: Session) -> SystemSettings:
     """Get the singleton system settings row, creating with defaults if missing."""
@@ -19,6 +24,10 @@ def get_system_settings(db: Session) -> SystemSettings:
             llm_enabled=True,
             llm_model="claude-haiku-4-5-20251001",
             llm_rate_limit_per_minute=3,
+            llm_apikey_connectors_enabled=True,
+            llm_compatible_connector_enabled=True,
+            llm_default_connector_id=None,
+            llm_call_log_retention_days=30,
         )
         db.add(settings)
         db.commit()
@@ -38,6 +47,10 @@ def update_system_settings(
     llm_enabled: bool | None = None,
     llm_model: str | None = None,
     llm_rate_limit_per_minute: int | None = None,
+    llm_apikey_connectors_enabled: bool | None = None,
+    llm_compatible_connector_enabled: bool | None = None,
+    llm_default_connector_id: int | None | object = _UNSET,
+    llm_call_log_retention_days: int | None = None,
 ) -> SystemSettings:
     """Update system settings fields."""
     settings = get_system_settings(db)
@@ -61,6 +74,14 @@ def update_system_settings(
         settings.llm_model = llm_model
     if llm_rate_limit_per_minute is not None:
         settings.llm_rate_limit_per_minute = llm_rate_limit_per_minute
+    if llm_apikey_connectors_enabled is not None:
+        settings.llm_apikey_connectors_enabled = llm_apikey_connectors_enabled
+    if llm_compatible_connector_enabled is not None:
+        settings.llm_compatible_connector_enabled = llm_compatible_connector_enabled
+    if llm_default_connector_id is not _UNSET:
+        settings.llm_default_connector_id = llm_default_connector_id  # type: ignore[assignment]
+    if llm_call_log_retention_days is not None:
+        settings.llm_call_log_retention_days = llm_call_log_retention_days
     db.commit()
     db.refresh(settings)
     return settings
diff --git a/server/openapi.json b/server/openapi.json
index 3b6d7956..e0551791 100644
--- a/server/openapi.json
+++ b/server/openapi.json
@@ -172,6 +172,233 @@
         "title": "ActivityLogEntry",
         "type": "object"
       },
+      "AdminAuditOut": {
+        "description": "Paginated audit-event browse response.",
+        "properties": {
+          "limit": {
+            "title": "Limit",
+            "type": "integer"
+          },
+          "offset": {
+            "title": "Offset",
+            "type": "integer"
+          },
+          "rows": {
+            "items": {
+              "$ref": "#/components/schemas/AuditEventRow"
+            },
+            "title": "Rows",
+            "type": "array"
+          },
+          "total": {
+            "title": "Total",
+            "type": "integer"
+          }
+        },
+        "required": [
+          "limit",
+          "offset",
+          "rows",
+          "total"
+        ],
+        "title": "AdminAuditOut",
+        "type": "object"
+      },
+      "AdminConnectorCapPatch": {
+        "description": "Admin set/clear a connector's monthly token cap (issue #339).\n\n``monthly_token_cap`` is **required** so intent is always explicit: an\ninteger sets the cap, ``null`` clears it (unlimited). Omitting the field\n(an empty ``{}`` body) is rejected with 422 rather than silently treated as\n``null`` \u2014 that would let an accidental no-field PATCH wipe a configured\ncap. A non-null value must be a non-negative integer; ``0`` means \"no\nfurther calls this month\". The upper bound is a sanity ceiling, not a\nbilling limit.",
+        "properties": {
+          "monthly_token_cap": {
+            "anyOf": [
+              {
+                "maximum": 1000000000.0,
+                "minimum": 0.0,
+                "type": "integer"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Monthly Token Cap"
+          }
+        },
+        "required": [
+          "monthly_token_cap"
+        ],
+        "title": "AdminConnectorCapPatch",
+        "type": "object"
+      },
+      "AdminConnectorOut": {
+        "description": "Admin view \u2014 adds the DJ's username for display.",
+        "properties": {
+          "base_url_plain": {
+            "anyOf": [
+              {
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Base Url Plain"
+          },
+          "connector_type": {
+            "enum": [
+              "openai_apikey",
+              "anthropic_apikey",
+              "openai_compatible",
+              "openrouter_apikey",
+              "xai_apikey",
+              "bedrock",
+              "azure_openai",
+              "gemini_apikey"
+            ],
+            "title": "Connector Type",
+            "type": "string"
+          },
+          "created_at": {
+            "format": "date-time",
+            "title": "Created At",
+            "type": "string"
+          },
+          "current_month_tokens": {
+            "default": 0,
+            "title": "Current Month Tokens",
+            "type": "integer"
+          },
+          "display_name": {
+            "title": "Display Name",
+            "type": "string"
+          },
+          "dj_username": {
+            "title": "Dj Username",
+            "type": "string"
+          },
+          "id": {
+            "title": "Id",
+            "type": "integer"
+          },
+          "is_default": {
+            "default": false,
+            "title": "Is Default",
+            "type": "boolean"
+          },
+          "last_error": {
+            "anyOf": [
+              {
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Last Error"
+          },
+          "last_health_check_at": {
+            "anyOf": [
+              {
+                "format": "date-time",
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Last Health Check At"
+          },
+          "last_health_check_status": {
+            "anyOf": [
+              {
+                "enum": [
+                  "ok",
+                  "auth_invalid",
+                  "rate_limited",
+                  "quota_exceeded",
+                  "provider_unavailable",
+                  "error"
+                ],
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Last Health Check Status"
+          },
+          "last_used_at": {
+            "anyOf": [
+              {
+                "format": "date-time",
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Last Used At"
+          },
+          "model_hint": {
+            "anyOf": [
+              {
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Model Hint"
+          },
+          "monthly_token_cap": {
+            "anyOf": [
+              {
+                "type": "integer"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Monthly Token Cap"
+          },
+          "status": {
+            "enum": [
+              "active",
+              "auth_invalid",
+              "disabled"
+            ],
+            "title": "Status",
+            "type": "string"
+          },
+          "updated_at": {
+            "format": "date-time",
+            "title": "Updated At",
+            "type": "string"
+          },
+          "user_id": {
+            "title": "User Id",
+            "type": "integer"
+          }
+        },
+        "required": [
+          "base_url_plain",
+          "connector_type",
+          "created_at",
+          "current_month_tokens",
+          "display_name",
+          "dj_username",
+          "id",
+          "is_default",
+          "last_error",
+          "last_health_check_at",
+          "last_health_check_status",
+          "last_used_at",
+          "model_hint",
+          "monthly_token_cap",
+          "status",
+          "updated_at",
+          "user_id"
+        ],
+        "title": "AdminConnectorOut",
+        "type": "object"
+      },
       "AdminEventOut": {
         "properties": {
           "code": {
@@ -233,6 +460,119 @@
         "title": "AdminEventOut",
         "type": "object"
       },
+      "AdminPolicyOut": {
+        "properties": {
+          "llm_apikey_connectors_enabled": {
+            "title": "Llm Apikey Connectors Enabled",
+            "type": "boolean"
+          },
+          "llm_call_log_retention_days": {
+            "title": "Llm Call Log Retention Days",
+            "type": "integer"
+          },
+          "llm_compatible_connector_enabled": {
+            "title": "Llm Compatible Connector Enabled",
+            "type": "boolean"
+          },
+          "llm_default_connector_id": {
+            "anyOf": [
+              {
+                "type": "integer"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Llm Default Connector Id"
+          }
+        },
+        "required": [
+          "llm_apikey_connectors_enabled",
+          "llm_call_log_retention_days",
+          "llm_compatible_connector_enabled",
+          "llm_default_connector_id"
+        ],
+        "title": "AdminPolicyOut",
+        "type": "object"
+      },
+      "AdminPolicyPatch": {
+        "properties": {
+          "clear_default": {
+            "default": false,
+            "title": "Clear Default",
+            "type": "boolean"
+          },
+          "llm_apikey_connectors_enabled": {
+            "anyOf": [
+              {
+                "type": "boolean"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Llm Apikey Connectors Enabled"
+          },
+          "llm_call_log_retention_days": {
+            "anyOf": [
+              {
+                "maximum": 365.0,
+                "minimum": 7.0,
+                "type": "integer"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Llm Call Log Retention Days"
+          },
+          "llm_compatible_connector_enabled": {
+            "anyOf": [
+              {
+                "type": "boolean"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Llm Compatible Connector Enabled"
+          },
+          "llm_default_connector_id": {
+            "anyOf": [
+              {
+                "type": "integer"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Llm Default Connector Id"
+          }
+        },
+        "title": "AdminPolicyPatch",
+        "type": "object"
+      },
+      "AdminUsageOut": {
+        "properties": {
+          "days": {
+            "title": "Days",
+            "type": "integer"
+          },
+          "rows": {
+            "items": {
+              "$ref": "#/components/schemas/UsageRow"
+            },
+            "title": "Rows",
+            "type": "array"
+          }
+        },
+        "required": [
+          "days",
+          "rows"
+        ],
+        "title": "AdminUsageOut",
+        "type": "object"
+      },
       "AdminUserCreate": {
         "properties": {
           "password": {
@@ -341,31 +681,102 @@
         "title": "AdminUserUpdate",
         "type": "object"
       },
-      "BeatportEventSettings": {
-        "description": "Beatport sync settings for an event.",
-        "properties": {
-          "beatport_sync_enabled": {
-            "title": "Beatport Sync Enabled",
-            "type": "boolean"
-          }
-        },
-        "required": [
-          "beatport_sync_enabled"
-        ],
-        "title": "BeatportEventSettings",
-        "type": "object"
-      },
-      "BeatportEventSettingsUpdate": {
-        "description": "Update Beatport sync settings for an event.",
+      "AuditEventRow": {
+        "description": "A single audit-trail row with joined display labels.\n\nNever includes credential material \u2014 only the target connector's\nhuman-readable display name (joined from ``llm_connectors``).",
         "properties": {
-          "beatport_sync_enabled": {
-            "title": "Beatport Sync Enabled",
-            "type": "boolean"
-          }
-        },
-        "required": [
-          "beatport_sync_enabled"
-        ],
+          "actor_user_id": {
+            "title": "Actor User Id",
+            "type": "integer"
+          },
+          "actor_username": {
+            "title": "Actor Username",
+            "type": "string"
+          },
+          "created_at": {
+            "format": "date-time",
+            "title": "Created At",
+            "type": "string"
+          },
+          "event_type": {
+            "title": "Event Type",
+            "type": "string"
+          },
+          "id": {
+            "title": "Id",
+            "type": "integer"
+          },
+          "notes": {
+            "anyOf": [
+              {
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Notes"
+          },
+          "target_connector_display_name": {
+            "anyOf": [
+              {
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Target Connector Display Name"
+          },
+          "target_connector_id": {
+            "anyOf": [
+              {
+                "type": "integer"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Target Connector Id"
+          }
+        },
+        "required": [
+          "actor_user_id",
+          "actor_username",
+          "created_at",
+          "event_type",
+          "id",
+          "notes",
+          "target_connector_display_name",
+          "target_connector_id"
+        ],
+        "title": "AuditEventRow",
+        "type": "object"
+      },
+      "BeatportEventSettings": {
+        "description": "Beatport sync settings for an event.",
+        "properties": {
+          "beatport_sync_enabled": {
+            "title": "Beatport Sync Enabled",
+            "type": "boolean"
+          }
+        },
+        "required": [
+          "beatport_sync_enabled"
+        ],
+        "title": "BeatportEventSettings",
+        "type": "object"
+      },
+      "BeatportEventSettingsUpdate": {
+        "description": "Update Beatport sync settings for an event.",
+        "properties": {
+          "beatport_sync_enabled": {
+            "title": "Beatport Sync Enabled",
+            "type": "boolean"
+          }
+        },
+        "required": [
+          "beatport_sync_enabled"
+        ],
         "title": "BeatportEventSettingsUpdate",
         "type": "object"
       },
@@ -1691,427 +2102,300 @@
         "title": "CollectVoteRequest",
         "type": "object"
       },
-      "DisplaySettingsResponse": {
-        "description": "Response for display settings update.",
+      "ConnectorCreate": {
+        "description": "Provider-agnostic create payload.\n\nField requirements vary by ``connector_type``:\n\n- ``openai_apikey`` / ``anthropic_apikey`` / ``openrouter_apikey`` /\n  ``xai_apikey`` / ``gemini_apikey``: ``api_key`` required; ``base_url``\n  and ``bearer`` are ignored.\n- ``openai_compatible``: ``base_url`` required; ``bearer`` optional;\n  ``api_key`` is ignored.\n- ``bedrock``: ``aws_access_key_id``, ``aws_secret_access_key``,\n  ``aws_region`` and ``aws_model_id`` required; other fields ignored.\n- ``azure_openai``: ``api_key``, ``azure_resource_name``,\n  ``azure_deployment_name`` and ``azure_api_version`` all required.\n\nThe combination is enforced by :meth:`_require_credentials_for_type`.\nSee ``build_create_payload`` in ``services/llm/connector_storage.py``\nfor the full validation flow (including key shape checks).",
         "properties": {
-          "kiosk_display_only": {
-            "default": false,
-            "title": "Kiosk Display Only",
-            "type": "boolean"
-          },
-          "now_playing_auto_hide_minutes": {
-            "default": 10,
-            "title": "Now Playing Auto Hide Minutes",
-            "type": "integer"
-          },
-          "now_playing_hidden": {
-            "title": "Now Playing Hidden",
-            "type": "boolean"
-          },
-          "requests_open": {
-            "default": true,
-            "title": "Requests Open",
-            "type": "boolean"
+          "api_key": {
+            "anyOf": [
+              {
+                "maxLength": 512,
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Api Key"
           },
-          "status": {
-            "default": "ok",
-            "title": "Status",
-            "type": "string"
-          }
-        },
-        "required": [
-          "kiosk_display_only",
-          "now_playing_auto_hide_minutes",
-          "now_playing_hidden",
-          "requests_open",
-          "status"
-        ],
-        "title": "DisplaySettingsResponse",
-        "type": "object"
-      },
-      "DisplaySettingsUpdate": {
-        "description": "Request body for updating display settings.",
-        "properties": {
-          "kiosk_display_only": {
+          "aws_access_key_id": {
             "anyOf": [
               {
-                "type": "boolean"
+                "maxLength": 128,
+                "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Kiosk Display Only"
+            "title": "Aws Access Key Id"
           },
-          "now_playing_auto_hide_minutes": {
+          "aws_model_id": {
             "anyOf": [
               {
-                "maximum": 1440.0,
-                "minimum": 1.0,
-                "type": "integer"
+                "maxLength": 128,
+                "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Now Playing Auto Hide Minutes"
+            "title": "Aws Model Id"
           },
-          "now_playing_hidden": {
+          "aws_region": {
             "anyOf": [
               {
-                "type": "boolean"
+                "maxLength": 64,
+                "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Now Playing Hidden"
+            "title": "Aws Region"
           },
-          "requests_open": {
+          "aws_secret_access_key": {
             "anyOf": [
               {
-                "type": "boolean"
+                "maxLength": 512,
+                "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Requests Open"
-          }
-        },
-        "title": "DisplaySettingsUpdate",
-        "type": "object"
-      },
-      "EnrichPreviewItem": {
-        "properties": {
-          "artist": {
-            "title": "Artist",
-            "type": "string"
+            "title": "Aws Secret Access Key"
           },
-          "source_url": {
+          "azure_api_version": {
             "anyOf": [
               {
+                "maxLength": 40,
                 "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Source Url"
+            "title": "Azure Api Version"
           },
-          "title": {
-            "title": "Title",
-            "type": "string"
-          }
-        },
-        "required": [
-          "title",
-          "artist"
-        ],
-        "title": "EnrichPreviewItem",
-        "type": "object"
-      },
-      "EnrichPreviewRequest": {
-        "properties": {
-          "items": {
-            "items": {
-              "$ref": "#/components/schemas/EnrichPreviewItem"
-            },
-            "title": "Items",
-            "type": "array"
-          }
-        },
-        "required": [
-          "items"
-        ],
-        "title": "EnrichPreviewRequest",
-        "type": "object"
-      },
-      "EnrichPreviewResponse": {
-        "properties": {
-          "results": {
-            "items": {
-              "$ref": "#/components/schemas/EnrichPreviewResult"
-            },
-            "title": "Results",
-            "type": "array"
-          }
-        },
-        "required": [
-          "results"
-        ],
-        "title": "EnrichPreviewResponse",
-        "type": "object"
-      },
-      "EnrichPreviewResult": {
-        "properties": {
-          "artist": {
-            "title": "Artist",
-            "type": "string"
+          "azure_deployment_name": {
+            "anyOf": [
+              {
+                "maxLength": 120,
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Azure Deployment Name"
           },
-          "bpm": {
+          "azure_resource_name": {
             "anyOf": [
               {
-                "type": "integer"
+                "maxLength": 120,
+                "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Bpm"
+            "title": "Azure Resource Name"
           },
-          "genre": {
+          "base_url": {
             "anyOf": [
               {
+                "maxLength": 512,
                 "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Genre"
+            "title": "Base Url"
           },
-          "key": {
+          "bearer": {
             "anyOf": [
               {
+                "maxLength": 512,
                 "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Key"
+            "title": "Bearer"
           },
-          "title": {
-            "title": "Title",
+          "connector_type": {
+            "enum": [
+              "openai_apikey",
+              "anthropic_apikey",
+              "openai_compatible",
+              "openrouter_apikey",
+              "xai_apikey",
+              "bedrock",
+              "azure_openai",
+              "gemini_apikey"
+            ],
+            "title": "Connector Type",
+            "type": "string"
+          },
+          "display_name": {
+            "maxLength": 80,
+            "minLength": 1,
+            "title": "Display Name",
             "type": "string"
+          },
+          "model_hint": {
+            "anyOf": [
+              {
+                "maxLength": 80,
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Model Hint"
           }
         },
         "required": [
-          "artist",
-          "bpm",
-          "genre",
-          "key",
-          "title"
+          "connector_type",
+          "display_name"
         ],
-        "title": "EnrichPreviewResult",
+        "title": "ConnectorCreate",
         "type": "object"
       },
-      "EnsureNameRequest": {
+      "ConnectorCredentialsRotate": {
+        "description": "Rotation payload \u2014 at least one credential field must be supplied.\n\nField semantics mirror :class:`ConnectorCreate`. The actual field required\ndepends on the connector being rotated (validated in ``rotate_credentials``).",
         "properties": {
-          "nickname": {
+          "api_key": {
             "anyOf": [
               {
-                "maxLength": 30,
-                "minLength": 2,
-                "pattern": "^[a-zA-Z0-9 _.-]+$",
+                "maxLength": 512,
                 "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Nickname"
-          }
-        },
-        "title": "EnsureNameRequest",
-        "type": "object"
-      },
-      "EnsureNameResponse": {
-        "properties": {
-          "auto_generated": {
-            "title": "Auto Generated",
-            "type": "boolean"
-          },
-          "nickname": {
-            "title": "Nickname",
-            "type": "string"
-          }
-        },
-        "required": [
-          "auto_generated",
-          "nickname"
-        ],
-        "title": "EnsureNameResponse",
-        "type": "object"
-      },
-      "EventCreate": {
-        "properties": {
-          "expires_hours": {
-            "default": 6,
-            "maximum": 48.0,
-            "minimum": 1.0,
-            "title": "Expires Hours",
-            "type": "integer"
+            "title": "Api Key"
           },
-          "name": {
-            "maxLength": 100,
-            "minLength": 1,
-            "title": "Name",
-            "type": "string"
-          }
-        },
-        "required": [
-          "name"
-        ],
-        "title": "EventCreate",
-        "type": "object"
-      },
-      "EventMusicProfile": {
-        "properties": {
-          "avg_bpm": {
+          "aws_access_key_id": {
             "anyOf": [
               {
-                "type": "number"
+                "maxLength": 128,
+                "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Avg Bpm"
+            "title": "Aws Access Key Id"
           },
-          "bpm_range_high": {
+          "aws_model_id": {
             "anyOf": [
               {
-                "type": "number"
+                "maxLength": 128,
+                "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Bpm Range High"
+            "title": "Aws Model Id"
           },
-          "bpm_range_low": {
+          "aws_region": {
             "anyOf": [
               {
-                "type": "number"
+                "maxLength": 64,
+                "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Bpm Range Low"
-          },
-          "dominant_genres": {
-            "default": [],
-            "items": {
-              "type": "string"
-            },
-            "title": "Dominant Genres",
-            "type": "array"
-          },
-          "dominant_keys": {
-            "default": [],
-            "items": {
-              "type": "string"
-            },
-            "title": "Dominant Keys",
-            "type": "array"
-          },
-          "enriched_count": {
-            "default": 0,
-            "title": "Enriched Count",
-            "type": "integer"
+            "title": "Aws Region"
           },
-          "track_count": {
-            "default": 0,
-            "title": "Track Count",
-            "type": "integer"
-          }
-        },
-        "required": [
-          "avg_bpm",
-          "bpm_range_high",
-          "bpm_range_low",
-          "dominant_genres",
-          "dominant_keys",
-          "enriched_count",
-          "track_count"
-        ],
-        "title": "EventMusicProfile",
-        "type": "object"
-      },
-      "EventOut": {
-        "properties": {
-          "archived_at": {
+          "aws_secret_access_key": {
             "anyOf": [
               {
+                "maxLength": 512,
                 "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Archived At"
+            "title": "Aws Secret Access Key"
           },
-          "banner_colors": {
+          "azure_api_version": {
             "anyOf": [
               {
-                "items": {
-                  "type": "string"
-                },
-                "type": "array"
+                "maxLength": 40,
+                "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Banner Colors"
+            "title": "Azure Api Version"
           },
-          "banner_kiosk_url": {
+          "azure_deployment_name": {
             "anyOf": [
               {
+                "maxLength": 120,
                 "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Banner Kiosk Url"
+            "title": "Azure Deployment Name"
           },
-          "banner_url": {
+          "azure_resource_name": {
             "anyOf": [
               {
+                "maxLength": 120,
                 "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Banner Url"
+            "title": "Azure Resource Name"
           },
-          "beatport_playlist_id": {
+          "base_url": {
             "anyOf": [
               {
+                "maxLength": 512,
                 "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Beatport Playlist Id"
-          },
-          "beatport_sync_enabled": {
-            "default": false,
-            "title": "Beatport Sync Enabled",
-            "type": "boolean"
-          },
-          "code": {
-            "title": "Code",
-            "type": "string"
+            "title": "Base Url"
           },
-          "collect_url": {
+          "bearer": {
             "anyOf": [
               {
+                "maxLength": 512,
                 "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Collect Url"
-          },
-          "collection_opens_at": {
+            "title": "Bearer"
+          }
+        },
+        "title": "ConnectorCredentialsRotate",
+        "type": "object"
+      },
+      "ConnectorOut": {
+        "description": "Public-safe connector view \u2014 never includes the credential blob.",
+        "properties": {
+          "base_url_plain": {
             "anyOf": [
               {
                 "type": "string"
@@ -2120,45 +2404,41 @@
                 "type": "null"
               }
             ],
-            "title": "Collection Opens At"
+            "title": "Base Url Plain"
           },
-          "collection_phase_override": {
-            "anyOf": [
-              {
-                "type": "string"
-              },
-              {
-                "type": "null"
-              }
+          "connector_type": {
+            "enum": [
+              "openai_apikey",
+              "anthropic_apikey",
+              "openai_compatible",
+              "openrouter_apikey",
+              "xai_apikey",
+              "bedrock",
+              "azure_openai",
+              "gemini_apikey"
             ],
-            "title": "Collection Phase Override"
+            "title": "Connector Type",
+            "type": "string"
           },
           "created_at": {
+            "format": "date-time",
             "title": "Created At",
             "type": "string"
           },
-          "expires_at": {
-            "title": "Expires At",
+          "display_name": {
+            "title": "Display Name",
             "type": "string"
           },
-          "frictionless_join": {
-            "default": false,
-            "title": "Frictionless Join",
-            "type": "boolean"
-          },
           "id": {
             "title": "Id",
             "type": "integer"
           },
-          "is_active": {
-            "title": "Is Active",
+          "is_default": {
+            "default": false,
+            "title": "Is Default",
             "type": "boolean"
           },
-          "join_code": {
-            "title": "Join Code",
-            "type": "string"
-          },
-          "join_url": {
+          "last_error": {
             "anyOf": [
               {
                 "type": "string"
@@ -2167,55 +2447,52 @@
                 "type": "null"
               }
             ],
-            "title": "Join Url"
+            "title": "Last Error"
           },
-          "live_starts_at": {
+          "last_health_check_at": {
             "anyOf": [
               {
+                "format": "date-time",
                 "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Live Starts At"
+            "title": "Last Health Check At"
           },
-          "name": {
-            "title": "Name",
-            "type": "string"
-          },
-          "request_count": {
+          "last_health_check_status": {
             "anyOf": [
               {
-                "type": "integer"
+                "enum": [
+                  "ok",
+                  "auth_invalid",
+                  "rate_limited",
+                  "quota_exceeded",
+                  "provider_unavailable",
+                  "error"
+                ],
+                "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Request Count"
-          },
-          "requests_open": {
-            "default": true,
-            "title": "Requests Open",
-            "type": "boolean"
+            "title": "Last Health Check Status"
           },
-          "status": {
+          "last_used_at": {
             "anyOf": [
               {
-                "$ref": "#/components/schemas/EventStatus"
+                "format": "date-time",
+                "type": "string"
               },
               {
                 "type": "null"
               }
-            ]
-          },
-          "submission_cap_per_guest": {
-            "default": 15,
-            "title": "Submission Cap Per Guest",
-            "type": "integer"
+            ],
+            "title": "Last Used At"
           },
-          "tidal_playlist_id": {
+          "model_hint": {
             "anyOf": [
               {
                 "type": "string"
@@ -2224,99 +2501,104 @@
                 "type": "null"
               }
             ],
-            "title": "Tidal Playlist Id"
+            "title": "Model Hint"
           },
-          "tidal_sync_enabled": {
-            "default": false,
-            "title": "Tidal Sync Enabled",
-            "type": "boolean"
+          "monthly_token_cap": {
+            "anyOf": [
+              {
+                "type": "integer"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Monthly Token Cap"
+          },
+          "status": {
+            "enum": [
+              "active",
+              "auth_invalid",
+              "disabled"
+            ],
+            "title": "Status",
+            "type": "string"
+          },
+          "updated_at": {
+            "format": "date-time",
+            "title": "Updated At",
+            "type": "string"
+          },
+          "user_id": {
+            "title": "User Id",
+            "type": "integer"
           }
         },
         "required": [
-          "archived_at",
-          "banner_colors",
-          "banner_kiosk_url",
-          "banner_url",
-          "beatport_playlist_id",
-          "beatport_sync_enabled",
-          "code",
-          "collect_url",
-          "collection_opens_at",
-          "collection_phase_override",
+          "base_url_plain",
+          "connector_type",
           "created_at",
-          "expires_at",
-          "frictionless_join",
+          "display_name",
           "id",
-          "is_active",
-          "join_code",
-          "join_url",
-          "live_starts_at",
-          "name",
-          "request_count",
-          "requests_open",
+          "is_default",
+          "last_error",
+          "last_health_check_at",
+          "last_health_check_status",
+          "last_used_at",
+          "model_hint",
+          "monthly_token_cap",
           "status",
-          "submission_cap_per_guest",
-          "tidal_playlist_id",
-          "tidal_sync_enabled"
+          "updated_at",
+          "user_id"
         ],
-        "title": "EventOut",
+        "title": "ConnectorOut",
         "type": "object"
       },
-      "EventStatus": {
-        "description": "Status of an event based on expiry and archive state.",
-        "enum": [
-          "active",
-          "expired",
-          "archived"
-        ],
-        "title": "EventStatus",
-        "type": "string"
-      },
-      "EventUpdate": {
+      "ConnectorPatch": {
+        "description": "Metadata-only patch (no credential rotation here).",
         "properties": {
-          "expires_at": {
+          "display_name": {
             "anyOf": [
               {
-                "format": "date-time",
+                "maxLength": 80,
+                "minLength": 1,
                 "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Expires At"
+            "title": "Display Name"
           },
-          "frictionless_join": {
+          "model_hint": {
             "anyOf": [
               {
-                "type": "boolean"
+                "maxLength": 80,
+                "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Frictionless Join"
-          },
-          "name": {
+            "title": "Model Hint"
+          }
+        },
+        "title": "ConnectorPatch",
+        "type": "object"
+      },
+      "ConnectorTestResult": {
+        "properties": {
+          "error_code": {
             "anyOf": [
               {
-                "maxLength": 100,
-                "minLength": 1,
                 "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Name"
-          }
-        },
-        "title": "EventUpdate",
-        "type": "object"
-      },
-      "GuestNowPlaying": {
-        "properties": {
-          "album_art_url": {
+            "title": "Error Code"
+          },
+          "message": {
             "anyOf": [
               {
                 "type": "string"
@@ -2325,279 +2607,239 @@
                 "type": "null"
               }
             ],
-            "title": "Album Art Url"
+            "title": "Message"
           },
-          "artist": {
-            "title": "Artist",
-            "type": "string"
+          "ok": {
+            "title": "Ok",
+            "type": "boolean"
+          }
+        },
+        "required": [
+          "error_code",
+          "message",
+          "ok"
+        ],
+        "title": "ConnectorTestResult",
+        "type": "object"
+      },
+      "DisplaySettingsResponse": {
+        "description": "Response for display settings update.",
+        "properties": {
+          "kiosk_display_only": {
+            "default": false,
+            "title": "Kiosk Display Only",
+            "type": "boolean"
           },
-          "source": {
-            "title": "Source",
-            "type": "string"
+          "now_playing_auto_hide_minutes": {
+            "default": 10,
+            "title": "Now Playing Auto Hide Minutes",
+            "type": "integer"
           },
-          "title": {
-            "title": "Title",
+          "now_playing_hidden": {
+            "title": "Now Playing Hidden",
+            "type": "boolean"
+          },
+          "requests_open": {
+            "default": true,
+            "title": "Requests Open",
+            "type": "boolean"
+          },
+          "status": {
+            "default": "ok",
+            "title": "Status",
             "type": "string"
           }
         },
         "required": [
-          "album_art_url",
-          "artist",
-          "source",
-          "title"
+          "kiosk_display_only",
+          "now_playing_auto_hide_minutes",
+          "now_playing_hidden",
+          "requests_open",
+          "status"
         ],
-        "title": "GuestNowPlaying",
+        "title": "DisplaySettingsResponse",
         "type": "object"
       },
-      "GuestRequestInfo": {
+      "DisplaySettingsUpdate": {
+        "description": "Request body for updating display settings.",
         "properties": {
-          "artist": {
-            "title": "Artist",
-            "type": "string"
-          },
-          "artwork_url": {
+          "kiosk_display_only": {
             "anyOf": [
               {
-                "type": "string"
+                "type": "boolean"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Artwork Url"
+            "title": "Kiosk Display Only"
           },
-          "bpm": {
+          "now_playing_auto_hide_minutes": {
             "anyOf": [
               {
+                "maximum": 1440.0,
+                "minimum": 1.0,
                 "type": "integer"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Bpm"
-          },
-          "genre": {
-            "anyOf": [
-              {
-                "type": "string"
-              },
-              {
-                "type": "null"
-              }
-            ],
-            "title": "Genre"
-          },
-          "id": {
-            "title": "Id",
-            "type": "integer"
+            "title": "Now Playing Auto Hide Minutes"
           },
-          "musical_key": {
+          "now_playing_hidden": {
             "anyOf": [
               {
-                "type": "string"
+                "type": "boolean"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Musical Key"
+            "title": "Now Playing Hidden"
           },
-          "nickname": {
+          "requests_open": {
             "anyOf": [
               {
-                "type": "string"
+                "type": "boolean"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Nickname"
+            "title": "Requests Open"
+          }
+        },
+        "title": "DisplaySettingsUpdate",
+        "type": "object"
+      },
+      "DjPolicyOut": {
+        "description": "DJ-readable connector policy \u2014 the non-sensitive subset of the admin\npolicy surface.\n\nLets the settings/ai page fail *closed*: a normal DJ can learn which\nconnector types the admin has enabled (so disallowed providers are hidden\nin the picker) without exposing admin-only fields such as\n``llm_default_connector_id``.\n\n``allowed_connector_types`` is the pre-computed set of connector types a DJ\nmay create given the two toggles, so the frontend doesn't have to hard-code\nthe api-key-vs-compatible mapping.",
+        "properties": {
+          "allowed_connector_types": {
+            "items": {
+              "enum": [
+                "openai_apikey",
+                "anthropic_apikey",
+                "openai_compatible",
+                "openrouter_apikey",
+                "xai_apikey",
+                "bedrock",
+                "azure_openai",
+                "gemini_apikey"
+              ],
+              "type": "string"
+            },
+            "title": "Allowed Connector Types",
+            "type": "array"
           },
-          "requester_verified": {
-            "default": false,
-            "title": "Requester Verified",
+          "llm_apikey_connectors_enabled": {
+            "title": "Llm Apikey Connectors Enabled",
             "type": "boolean"
           },
-          "status": {
-            "enum": [
-              "new",
-              "accepted"
-            ],
-            "title": "Status",
-            "type": "string"
-          },
-          "title": {
-            "title": "Title",
-            "type": "string"
-          },
-          "vote_count": {
-            "default": 0,
-            "title": "Vote Count",
-            "type": "integer"
+          "llm_compatible_connector_enabled": {
+            "title": "Llm Compatible Connector Enabled",
+            "type": "boolean"
           }
         },
         "required": [
-          "artist",
-          "artwork_url",
-          "bpm",
-          "genre",
-          "id",
-          "musical_key",
-          "nickname",
-          "requester_verified",
-          "status",
-          "title",
-          "vote_count"
+          "allowed_connector_types",
+          "llm_apikey_connectors_enabled",
+          "llm_compatible_connector_enabled"
         ],
-        "title": "GuestRequestInfo",
+        "title": "DjPolicyOut",
         "type": "object"
       },
-      "GuestRequestListResponse": {
+      "EnrichPreviewItem": {
         "properties": {
-          "event": {
-            "$ref": "#/components/schemas/PublicEventInfo"
+          "artist": {
+            "title": "Artist",
+            "type": "string"
           },
-          "now_playing": {
+          "source_url": {
             "anyOf": [
               {
-                "$ref": "#/components/schemas/GuestNowPlaying"
+                "type": "string"
               },
               {
                 "type": "null"
               }
-            ]
-          },
-          "requests": {
-            "items": {
-              "$ref": "#/components/schemas/GuestRequestInfo"
-            },
-            "title": "Requests",
-            "type": "array"
+            ],
+            "title": "Source Url"
           },
-          "total": {
-            "default": 0,
-            "title": "Total",
-            "type": "integer"
+          "title": {
+            "title": "Title",
+            "type": "string"
           }
         },
         "required": [
-          "event",
-          "now_playing",
-          "requests",
-          "total"
+          "title",
+          "artist"
         ],
-        "title": "GuestRequestListResponse",
+        "title": "EnrichPreviewItem",
         "type": "object"
       },
-      "HTTPValidationError": {
+      "EnrichPreviewRequest": {
         "properties": {
-          "detail": {
+          "items": {
             "items": {
-              "$ref": "#/components/schemas/ValidationError"
+              "$ref": "#/components/schemas/EnrichPreviewItem"
             },
-            "title": "Detail",
+            "title": "Items",
             "type": "array"
           }
         },
         "required": [
-          "detail"
+          "items"
         ],
-        "title": "HTTPValidationError",
+        "title": "EnrichPreviewRequest",
         "type": "object"
       },
-      "HasRequestedResponse": {
+      "EnrichPreviewResponse": {
         "properties": {
-          "has_requested": {
-            "title": "Has Requested",
-            "type": "boolean"
+          "results": {
+            "items": {
+              "$ref": "#/components/schemas/EnrichPreviewResult"
+            },
+            "title": "Results",
+            "type": "array"
           }
         },
         "required": [
-          "has_requested"
+          "results"
         ],
-        "title": "HasRequestedResponse",
+        "title": "EnrichPreviewResponse",
         "type": "object"
       },
-      "HelpPageSeenRequest": {
+      "EnrichPreviewResult": {
         "properties": {
-          "page": {
-            "maxLength": 100,
-            "minLength": 1,
-            "pattern": "^[a-z0-9-]+$",
-            "title": "Page",
+          "artist": {
+            "title": "Artist",
             "type": "string"
-          }
-        },
-        "required": [
-          "page"
-        ],
-        "title": "HelpPageSeenRequest",
-        "type": "object"
-      },
-      "IdentifyRequest": {
-        "properties": {
-          "fingerprint_components": {
+          },
+          "bpm": {
             "anyOf": [
               {
-                "additionalProperties": true,
-                "type": "object"
+                "type": "integer"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Fingerprint Components"
+            "title": "Bpm"
           },
-          "fingerprint_hash": {
-            "maxLength": 64,
-            "minLength": 8,
-            "title": "Fingerprint Hash",
-            "type": "string"
-          }
-        },
-        "required": [
-          "fingerprint_hash"
-        ],
-        "title": "IdentifyRequest",
-        "type": "object"
-      },
-      "IdentifyResponse": {
-        "properties": {
-          "action": {
-            "enum": [
-              "create",
-              "cookie_hit",
-              "reconcile"
+          "genre": {
+            "anyOf": [
+              {
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
             ],
-            "title": "Action",
-            "type": "string"
-          },
-          "guest_id": {
-            "title": "Guest Id",
-            "type": "integer"
-          },
-          "reconcile_hint": {
-            "default": false,
-            "title": "Reconcile Hint",
-            "type": "boolean"
-          }
-        },
-        "required": [
-          "action",
-          "guest_id",
-          "reconcile_hint"
-        ],
-        "title": "IdentifyResponse",
-        "type": "object"
-      },
-      "IntegrationCheckResponse": {
-        "description": "Response for POST /api/admin/integrations/{service}/check.",
-        "properties": {
-          "capabilities": {
-            "$ref": "#/components/schemas/ServiceCapabilities"
+            "title": "Genre"
           },
-          "error": {
+          "key": {
             "anyOf": [
               {
                 "type": "string"
@@ -2606,279 +2848,160 @@
                 "type": "null"
               }
             ],
-            "title": "Error"
-          },
-          "healthy": {
-            "title": "Healthy",
-            "type": "boolean"
+            "title": "Key"
           },
-          "service": {
-            "title": "Service",
+          "title": {
+            "title": "Title",
             "type": "string"
           }
         },
         "required": [
-          "capabilities",
-          "error",
-          "healthy",
-          "service"
-        ],
-        "title": "IntegrationCheckResponse",
-        "type": "object"
-      },
-      "IntegrationHealthResponse": {
-        "description": "Response for GET /api/admin/integrations.",
-        "properties": {
-          "services": {
-            "items": {
-              "$ref": "#/components/schemas/IntegrationServiceStatus"
-            },
-            "title": "Services",
-            "type": "array"
-          }
-        },
-        "required": [
-          "services"
+          "artist",
+          "bpm",
+          "genre",
+          "key",
+          "title"
         ],
-        "title": "IntegrationHealthResponse",
+        "title": "EnrichPreviewResult",
         "type": "object"
       },
-      "IntegrationServiceStatus": {
-        "description": "Full status for a single integration service.",
+      "EnsureNameRequest": {
         "properties": {
-          "capabilities": {
-            "$ref": "#/components/schemas/ServiceCapabilities"
-          },
-          "configured": {
-            "title": "Configured",
-            "type": "boolean"
-          },
-          "display_name": {
-            "title": "Display Name",
-            "type": "string"
-          },
-          "enabled": {
-            "title": "Enabled",
-            "type": "boolean"
-          },
-          "last_check_error": {
+          "nickname": {
             "anyOf": [
               {
+                "maxLength": 30,
+                "minLength": 2,
+                "pattern": "^[a-zA-Z0-9 _.-]+$",
                 "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Last Check Error"
-          },
-          "service": {
-            "title": "Service",
-            "type": "string"
-          }
-        },
-        "required": [
-          "capabilities",
-          "configured",
-          "display_name",
-          "enabled",
-          "last_check_error",
-          "service"
-        ],
-        "title": "IntegrationServiceStatus",
-        "type": "object"
-      },
-      "IntegrationToggleRequest": {
-        "description": "Request body for PATCH /api/admin/integrations/{service}.",
-        "properties": {
-          "enabled": {
-            "title": "Enabled",
-            "type": "boolean"
+            "title": "Nickname"
           }
         },
-        "required": [
-          "enabled"
-        ],
-        "title": "IntegrationToggleRequest",
+        "title": "EnsureNameRequest",
         "type": "object"
       },
-      "IntegrationToggleResponse": {
-        "description": "Response for PATCH /api/admin/integrations/{service}.",
+      "EnsureNameResponse": {
         "properties": {
-          "enabled": {
-            "title": "Enabled",
+          "auto_generated": {
+            "title": "Auto Generated",
             "type": "boolean"
           },
-          "service": {
-            "title": "Service",
-            "type": "string"
-          }
-        },
-        "required": [
-          "enabled",
-          "service"
-        ],
-        "title": "IntegrationToggleResponse",
-        "type": "object"
-      },
-      "JoinConfigResponse": {
-        "properties": {
-          "frictionless_join": {
-            "title": "Frictionless Join",
-            "type": "boolean"
-          }
-        },
-        "required": [
-          "frictionless_join"
-        ],
-        "title": "JoinConfigResponse",
-        "type": "object"
-      },
-      "KioskAssignRequest": {
-        "description": "Body for reassigning a kiosk to a different event.",
-        "properties": {
-          "event_code": {
-            "maxLength": 10,
-            "minLength": 1,
-            "title": "Event Code",
+          "nickname": {
+            "title": "Nickname",
             "type": "string"
           }
         },
         "required": [
-          "event_code"
+          "auto_generated",
+          "nickname"
         ],
-        "title": "KioskAssignRequest",
+        "title": "EnsureNameResponse",
         "type": "object"
       },
-      "KioskCompletePairingRequest": {
-        "description": "Body for completing a kiosk pairing.",
+      "EventCreate": {
         "properties": {
-          "event_code": {
-            "maxLength": 10,
+          "expires_hours": {
+            "default": 6,
+            "maximum": 48.0,
+            "minimum": 1.0,
+            "title": "Expires Hours",
+            "type": "integer"
+          },
+          "name": {
+            "maxLength": 100,
             "minLength": 1,
-            "title": "Event Code",
+            "title": "Name",
             "type": "string"
           }
         },
         "required": [
-          "event_code"
+          "name"
         ],
-        "title": "KioskCompletePairingRequest",
+        "title": "EventCreate",
         "type": "object"
       },
-      "KioskDisplayResponse": {
+      "EventMusicProfile": {
         "properties": {
-          "accepted_queue": {
-            "items": {
-              "$ref": "#/components/schemas/PublicRequestInfo"
-            },
-            "title": "Accepted Queue",
-            "type": "array"
-          },
-          "banner_colors": {
+          "avg_bpm": {
             "anyOf": [
               {
-                "items": {
-                  "type": "string"
-                },
-                "type": "array"
+                "type": "number"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Banner Colors"
+            "title": "Avg Bpm"
           },
-          "banner_kiosk_url": {
+          "bpm_range_high": {
             "anyOf": [
               {
-                "type": "string"
+                "type": "number"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Banner Kiosk Url"
+            "title": "Bpm Range High"
           },
-          "banner_url": {
+          "bpm_range_low": {
             "anyOf": [
               {
-                "type": "string"
+                "type": "number"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Banner Url"
+            "title": "Bpm Range Low"
           },
-          "event": {
-            "$ref": "#/components/schemas/PublicEventInfo"
+          "dominant_genres": {
+            "default": [],
+            "items": {
+              "type": "string"
+            },
+            "title": "Dominant Genres",
+            "type": "array"
           },
-          "kiosk_display_only": {
-            "default": false,
-            "title": "Kiosk Display Only",
-            "type": "boolean"
-          },
-          "now_playing": {
-            "anyOf": [
-              {
-                "$ref": "#/components/schemas/PublicRequestInfo"
-              },
-              {
-                "type": "null"
-              }
-            ]
-          },
-          "now_playing_hidden": {
-            "title": "Now Playing Hidden",
-            "type": "boolean"
-          },
-          "qr_join_url": {
-            "title": "Qr Join Url",
-            "type": "string"
+          "dominant_keys": {
+            "default": [],
+            "items": {
+              "type": "string"
+            },
+            "title": "Dominant Keys",
+            "type": "array"
           },
-          "requests_open": {
-            "default": true,
-            "title": "Requests Open",
-            "type": "boolean"
+          "enriched_count": {
+            "default": 0,
+            "title": "Enriched Count",
+            "type": "integer"
           },
-          "updated_at": {
-            "format": "date-time",
-            "title": "Updated At",
-            "type": "string"
+          "track_count": {
+            "default": 0,
+            "title": "Track Count",
+            "type": "integer"
           }
         },
         "required": [
-          "accepted_queue",
-          "banner_colors",
-          "banner_kiosk_url",
-          "banner_url",
-          "event",
-          "kiosk_display_only",
-          "now_playing",
-          "now_playing_hidden",
-          "qr_join_url",
-          "requests_open",
-          "updated_at"
+          "avg_bpm",
+          "bpm_range_high",
+          "bpm_range_low",
+          "dominant_genres",
+          "dominant_keys",
+          "enriched_count",
+          "track_count"
         ],
-        "title": "KioskDisplayResponse",
+        "title": "EventMusicProfile",
         "type": "object"
       },
-      "KioskOut": {
-        "description": "Kiosk info for DJ dashboard (no session_token).",
+      "EventOut": {
         "properties": {
-          "event_code": {
-            "anyOf": [
-              {
-                "type": "string"
-              },
-              {
-                "type": "null"
-              }
-            ],
-            "title": "Event Code"
-          },
-          "event_join_code": {
+          "archived_at": {
             "anyOf": [
               {
                 "type": "string"
@@ -2887,36 +3010,34 @@
                 "type": "null"
               }
             ],
-            "title": "Event Join Code"
+            "title": "Archived At"
           },
-          "event_name": {
+          "banner_colors": {
             "anyOf": [
               {
-                "type": "string"
+                "items": {
+                  "type": "string"
+                },
+                "type": "array"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Event Name"
-          },
-          "id": {
-            "title": "Id",
-            "type": "integer"
+            "title": "Banner Colors"
           },
-          "last_seen_at": {
+          "banner_kiosk_url": {
             "anyOf": [
               {
-                "format": "date-time",
                 "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Last Seen At"
+            "title": "Banner Kiosk Url"
           },
-          "name": {
+          "banner_url": {
             "anyOf": [
               {
                 "type": "string"
@@ -2925,85 +3046,29 @@
                 "type": "null"
               }
             ],
-            "title": "Name"
+            "title": "Banner Url"
           },
-          "paired_at": {
+          "beatport_playlist_id": {
             "anyOf": [
               {
-                "format": "date-time",
                 "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Paired At"
-          },
-          "status": {
-            "title": "Status",
-            "type": "string"
-          }
-        },
-        "required": [
-          "event_code",
-          "event_join_code",
-          "event_name",
-          "id",
-          "last_seen_at",
-          "name",
-          "paired_at",
-          "status"
-        ],
-        "title": "KioskOut",
-        "type": "object"
-      },
-      "KioskPairChallengeResponse": {
-        "properties": {
-          "expires_in": {
-            "title": "Expires In",
-            "type": "integer"
+            "title": "Beatport Playlist Id"
           },
-          "nonce": {
-            "title": "Nonce",
-            "type": "string"
-          }
-        },
-        "required": [
-          "expires_in",
-          "nonce"
-        ],
-        "title": "KioskPairChallengeResponse",
-        "type": "object"
-      },
-      "KioskPairResponse": {
-        "description": "Returned when a new kiosk pairing session is created.",
-        "properties": {
-          "expires_at": {
-            "format": "date-time",
-            "title": "Expires At",
-            "type": "string"
+          "beatport_sync_enabled": {
+            "default": false,
+            "title": "Beatport Sync Enabled",
+            "type": "boolean"
           },
-          "pair_code": {
-            "title": "Pair Code",
+          "code": {
+            "title": "Code",
             "type": "string"
           },
-          "session_token": {
-            "title": "Session Token",
-            "type": "string"
-          }
-        },
-        "required": [
-          "expires_at",
-          "pair_code",
-          "session_token"
-        ],
-        "title": "KioskPairResponse",
-        "type": "object"
-      },
-      "KioskPairStatusResponse": {
-        "description": "Returned when polling a pairing code's status.",
-        "properties": {
-          "event_code": {
+          "collect_url": {
             "anyOf": [
               {
                 "type": "string"
@@ -3012,9 +3077,9 @@
                 "type": "null"
               }
             ],
-            "title": "Event Code"
+            "title": "Collect Url"
           },
-          "event_join_code": {
+          "collection_opens_at": {
             "anyOf": [
               {
                 "type": "string"
@@ -3023,9 +3088,9 @@
                 "type": "null"
               }
             ],
-            "title": "Event Join Code"
+            "title": "Collection Opens At"
           },
-          "event_name": {
+          "collection_phase_override": {
             "anyOf": [
               {
                 "type": "string"
@@ -3034,45 +3099,45 @@
                 "type": "null"
               }
             ],
-            "title": "Event Name"
+            "title": "Collection Phase Override"
           },
-          "status": {
-            "title": "Status",
+          "created_at": {
+            "title": "Created At",
             "type": "string"
-          }
-        },
-        "required": [
-          "event_code",
-          "event_join_code",
-          "event_name",
-          "status"
-        ],
-        "title": "KioskPairStatusResponse",
-        "type": "object"
-      },
-      "KioskRenameRequest": {
-        "description": "Body for renaming a kiosk.",
-        "properties": {
-          "name": {
+          },
+          "expires_at": {
+            "title": "Expires At",
+            "type": "string"
+          },
+          "frictionless_join": {
+            "default": false,
+            "title": "Frictionless Join",
+            "type": "boolean"
+          },
+          "id": {
+            "title": "Id",
+            "type": "integer"
+          },
+          "is_active": {
+            "title": "Is Active",
+            "type": "boolean"
+          },
+          "join_code": {
+            "title": "Join Code",
+            "type": "string"
+          },
+          "join_url": {
             "anyOf": [
               {
-                "maxLength": 100,
                 "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Name"
-          }
-        },
-        "title": "KioskRenameRequest",
-        "type": "object"
-      },
-      "KioskSessionResponse": {
-        "description": "Returned when polling a kiosk's current assignment.",
-        "properties": {
-          "event_code": {
+            "title": "Join Url"
+          },
+          "live_starts_at": {
             "anyOf": [
               {
                 "type": "string"
@@ -3081,93 +3146,221 @@
                 "type": "null"
               }
             ],
-            "title": "Event Code"
+            "title": "Live Starts At"
           },
-          "event_join_code": {
+          "name": {
+            "title": "Name",
+            "type": "string"
+          },
+          "request_count": {
             "anyOf": [
               {
-                "type": "string"
+                "type": "integer"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Event Join Code"
+            "title": "Request Count"
           },
-          "event_name": {
-            "anyOf": [
-              {
+          "requests_open": {
+            "default": true,
+            "title": "Requests Open",
+            "type": "boolean"
+          },
+          "status": {
+            "anyOf": [
+              {
+                "$ref": "#/components/schemas/EventStatus"
+              },
+              {
+                "type": "null"
+              }
+            ]
+          },
+          "submission_cap_per_guest": {
+            "default": 15,
+            "title": "Submission Cap Per Guest",
+            "type": "integer"
+          },
+          "tidal_playlist_id": {
+            "anyOf": [
+              {
                 "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Event Name"
+            "title": "Tidal Playlist Id"
           },
-          "status": {
-            "title": "Status",
-            "type": "string"
+          "tidal_sync_enabled": {
+            "default": false,
+            "title": "Tidal Sync Enabled",
+            "type": "boolean"
           }
         },
         "required": [
-          "event_code",
-          "event_join_code",
-          "event_name",
-          "status"
+          "archived_at",
+          "banner_colors",
+          "banner_kiosk_url",
+          "banner_url",
+          "beatport_playlist_id",
+          "beatport_sync_enabled",
+          "code",
+          "collect_url",
+          "collection_opens_at",
+          "collection_phase_override",
+          "created_at",
+          "expires_at",
+          "frictionless_join",
+          "id",
+          "is_active",
+          "join_code",
+          "join_url",
+          "live_starts_at",
+          "name",
+          "request_count",
+          "requests_open",
+          "status",
+          "submission_cap_per_guest",
+          "tidal_playlist_id",
+          "tidal_sync_enabled"
         ],
-        "title": "KioskSessionResponse",
+        "title": "EventOut",
         "type": "object"
       },
-      "LLMPromptRequest": {
+      "EventStatus": {
+        "description": "Status of an event based on expiry and archive state.",
+        "enum": [
+          "active",
+          "expired",
+          "archived"
+        ],
+        "title": "EventStatus",
+        "type": "string"
+      },
+      "EventUpdate": {
         "properties": {
-          "prompt": {
-            "maxLength": 500,
-            "minLength": 3,
-            "title": "Prompt",
+          "expires_at": {
+            "anyOf": [
+              {
+                "format": "date-time",
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Expires At"
+          },
+          "frictionless_join": {
+            "anyOf": [
+              {
+                "type": "boolean"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Frictionless Join"
+          },
+          "name": {
+            "anyOf": [
+              {
+                "maxLength": 100,
+                "minLength": 1,
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Name"
+          }
+        },
+        "title": "EventUpdate",
+        "type": "object"
+      },
+      "FeaturePreferenceOut": {
+        "description": "A single per-feature connector pin (issue #337).",
+        "properties": {
+          "connector_id": {
+            "title": "Connector Id",
+            "type": "integer"
+          },
+          "feature": {
+            "enum": [
+              "recommendation",
+              "set_builder"
+            ],
+            "title": "Feature",
             "type": "string"
           }
         },
         "required": [
-          "prompt"
+          "connector_id",
+          "feature"
         ],
-        "title": "LLMPromptRequest",
+        "title": "FeaturePreferenceOut",
         "type": "object"
       },
-      "LiveJoinCodeResponse": {
-        "description": "Returns the live join_code for an event that has entered the live phase.\n\nGated by require_verified_human so the join_code never leaks to unverified\nbots scraping the collect URL during the collection-to-live transition.",
+      "FeaturePreferenceSet": {
+        "description": "Set/change a per-feature pin. Upsert \u2014 replaces any existing pin.",
         "properties": {
-          "join_code": {
-            "title": "Join Code",
+          "connector_id": {
+            "minimum": 1.0,
+            "title": "Connector Id",
+            "type": "integer"
+          },
+          "feature": {
+            "enum": [
+              "recommendation",
+              "set_builder"
+            ],
+            "title": "Feature",
             "type": "string"
           }
         },
         "required": [
-          "join_code"
+          "feature",
+          "connector_id"
         ],
-        "title": "LiveJoinCodeResponse",
+        "title": "FeaturePreferenceSet",
         "type": "object"
       },
-      "MePreferencesUpdate": {
+      "FeaturePreferencesListOut": {
+        "description": "All of a DJ's per-feature pins + the catalogue of pinnable features.",
         "properties": {
-          "frictionless_join_default": {
-            "title": "Frictionless Join Default",
-            "type": "boolean"
+          "known_features": {
+            "items": {
+              "enum": [
+                "recommendation",
+                "set_builder"
+              ],
+              "type": "string"
+            },
+            "title": "Known Features",
+            "type": "array"
+          },
+          "preferences": {
+            "items": {
+              "$ref": "#/components/schemas/FeaturePreferenceOut"
+            },
+            "title": "Preferences",
+            "type": "array"
           }
         },
         "required": [
-          "frictionless_join_default"
+          "known_features",
+          "preferences"
         ],
-        "title": "MePreferencesUpdate",
+        "title": "FeaturePreferencesListOut",
         "type": "object"
       },
-      "MyRequestInfo": {
+      "GuestNowPlaying": {
         "properties": {
-          "artist": {
-            "title": "Artist",
-            "type": "string"
-          },
-          "artwork_url": {
+          "album_art_url": {
             "anyOf": [
               {
                 "type": "string"
@@ -3176,136 +3369,74 @@
                 "type": "null"
               }
             ],
-            "title": "Artwork Url"
+            "title": "Album Art Url"
           },
-          "created_at": {
-            "format": "date-time",
-            "title": "Created At",
+          "artist": {
+            "title": "Artist",
             "type": "string"
           },
-          "id": {
-            "title": "Id",
-            "type": "integer"
-          },
-          "status": {
-            "enum": [
-              "new",
-              "accepted",
-              "playing",
-              "played",
-              "rejected"
-            ],
-            "title": "Status",
+          "source": {
+            "title": "Source",
             "type": "string"
           },
           "title": {
             "title": "Title",
             "type": "string"
-          },
-          "vote_count": {
-            "default": 0,
-            "title": "Vote Count",
-            "type": "integer"
           }
         },
         "required": [
+          "album_art_url",
           "artist",
-          "artwork_url",
-          "created_at",
-          "id",
-          "status",
-          "title",
-          "vote_count"
-        ],
-        "title": "MyRequestInfo",
-        "type": "object"
-      },
-      "MyRequestsResponse": {
-        "properties": {
-          "requests": {
-            "items": {
-              "$ref": "#/components/schemas/MyRequestInfo"
-            },
-            "title": "Requests",
-            "type": "array"
-          }
-        },
-        "required": [
-          "requests"
+          "source",
+          "title"
         ],
-        "title": "MyRequestsResponse",
+        "title": "GuestNowPlaying",
         "type": "object"
       },
-      "NowPlayingBridgePayload": {
-        "description": "Payload from bridge when a new track starts playing.",
+      "GuestRequestInfo": {
         "properties": {
-          "album": {
+          "artist": {
+            "title": "Artist",
+            "type": "string"
+          },
+          "artwork_url": {
             "anyOf": [
               {
-                "maxLength": 255,
                 "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Album"
-          },
-          "artist": {
-            "maxLength": 255,
-            "minLength": 1,
-            "title": "Artist",
-            "type": "string"
+            "title": "Artwork Url"
           },
-          "deck": {
+          "bpm": {
             "anyOf": [
               {
-                "maxLength": 10,
-                "type": "string"
+                "type": "integer"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Deck"
-          },
-          "event_code": {
-            "maxLength": 10,
-            "minLength": 1,
-            "title": "Event Code",
-            "type": "string"
+            "title": "Bpm"
           },
-          "source": {
+          "genre": {
             "anyOf": [
               {
-                "maxLength": 20,
                 "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Source"
+            "title": "Genre"
           },
-          "title": {
-            "maxLength": 255,
-            "minLength": 1,
-            "title": "Title",
-            "type": "string"
-          }
-        },
-        "required": [
-          "event_code",
-          "title",
-          "artist"
-        ],
-        "title": "NowPlayingBridgePayload",
-        "type": "object"
-      },
-      "NowPlayingResponse": {
-        "description": "Response for current now-playing track.",
-        "properties": {
-          "album": {
+          "id": {
+            "title": "Id",
+            "type": "integer"
+          },
+          "musical_key": {
             "anyOf": [
               {
                 "type": "string"
@@ -3314,9 +3445,9 @@
                 "type": "null"
               }
             ],
-            "title": "Album"
+            "title": "Musical Key"
           },
-          "album_art_url": {
+          "nickname": {
             "anyOf": [
               {
                 "type": "string"
@@ -3325,154 +3456,192 @@
                 "type": "null"
               }
             ],
-            "title": "Album Art Url"
-          },
-          "artist": {
-            "title": "Artist",
-            "type": "string"
+            "title": "Nickname"
           },
-          "bridge_connected": {
+          "requester_verified": {
             "default": false,
-            "title": "Bridge Connected",
+            "title": "Requester Verified",
             "type": "boolean"
           },
-          "matched_request_id": {
-            "anyOf": [
-              {
-                "type": "integer"
-              },
-              {
-                "type": "null"
-              }
-            ],
-            "title": "Matched Request Id"
-          },
-          "source": {
-            "title": "Source",
-            "type": "string"
-          },
-          "spotify_uri": {
-            "anyOf": [
-              {
-                "type": "string"
-              },
-              {
-                "type": "null"
-              }
+          "status": {
+            "enum": [
+              "new",
+              "accepted"
             ],
-            "title": "Spotify Uri"
-          },
-          "started_at": {
-            "title": "Started At",
+            "title": "Status",
             "type": "string"
           },
           "title": {
             "title": "Title",
             "type": "string"
+          },
+          "vote_count": {
+            "default": 0,
+            "title": "Vote Count",
+            "type": "integer"
           }
         },
         "required": [
-          "album",
-          "album_art_url",
           "artist",
-          "bridge_connected",
-          "matched_request_id",
-          "source",
-          "spotify_uri",
-          "started_at",
-          "title"
+          "artwork_url",
+          "bpm",
+          "genre",
+          "id",
+          "musical_key",
+          "nickname",
+          "requester_verified",
+          "status",
+          "title",
+          "vote_count"
         ],
-        "title": "NowPlayingResponse",
+        "title": "GuestRequestInfo",
         "type": "object"
       },
-      "PaginatedResponse": {
+      "GuestRequestListResponse": {
         "properties": {
-          "items": {
-            "items": {},
-            "title": "Items",
-            "type": "array"
+          "event": {
+            "$ref": "#/components/schemas/PublicEventInfo"
           },
-          "limit": {
-            "title": "Limit",
-            "type": "integer"
+          "now_playing": {
+            "anyOf": [
+              {
+                "$ref": "#/components/schemas/GuestNowPlaying"
+              },
+              {
+                "type": "null"
+              }
+            ]
           },
-          "page": {
-            "title": "Page",
-            "type": "integer"
+          "requests": {
+            "items": {
+              "$ref": "#/components/schemas/GuestRequestInfo"
+            },
+            "title": "Requests",
+            "type": "array"
           },
           "total": {
+            "default": 0,
             "title": "Total",
             "type": "integer"
           }
         },
         "required": [
-          "items",
-          "limit",
-          "page",
+          "event",
+          "now_playing",
+          "requests",
           "total"
         ],
-        "title": "PaginatedResponse",
+        "title": "GuestRequestListResponse",
         "type": "object"
       },
-      "PendingReviewResponse": {
+      "HTTPValidationError": {
         "properties": {
-          "requests": {
+          "detail": {
             "items": {
-              "$ref": "#/components/schemas/PendingReviewRow"
+              "$ref": "#/components/schemas/ValidationError"
             },
-            "title": "Requests",
+            "title": "Detail",
             "type": "array"
-          },
-          "total": {
-            "title": "Total",
-            "type": "integer"
           }
         },
         "required": [
-          "requests",
-          "total"
+          "detail"
         ],
-        "title": "PendingReviewResponse",
+        "title": "HTTPValidationError",
         "type": "object"
       },
-      "PendingReviewRow": {
+      "HasRequestedResponse": {
         "properties": {
-          "artist": {
-            "title": "Artist",
+          "has_requested": {
+            "title": "Has Requested",
+            "type": "boolean"
+          }
+        },
+        "required": [
+          "has_requested"
+        ],
+        "title": "HasRequestedResponse",
+        "type": "object"
+      },
+      "HelpPageSeenRequest": {
+        "properties": {
+          "page": {
+            "maxLength": 100,
+            "minLength": 1,
+            "pattern": "^[a-z0-9-]+$",
+            "title": "Page",
             "type": "string"
-          },
-          "artwork_url": {
+          }
+        },
+        "required": [
+          "page"
+        ],
+        "title": "HelpPageSeenRequest",
+        "type": "object"
+      },
+      "IdentifyRequest": {
+        "properties": {
+          "fingerprint_components": {
             "anyOf": [
               {
-                "type": "string"
+                "additionalProperties": true,
+                "type": "object"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Artwork Url"
+            "title": "Fingerprint Components"
           },
-          "created_at": {
-            "format": "date-time",
-            "title": "Created At",
+          "fingerprint_hash": {
+            "maxLength": 64,
+            "minLength": 8,
+            "title": "Fingerprint Hash",
+            "type": "string"
+          }
+        },
+        "required": [
+          "fingerprint_hash"
+        ],
+        "title": "IdentifyRequest",
+        "type": "object"
+      },
+      "IdentifyResponse": {
+        "properties": {
+          "action": {
+            "enum": [
+              "create",
+              "cookie_hit",
+              "reconcile"
+            ],
+            "title": "Action",
             "type": "string"
           },
-          "id": {
-            "title": "Id",
+          "guest_id": {
+            "title": "Guest Id",
             "type": "integer"
           },
-          "nickname": {
-            "anyOf": [
-              {
-                "type": "string"
-              },
-              {
-                "type": "null"
-              }
-            ],
-            "title": "Nickname"
+          "reconcile_hint": {
+            "default": false,
+            "title": "Reconcile Hint",
+            "type": "boolean"
+          }
+        },
+        "required": [
+          "action",
+          "guest_id",
+          "reconcile_hint"
+        ],
+        "title": "IdentifyResponse",
+        "type": "object"
+      },
+      "IntegrationCheckResponse": {
+        "description": "Response for POST /api/admin/integrations/{service}/check.",
+        "properties": {
+          "capabilities": {
+            "$ref": "#/components/schemas/ServiceCapabilities"
           },
-          "note": {
+          "error": {
             "anyOf": [
               {
                 "type": "string"
@@ -3481,106 +3650,62 @@
                 "type": "null"
               }
             ],
-            "title": "Note"
+            "title": "Error"
           },
-          "song_title": {
-            "title": "Song Title",
-            "type": "string"
+          "healthy": {
+            "title": "Healthy",
+            "type": "boolean"
           },
-          "status": {
-            "enum": [
-              "new",
-              "accepted",
-              "playing",
-              "played",
-              "rejected"
-            ],
-            "title": "Status",
+          "service": {
+            "title": "Service",
             "type": "string"
-          },
-          "vote_count": {
-            "title": "Vote Count",
-            "type": "integer"
           }
         },
         "required": [
-          "artist",
-          "artwork_url",
-          "created_at",
-          "id",
-          "nickname",
-          "note",
-          "song_title",
-          "status",
-          "vote_count"
+          "capabilities",
+          "error",
+          "healthy",
+          "service"
         ],
-        "title": "PendingReviewRow",
+        "title": "IntegrationCheckResponse",
         "type": "object"
       },
-      "PlayHistoryEntry": {
-        "description": "Single entry in play history.",
+      "IntegrationHealthResponse": {
+        "description": "Response for GET /api/admin/integrations.",
         "properties": {
-          "album": {
-            "anyOf": [
-              {
-                "type": "string"
-              },
-              {
-                "type": "null"
-              }
-            ],
-            "title": "Album"
+          "services": {
+            "items": {
+              "$ref": "#/components/schemas/IntegrationServiceStatus"
+            },
+            "title": "Services",
+            "type": "array"
+          }
+        },
+        "required": [
+          "services"
+        ],
+        "title": "IntegrationHealthResponse",
+        "type": "object"
+      },
+      "IntegrationServiceStatus": {
+        "description": "Full status for a single integration service.",
+        "properties": {
+          "capabilities": {
+            "$ref": "#/components/schemas/ServiceCapabilities"
           },
-          "album_art_url": {
-            "anyOf": [
-              {
-                "type": "string"
-              },
-              {
-                "type": "null"
-              }
-            ],
-            "title": "Album Art Url"
+          "configured": {
+            "title": "Configured",
+            "type": "boolean"
           },
-          "artist": {
-            "title": "Artist",
+          "display_name": {
+            "title": "Display Name",
             "type": "string"
           },
-          "ended_at": {
-            "anyOf": [
-              {
-                "type": "string"
-              },
-              {
-                "type": "null"
-              }
-            ],
-            "title": "Ended At"
-          },
-          "id": {
-            "title": "Id",
-            "type": "integer"
-          },
-          "matched_request_id": {
-            "anyOf": [
-              {
-                "type": "integer"
-              },
-              {
-                "type": "null"
-              }
-            ],
-            "title": "Matched Request Id"
-          },
-          "play_order": {
-            "title": "Play Order",
-            "type": "integer"
-          },
-          "source": {
-            "title": "Source",
-            "type": "string"
+          "enabled": {
+            "title": "Enabled",
+            "type": "boolean"
           },
-          "spotify_uri": {
+          "last_check_error": {
             "anyOf": [
               {
                 "type": "string"
@@ -3589,76 +3714,111 @@
                 "type": "null"
               }
             ],
-            "title": "Spotify Uri"
+            "title": "Last Check Error"
           },
-          "started_at": {
-            "title": "Started At",
+          "service": {
+            "title": "Service",
             "type": "string"
+          }
+        },
+        "required": [
+          "capabilities",
+          "configured",
+          "display_name",
+          "enabled",
+          "last_check_error",
+          "service"
+        ],
+        "title": "IntegrationServiceStatus",
+        "type": "object"
+      },
+      "IntegrationToggleRequest": {
+        "description": "Request body for PATCH /api/admin/integrations/{service}.",
+        "properties": {
+          "enabled": {
+            "title": "Enabled",
+            "type": "boolean"
+          }
+        },
+        "required": [
+          "enabled"
+        ],
+        "title": "IntegrationToggleRequest",
+        "type": "object"
+      },
+      "IntegrationToggleResponse": {
+        "description": "Response for PATCH /api/admin/integrations/{service}.",
+        "properties": {
+          "enabled": {
+            "title": "Enabled",
+            "type": "boolean"
           },
-          "title": {
-            "title": "Title",
+          "service": {
+            "title": "Service",
             "type": "string"
           }
         },
         "required": [
-          "album",
-          "album_art_url",
-          "artist",
-          "ended_at",
-          "id",
-          "matched_request_id",
-          "play_order",
-          "source",
-          "spotify_uri",
-          "started_at",
-          "title"
+          "enabled",
+          "service"
         ],
-        "title": "PlayHistoryEntry",
+        "title": "IntegrationToggleResponse",
         "type": "object"
       },
-      "PlayHistoryResponse": {
-        "description": "Paginated response for play history.",
+      "JoinConfigResponse": {
         "properties": {
-          "items": {
-            "items": {
-              "$ref": "#/components/schemas/PlayHistoryEntry"
-            },
-            "title": "Items",
-            "type": "array"
-          },
-          "total": {
-            "title": "Total",
-            "type": "integer"
+          "frictionless_join": {
+            "title": "Frictionless Join",
+            "type": "boolean"
           }
         },
         "required": [
-          "items",
-          "total"
+          "frictionless_join"
         ],
-        "title": "PlayHistoryResponse",
+        "title": "JoinConfigResponse",
         "type": "object"
       },
-      "PublicEventInfo": {
+      "KioskAssignRequest": {
+        "description": "Body for reassigning a kiosk to a different event.",
         "properties": {
-          "code": {
-            "title": "Code",
+          "event_code": {
+            "maxLength": 10,
+            "minLength": 1,
+            "title": "Event Code",
             "type": "string"
-          },
-          "name": {
-            "title": "Name",
+          }
+        },
+        "required": [
+          "event_code"
+        ],
+        "title": "KioskAssignRequest",
+        "type": "object"
+      },
+      "KioskCompletePairingRequest": {
+        "description": "Body for completing a kiosk pairing.",
+        "properties": {
+          "event_code": {
+            "maxLength": 10,
+            "minLength": 1,
+            "title": "Event Code",
             "type": "string"
           }
         },
         "required": [
-          "code",
-          "name"
+          "event_code"
         ],
-        "title": "PublicEventInfo",
+        "title": "KioskCompletePairingRequest",
         "type": "object"
       },
-      "PublicEventResponse": {
-        "description": "Guest-safe live-event projection. Deliberately omits event.id and any\nDJ-only fields (see #382 serializer hygiene).",
+      "KioskDisplayResponse": {
         "properties": {
+          "accepted_queue": {
+            "items": {
+              "$ref": "#/components/schemas/PublicRequestInfo"
+            },
+            "title": "Accepted Queue",
+            "type": "array"
+          },
           "banner_colors": {
             "anyOf": [
               {
@@ -3673,6 +3833,17 @@
             ],
             "title": "Banner Colors"
           },
+          "banner_kiosk_url": {
+            "anyOf": [
+              {
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Banner Kiosk Url"
+          },
           "banner_url": {
             "anyOf": [
               {
@@ -3684,57 +3855,63 @@
             ],
             "title": "Banner Url"
           },
-          "collection_code": {
-            "title": "Collection Code",
-            "type": "string"
-          },
-          "frictionless_join": {
-            "title": "Frictionless Join",
-            "type": "boolean"
+          "event": {
+            "$ref": "#/components/schemas/PublicEventInfo"
           },
-          "name": {
-            "title": "Name",
-            "type": "string"
+          "kiosk_display_only": {
+            "default": false,
+            "title": "Kiosk Display Only",
+            "type": "boolean"
           },
-          "phase": {
-            "enum": [
-              "pre_announce",
-              "collection",
-              "live",
-              "closed"
-            ],
-            "title": "Phase",
+          "now_playing": {
+            "anyOf": [
+              {
+                "$ref": "#/components/schemas/PublicRequestInfo"
+              },
+              {
+                "type": "null"
+              }
+            ]
+          },
+          "now_playing_hidden": {
+            "title": "Now Playing Hidden",
+            "type": "boolean"
+          },
+          "qr_join_url": {
+            "title": "Qr Join Url",
             "type": "string"
           },
           "requests_open": {
+            "default": true,
             "title": "Requests Open",
             "type": "boolean"
           },
-          "submission_cap_per_guest": {
-            "title": "Submission Cap Per Guest",
-            "type": "integer"
+          "updated_at": {
+            "format": "date-time",
+            "title": "Updated At",
+            "type": "string"
           }
         },
         "required": [
+          "accepted_queue",
           "banner_colors",
+          "banner_kiosk_url",
           "banner_url",
-          "collection_code",
-          "frictionless_join",
-          "name",
-          "phase",
+          "event",
+          "kiosk_display_only",
+          "now_playing",
+          "now_playing_hidden",
+          "qr_join_url",
           "requests_open",
-          "submission_cap_per_guest"
+          "updated_at"
         ],
-        "title": "PublicEventResponse",
+        "title": "KioskDisplayResponse",
         "type": "object"
       },
-      "PublicRequestInfo": {
+      "KioskOut": {
+        "description": "Kiosk info for DJ dashboard (no session_token).",
         "properties": {
-          "artist": {
-            "title": "Artist",
-            "type": "string"
-          },
-          "artwork_url": {
+          "event_code": {
             "anyOf": [
               {
                 "type": "string"
@@ -3743,20 +3920,20 @@
                 "type": "null"
               }
             ],
-            "title": "Artwork Url"
+            "title": "Event Code"
           },
-          "bpm": {
+          "event_join_code": {
             "anyOf": [
               {
-                "type": "integer"
+                "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Bpm"
+            "title": "Event Join Code"
           },
-          "genre": {
+          "event_name": {
             "anyOf": [
               {
                 "type": "string"
@@ -3765,24 +3942,25 @@
                 "type": "null"
               }
             ],
-            "title": "Genre"
+            "title": "Event Name"
           },
           "id": {
             "title": "Id",
             "type": "integer"
           },
-          "musical_key": {
+          "last_seen_at": {
             "anyOf": [
               {
+                "format": "date-time",
                 "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Musical Key"
+            "title": "Last Seen At"
           },
-          "nickname": {
+          "name": {
             "anyOf": [
               {
                 "type": "string"
@@ -3791,120 +3969,85 @@
                 "type": "null"
               }
             ],
-            "title": "Nickname"
+            "title": "Name"
           },
-          "requester_verified": {
-            "default": false,
-            "title": "Requester Verified",
-            "type": "boolean"
+          "paired_at": {
+            "anyOf": [
+              {
+                "format": "date-time",
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Paired At"
           },
-          "title": {
-            "title": "Title",
+          "status": {
+            "title": "Status",
             "type": "string"
-          },
-          "vote_count": {
-            "default": 0,
-            "title": "Vote Count",
-            "type": "integer"
           }
         },
         "required": [
-          "artist",
-          "artwork_url",
-          "bpm",
-          "genre",
+          "event_code",
+          "event_join_code",
+          "event_name",
           "id",
-          "musical_key",
-          "nickname",
-          "requester_verified",
-          "title",
-          "vote_count"
+          "last_seen_at",
+          "name",
+          "paired_at",
+          "status"
         ],
-        "title": "PublicRequestInfo",
+        "title": "KioskOut",
         "type": "object"
       },
-      "PublicSettings": {
+      "KioskPairChallengeResponse": {
         "properties": {
-          "registration_enabled": {
-            "title": "Registration Enabled",
-            "type": "boolean"
+          "expires_in": {
+            "title": "Expires In",
+            "type": "integer"
           },
-          "turnstile_site_key": {
-            "title": "Turnstile Site Key",
+          "nonce": {
+            "title": "Nonce",
             "type": "string"
           }
         },
         "required": [
-          "registration_enabled",
-          "turnstile_site_key"
+          "expires_in",
+          "nonce"
         ],
-        "title": "PublicSettings",
+        "title": "KioskPairChallengeResponse",
         "type": "object"
       },
-      "RecommendationResponse": {
+      "KioskPairResponse": {
+        "description": "Returned when a new kiosk pairing session is created.",
         "properties": {
-          "llm_available": {
-            "default": false,
-            "title": "Llm Available",
-            "type": "boolean"
-          },
-          "profile": {
-            "$ref": "#/components/schemas/EventMusicProfile"
-          },
-          "services_used": {
-            "default": [],
-            "items": {
-              "type": "string"
-            },
-            "title": "Services Used",
-            "type": "array"
+          "expires_at": {
+            "format": "date-time",
+            "title": "Expires At",
+            "type": "string"
           },
-          "suggestions": {
-            "default": [],
-            "items": {
-              "$ref": "#/components/schemas/RecommendedTrack"
-            },
-            "title": "Suggestions",
-            "type": "array"
+          "pair_code": {
+            "title": "Pair Code",
+            "type": "string"
           },
-          "total_candidates_searched": {
-            "default": 0,
-            "title": "Total Candidates Searched",
-            "type": "integer"
+          "session_token": {
+            "title": "Session Token",
+            "type": "string"
           }
         },
         "required": [
-          "llm_available",
-          "profile",
-          "services_used",
-          "suggestions",
-          "total_candidates_searched"
+          "expires_at",
+          "pair_code",
+          "session_token"
         ],
-        "title": "RecommendationResponse",
+        "title": "KioskPairResponse",
         "type": "object"
       },
-      "RecommendedTrack": {
+      "KioskPairStatusResponse": {
+        "description": "Returned when polling a pairing code's status.",
         "properties": {
-          "artist": {
-            "title": "Artist",
-            "type": "string"
-          },
-          "bpm": {
-            "anyOf": [
-              {
-                "type": "number"
-              },
-              {
-                "type": "null"
-              }
-            ],
-            "title": "Bpm"
-          },
-          "bpm_score": {
-            "title": "Bpm Score",
-            "type": "number"
-          },
-          "cover_url": {
+          "event_code": {
             "anyOf": [
               {
                 "type": "string"
@@ -3913,20 +4056,20 @@
                 "type": "null"
               }
             ],
-            "title": "Cover Url"
+            "title": "Event Code"
           },
-          "duration_seconds": {
+          "event_join_code": {
             "anyOf": [
               {
-                "type": "integer"
+                "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Duration Seconds"
+            "title": "Event Join Code"
           },
-          "genre": {
+          "event_name": {
             "anyOf": [
               {
                 "type": "string"
@@ -3935,45 +4078,56 @@
                 "type": "null"
               }
             ],
-            "title": "Genre"
-          },
-          "genre_score": {
-            "title": "Genre Score",
-            "type": "number"
+            "title": "Event Name"
           },
-          "key": {
+          "status": {
+            "title": "Status",
+            "type": "string"
+          }
+        },
+        "required": [
+          "event_code",
+          "event_join_code",
+          "event_name",
+          "status"
+        ],
+        "title": "KioskPairStatusResponse",
+        "type": "object"
+      },
+      "KioskRenameRequest": {
+        "description": "Body for renaming a kiosk.",
+        "properties": {
+          "name": {
             "anyOf": [
               {
+                "maxLength": 100,
                 "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Key"
-          },
-          "key_score": {
-            "title": "Key Score",
-            "type": "number"
-          },
-          "mb_verified": {
-            "default": false,
-            "title": "Mb Verified",
-            "type": "boolean"
-          },
-          "score": {
-            "title": "Score",
-            "type": "number"
-          },
-          "source": {
-            "title": "Source",
-            "type": "string"
-          },
-          "title": {
-            "title": "Title",
-            "type": "string"
+            "title": "Name"
+          }
+        },
+        "title": "KioskRenameRequest",
+        "type": "object"
+      },
+      "KioskSessionResponse": {
+        "description": "Returned when polling a kiosk's current assignment.",
+        "properties": {
+          "event_code": {
+            "anyOf": [
+              {
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Event Code"
           },
-          "track_id": {
+          "event_join_code": {
             "anyOf": [
               {
                 "type": "string"
@@ -3982,9 +4136,9 @@
                 "type": "null"
               }
             ],
-            "title": "Track Id"
+            "title": "Event Join Code"
           },
-          "url": {
+          "event_name": {
             "anyOf": [
               {
                 "type": "string"
@@ -3993,80 +4147,73 @@
                 "type": "null"
               }
             ],
-            "title": "Url"
+            "title": "Event Name"
+          },
+          "status": {
+            "title": "Status",
+            "type": "string"
           }
         },
         "required": [
-          "artist",
-          "bpm",
-          "bpm_score",
-          "cover_url",
-          "duration_seconds",
-          "genre",
-          "genre_score",
-          "key",
-          "key_score",
-          "mb_verified",
-          "score",
-          "source",
-          "title",
-          "track_id",
-          "url"
+          "event_code",
+          "event_join_code",
+          "event_name",
+          "status"
         ],
-        "title": "RecommendedTrack",
+        "title": "KioskSessionResponse",
         "type": "object"
       },
-      "RegisterRequest": {
+      "LLMPromptRequest": {
         "properties": {
-          "confirm_password": {
-            "title": "Confirm Password",
-            "type": "string"
-          },
-          "email": {
-            "format": "email",
-            "title": "Email",
-            "type": "string"
-          },
-          "password": {
-            "maxLength": 128,
-            "minLength": 8,
-            "title": "Password",
-            "type": "string"
-          },
-          "turnstile_token": {
-            "default": "",
-            "maxLength": 4096,
-            "title": "Turnstile Token",
-            "type": "string"
-          },
-          "username": {
-            "maxLength": 50,
+          "prompt": {
+            "maxLength": 500,
             "minLength": 3,
-            "title": "Username",
+            "title": "Prompt",
             "type": "string"
           }
         },
         "required": [
-          "username",
-          "email",
-          "password",
-          "confirm_password"
+          "prompt"
         ],
-        "title": "RegisterRequest",
+        "title": "LLMPromptRequest",
         "type": "object"
       },
-      "RequestCreate": {
+      "LiveJoinCodeResponse": {
+        "description": "Returns the live join_code for an event that has entered the live phase.\n\nGated by require_verified_human so the join_code never leaks to unverified\nbots scraping the collect URL during the collection-to-live transition.",
+        "properties": {
+          "join_code": {
+            "title": "Join Code",
+            "type": "string"
+          }
+        },
+        "required": [
+          "join_code"
+        ],
+        "title": "LiveJoinCodeResponse",
+        "type": "object"
+      },
+      "MePreferencesUpdate": {
+        "properties": {
+          "frictionless_join_default": {
+            "title": "Frictionless Join Default",
+            "type": "boolean"
+          }
+        },
+        "required": [
+          "frictionless_join_default"
+        ],
+        "title": "MePreferencesUpdate",
+        "type": "object"
+      },
+      "MyRequestInfo": {
         "properties": {
           "artist": {
-            "maxLength": 255,
-            "minLength": 1,
             "title": "Artist",
             "type": "string"
           },
           "artwork_url": {
             "anyOf": [
               {
-                "maxLength": 500,
                 "type": "string"
               },
               {
@@ -4075,32 +4222,104 @@
             ],
             "title": "Artwork Url"
           },
-          "bpm": {
+          "created_at": {
+            "format": "date-time",
+            "title": "Created At",
+            "type": "string"
+          },
+          "id": {
+            "title": "Id",
+            "type": "integer"
+          },
+          "status": {
+            "enum": [
+              "new",
+              "accepted",
+              "playing",
+              "played",
+              "rejected"
+            ],
+            "title": "Status",
+            "type": "string"
+          },
+          "title": {
+            "title": "Title",
+            "type": "string"
+          },
+          "vote_count": {
+            "default": 0,
+            "title": "Vote Count",
+            "type": "integer"
+          }
+        },
+        "required": [
+          "artist",
+          "artwork_url",
+          "created_at",
+          "id",
+          "status",
+          "title",
+          "vote_count"
+        ],
+        "title": "MyRequestInfo",
+        "type": "object"
+      },
+      "MyRequestsResponse": {
+        "properties": {
+          "requests": {
+            "items": {
+              "$ref": "#/components/schemas/MyRequestInfo"
+            },
+            "title": "Requests",
+            "type": "array"
+          }
+        },
+        "required": [
+          "requests"
+        ],
+        "title": "MyRequestsResponse",
+        "type": "object"
+      },
+      "NowPlayingBridgePayload": {
+        "description": "Payload from bridge when a new track starts playing.",
+        "properties": {
+          "album": {
             "anyOf": [
               {
-                "maximum": 999.0,
-                "minimum": 1.0,
-                "type": "number"
+                "maxLength": 255,
+                "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Bpm"
+            "title": "Album"
           },
-          "genre": {
+          "artist": {
+            "maxLength": 255,
+            "minLength": 1,
+            "title": "Artist",
+            "type": "string"
+          },
+          "deck": {
             "anyOf": [
               {
-                "maxLength": 100,
+                "maxLength": 10,
                 "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Genre"
+            "title": "Deck"
           },
-          "musical_key": {
+          "event_code": {
+            "maxLength": 10,
+            "minLength": 1,
+            "title": "Event Code",
+            "type": "string"
+          },
+          "source": {
             "anyOf": [
               {
                 "maxLength": 20,
@@ -4110,96 +4329,157 @@
                 "type": "null"
               }
             ],
-            "title": "Musical Key"
+            "title": "Source"
           },
-          "nickname": {
+          "title": {
+            "maxLength": 255,
+            "minLength": 1,
+            "title": "Title",
+            "type": "string"
+          }
+        },
+        "required": [
+          "event_code",
+          "title",
+          "artist"
+        ],
+        "title": "NowPlayingBridgePayload",
+        "type": "object"
+      },
+      "NowPlayingResponse": {
+        "description": "Response for current now-playing track.",
+        "properties": {
+          "album": {
             "anyOf": [
               {
-                "maxLength": 30,
                 "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Nickname"
+            "title": "Album"
           },
-          "note": {
+          "album_art_url": {
             "anyOf": [
               {
-                "maxLength": 500,
                 "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Note"
+            "title": "Album Art Url"
           },
-          "raw_search_query": {
+          "artist": {
+            "title": "Artist",
+            "type": "string"
+          },
+          "bridge_connected": {
+            "default": false,
+            "title": "Bridge Connected",
+            "type": "boolean"
+          },
+          "matched_request_id": {
             "anyOf": [
               {
-                "maxLength": 200,
-                "type": "string"
+                "type": "integer"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Raw Search Query"
+            "title": "Matched Request Id"
           },
           "source": {
-            "$ref": "#/components/schemas/RequestSource",
-            "default": "manual"
+            "title": "Source",
+            "type": "string"
           },
-          "source_url": {
+          "spotify_uri": {
             "anyOf": [
               {
-                "maxLength": 500,
                 "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Source Url"
+            "title": "Spotify Uri"
+          },
+          "started_at": {
+            "title": "Started At",
+            "type": "string"
           },
           "title": {
-            "maxLength": 255,
-            "minLength": 1,
             "title": "Title",
             "type": "string"
           }
         },
         "required": [
+          "album",
+          "album_art_url",
           "artist",
+          "bridge_connected",
+          "matched_request_id",
+          "source",
+          "spotify_uri",
+          "started_at",
           "title"
         ],
-        "title": "RequestCreate",
+        "title": "NowPlayingResponse",
         "type": "object"
       },
-      "RequestEmailChangeRequest": {
+      "PaginatedResponse": {
         "properties": {
-          "current_password": {
-            "maxLength": 128,
-            "minLength": 1,
-            "title": "Current Password",
-            "type": "string"
+          "items": {
+            "items": {},
+            "title": "Items",
+            "type": "array"
           },
-          "new_email": {
-            "format": "email",
-            "title": "New Email",
-            "type": "string"
+          "limit": {
+            "title": "Limit",
+            "type": "integer"
+          },
+          "page": {
+            "title": "Page",
+            "type": "integer"
+          },
+          "total": {
+            "title": "Total",
+            "type": "integer"
           }
         },
         "required": [
-          "current_password",
-          "new_email"
+          "items",
+          "limit",
+          "page",
+          "total"
         ],
-        "title": "RequestEmailChangeRequest",
+        "title": "PaginatedResponse",
         "type": "object"
       },
-      "RequestOut": {
+      "PendingReviewResponse": {
+        "properties": {
+          "requests": {
+            "items": {
+              "$ref": "#/components/schemas/PendingReviewRow"
+            },
+            "title": "Requests",
+            "type": "array"
+          },
+          "total": {
+            "title": "Total",
+            "type": "integer"
+          }
+        },
+        "required": [
+          "requests",
+          "total"
+        ],
+        "title": "PendingReviewResponse",
+        "type": "object"
+      },
+      "PendingReviewRow": {
         "properties": {
           "artist": {
             "title": "Artist",
@@ -4216,26 +4496,16 @@
             ],
             "title": "Artwork Url"
           },
-          "bpm": {
-            "anyOf": [
-              {
-                "type": "number"
-              },
-              {
-                "type": "null"
-              }
-            ],
-            "title": "Bpm"
-          },
           "created_at": {
+            "format": "date-time",
             "title": "Created At",
             "type": "string"
           },
-          "event_id": {
-            "title": "Event Id",
+          "id": {
+            "title": "Id",
             "type": "integer"
           },
-          "genre": {
+          "nickname": {
             "anyOf": [
               {
                 "type": "string"
@@ -4244,18 +4514,9 @@
                 "type": "null"
               }
             ],
-            "title": "Genre"
-          },
-          "id": {
-            "title": "Id",
-            "type": "integer"
-          },
-          "is_duplicate": {
-            "default": false,
-            "title": "Is Duplicate",
-            "type": "boolean"
+            "title": "Nickname"
           },
-          "musical_key": {
+          "note": {
             "anyOf": [
               {
                 "type": "string"
@@ -4264,9 +4525,46 @@
                 "type": "null"
               }
             ],
-            "title": "Musical Key"
+            "title": "Note"
           },
-          "nickname": {
+          "song_title": {
+            "title": "Song Title",
+            "type": "string"
+          },
+          "status": {
+            "enum": [
+              "new",
+              "accepted",
+              "playing",
+              "played",
+              "rejected"
+            ],
+            "title": "Status",
+            "type": "string"
+          },
+          "vote_count": {
+            "title": "Vote Count",
+            "type": "integer"
+          }
+        },
+        "required": [
+          "artist",
+          "artwork_url",
+          "created_at",
+          "id",
+          "nickname",
+          "note",
+          "song_title",
+          "status",
+          "vote_count"
+        ],
+        "title": "PendingReviewRow",
+        "type": "object"
+      },
+      "PlayHistoryEntry": {
+        "description": "Single entry in play history.",
+        "properties": {
+          "album": {
             "anyOf": [
               {
                 "type": "string"
@@ -4275,9 +4573,9 @@
                 "type": "null"
               }
             ],
-            "title": "Nickname"
+            "title": "Album"
           },
-          "note": {
+          "album_art_url": {
             "anyOf": [
               {
                 "type": "string"
@@ -4286,39 +4584,47 @@
                 "type": "null"
               }
             ],
-            "title": "Note"
+            "title": "Album Art Url"
           },
-          "priority_score": {
+          "artist": {
+            "title": "Artist",
+            "type": "string"
+          },
+          "ended_at": {
             "anyOf": [
               {
-                "type": "number"
+                "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Priority Score"
+            "title": "Ended At"
           },
-          "raw_search_query": {
+          "id": {
+            "title": "Id",
+            "type": "integer"
+          },
+          "matched_request_id": {
             "anyOf": [
               {
-                "type": "string"
+                "type": "integer"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Raw Search Query"
+            "title": "Matched Request Id"
           },
-          "song_title": {
-            "title": "Song Title",
-            "type": "string"
+          "play_order": {
+            "title": "Play Order",
+            "type": "integer"
           },
           "source": {
             "title": "Source",
             "type": "string"
           },
-          "source_url": {
+          "spotify_uri": {
             "anyOf": [
               {
                 "type": "string"
@@ -4327,107 +4633,91 @@
                 "type": "null"
               }
             ],
-            "title": "Source Url"
+            "title": "Spotify Uri"
           },
-          "status": {
-            "title": "Status",
+          "started_at": {
+            "title": "Started At",
             "type": "string"
           },
-          "sync_results_json": {
-            "anyOf": [
-              {
-                "type": "string"
-              },
-              {
-                "type": "null"
-              }
-            ],
-            "title": "Sync Results Json"
-          },
-          "updated_at": {
-            "title": "Updated At",
+          "title": {
+            "title": "Title",
             "type": "string"
-          },
-          "vote_count": {
-            "default": 0,
-            "title": "Vote Count",
-            "type": "integer"
           }
         },
         "required": [
+          "album",
+          "album_art_url",
           "artist",
-          "artwork_url",
-          "bpm",
-          "created_at",
-          "event_id",
-          "genre",
+          "ended_at",
           "id",
-          "is_duplicate",
-          "musical_key",
-          "nickname",
-          "note",
-          "priority_score",
-          "raw_search_query",
-          "song_title",
+          "matched_request_id",
+          "play_order",
           "source",
-          "source_url",
-          "status",
-          "sync_results_json",
-          "updated_at",
-          "vote_count"
-        ],
-        "title": "RequestOut",
-        "type": "object"
-      },
-      "RequestSource": {
-        "enum": [
-          "manual",
-          "musicbrainz",
-          "spotify",
-          "share_link",
-          "tidal",
-          "beatport"
+          "spotify_uri",
+          "started_at",
+          "title"
         ],
-        "title": "RequestSource",
-        "type": "string"
+        "title": "PlayHistoryEntry",
+        "type": "object"
       },
-      "RequestStatus": {
-        "enum": [
-          "new",
-          "accepted",
-          "playing",
-          "played",
-          "rejected"
+      "PlayHistoryResponse": {
+        "description": "Paginated response for play history.",
+        "properties": {
+          "items": {
+            "items": {
+              "$ref": "#/components/schemas/PlayHistoryEntry"
+            },
+            "title": "Items",
+            "type": "array"
+          },
+          "total": {
+            "title": "Total",
+            "type": "integer"
+          }
+        },
+        "required": [
+          "items",
+          "total"
         ],
-        "title": "RequestStatus",
-        "type": "string"
+        "title": "PlayHistoryResponse",
+        "type": "object"
       },
-      "RequestUpdate": {
+      "PublicEventInfo": {
         "properties": {
-          "status": {
-            "$ref": "#/components/schemas/RequestStatus"
+          "code": {
+            "title": "Code",
+            "type": "string"
+          },
+          "name": {
+            "title": "Name",
+            "type": "string"
           }
         },
         "required": [
-          "status"
+          "code",
+          "name"
         ],
-        "title": "RequestUpdate",
+        "title": "PublicEventInfo",
         "type": "object"
       },
-      "SearchResult": {
+      "PublicEventResponse": {
+        "description": "Guest-safe live-event projection. Deliberately omits event.id and any\nDJ-only fields (see #382 serializer hygiene).",
         "properties": {
-          "album": {
+          "banner_colors": {
             "anyOf": [
               {
-                "type": "string"
+                "items": {
+                  "type": "string"
+                },
+                "type": "array"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Album"
+            "title": "Banner Colors"
           },
-          "album_art": {
+          "banner_url": {
             "anyOf": [
               {
                 "type": "string"
@@ -4436,24 +4726,59 @@
                 "type": "null"
               }
             ],
-            "title": "Album Art"
+            "title": "Banner Url"
           },
-          "artist": {
-            "title": "Artist",
+          "collection_code": {
+            "title": "Collection Code",
             "type": "string"
           },
-          "bpm": {
-            "anyOf": [
-              {
-                "type": "integer"
-              },
-              {
-                "type": "null"
-              }
+          "frictionless_join": {
+            "title": "Frictionless Join",
+            "type": "boolean"
+          },
+          "name": {
+            "title": "Name",
+            "type": "string"
+          },
+          "phase": {
+            "enum": [
+              "pre_announce",
+              "collection",
+              "live",
+              "closed"
             ],
-            "title": "Bpm"
+            "title": "Phase",
+            "type": "string"
           },
-          "genre": {
+          "requests_open": {
+            "title": "Requests Open",
+            "type": "boolean"
+          },
+          "submission_cap_per_guest": {
+            "title": "Submission Cap Per Guest",
+            "type": "integer"
+          }
+        },
+        "required": [
+          "banner_colors",
+          "banner_url",
+          "collection_code",
+          "frictionless_join",
+          "name",
+          "phase",
+          "requests_open",
+          "submission_cap_per_guest"
+        ],
+        "title": "PublicEventResponse",
+        "type": "object"
+      },
+      "PublicRequestInfo": {
+        "properties": {
+          "artist": {
+            "title": "Artist",
+            "type": "string"
+          },
+          "artwork_url": {
             "anyOf": [
               {
                 "type": "string"
@@ -4462,20 +4787,20 @@
                 "type": "null"
               }
             ],
-            "title": "Genre"
+            "title": "Artwork Url"
           },
-          "isrc": {
+          "bpm": {
             "anyOf": [
               {
-                "type": "string"
+                "type": "integer"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Isrc"
+            "title": "Bpm"
           },
-          "key": {
+          "genre": {
             "anyOf": [
               {
                 "type": "string"
@@ -4484,14 +4809,13 @@
                 "type": "null"
               }
             ],
-            "title": "Key"
+            "title": "Genre"
           },
-          "popularity": {
-            "default": 0,
-            "title": "Popularity",
+          "id": {
+            "title": "Id",
             "type": "integer"
           },
-          "preview_url": {
+          "musical_key": {
             "anyOf": [
               {
                 "type": "string"
@@ -4500,14 +4824,9 @@
                 "type": "null"
               }
             ],
-            "title": "Preview Url"
-          },
-          "source": {
-            "default": "spotify",
-            "title": "Source",
-            "type": "string"
+            "title": "Musical Key"
           },
-          "spotify_id": {
+          "nickname": {
             "anyOf": [
               {
                 "type": "string"
@@ -4516,199 +4835,157 @@
                 "type": "null"
               }
             ],
-            "title": "Spotify Id"
+            "title": "Nickname"
+          },
+          "requester_verified": {
+            "default": false,
+            "title": "Requester Verified",
+            "type": "boolean"
           },
           "title": {
             "title": "Title",
             "type": "string"
           },
-          "url": {
-            "anyOf": [
-              {
-                "type": "string"
-              },
-              {
-                "type": "null"
-              }
-            ],
-            "title": "Url"
+          "vote_count": {
+            "default": 0,
+            "title": "Vote Count",
+            "type": "integer"
           }
         },
         "required": [
-          "album",
-          "album_art",
           "artist",
+          "artwork_url",
           "bpm",
           "genre",
-          "isrc",
-          "key",
-          "popularity",
-          "preview_url",
-          "source",
-          "spotify_id",
+          "id",
+          "musical_key",
+          "nickname",
+          "requester_verified",
           "title",
-          "url"
-        ],
-        "title": "SearchResult",
-        "type": "object"
-      },
-      "ServiceCapabilities": {
-        "description": "Capability matrix for a single integration service.",
-        "properties": {
-          "auth": {
-            "$ref": "#/components/schemas/CapabilityStatus"
-          },
-          "catalog_search": {
-            "$ref": "#/components/schemas/CapabilityStatus"
-          },
-          "playlist_sync": {
-            "$ref": "#/components/schemas/CapabilityStatus"
-          }
-        },
-        "required": [
-          "auth",
-          "catalog_search",
-          "playlist_sync"
+          "vote_count"
         ],
-        "title": "ServiceCapabilities",
+        "title": "PublicRequestInfo",
         "type": "object"
       },
-      "StatusMessageResponse": {
+      "PublicSettings": {
         "properties": {
-          "message": {
-            "title": "Message",
-            "type": "string"
+          "registration_enabled": {
+            "title": "Registration Enabled",
+            "type": "boolean"
           },
-          "status": {
-            "title": "Status",
+          "turnstile_site_key": {
+            "title": "Turnstile Site Key",
             "type": "string"
           }
         },
         "required": [
-          "message",
-          "status"
+          "registration_enabled",
+          "turnstile_site_key"
         ],
-        "title": "StatusMessageResponse",
+        "title": "PublicSettings",
         "type": "object"
       },
-      "StatusResponse": {
+      "RecommendationResponse": {
         "properties": {
-          "status": {
-            "title": "Status",
-            "type": "string"
-          }
-        },
-        "required": [
-          "status"
-        ],
-        "title": "StatusResponse",
-        "type": "object"
-      },
-      "SystemSettingsOut": {
-        "properties": {
-          "beatport_enabled": {
-            "title": "Beatport Enabled",
-            "type": "boolean"
-          },
-          "bridge_enabled": {
-            "title": "Bridge Enabled",
-            "type": "boolean"
-          },
-          "human_verification_enforced": {
-            "title": "Human Verification Enforced",
-            "type": "boolean"
-          },
-          "llm_enabled": {
-            "title": "Llm Enabled",
+          "llm_available": {
+            "default": false,
+            "title": "Llm Available",
             "type": "boolean"
           },
-          "llm_model": {
-            "title": "Llm Model",
-            "type": "string"
+          "profile": {
+            "$ref": "#/components/schemas/EventMusicProfile"
           },
-          "llm_rate_limit_per_minute": {
-            "title": "Llm Rate Limit Per Minute",
-            "type": "integer"
+          "services_used": {
+            "default": [],
+            "items": {
+              "type": "string"
+            },
+            "title": "Services Used",
+            "type": "array"
           },
-          "registration_enabled": {
-            "title": "Registration Enabled",
-            "type": "boolean"
+          "suggestions": {
+            "default": [],
+            "items": {
+              "$ref": "#/components/schemas/RecommendedTrack"
+            },
+            "title": "Suggestions",
+            "type": "array"
           },
-          "search_rate_limit_per_minute": {
-            "title": "Search Rate Limit Per Minute",
+          "total_candidates_searched": {
+            "default": 0,
+            "title": "Total Candidates Searched",
             "type": "integer"
-          },
-          "spotify_enabled": {
-            "title": "Spotify Enabled",
-            "type": "boolean"
-          },
-          "tidal_enabled": {
-            "title": "Tidal Enabled",
-            "type": "boolean"
           }
         },
         "required": [
-          "beatport_enabled",
-          "bridge_enabled",
-          "human_verification_enforced",
-          "llm_enabled",
-          "llm_model",
-          "llm_rate_limit_per_minute",
-          "registration_enabled",
-          "search_rate_limit_per_minute",
-          "spotify_enabled",
-          "tidal_enabled"
+          "llm_available",
+          "profile",
+          "services_used",
+          "suggestions",
+          "total_candidates_searched"
         ],
-        "title": "SystemSettingsOut",
+        "title": "RecommendationResponse",
         "type": "object"
       },
-      "SystemSettingsUpdate": {
+      "RecommendedTrack": {
         "properties": {
-          "beatport_enabled": {
+          "artist": {
+            "title": "Artist",
+            "type": "string"
+          },
+          "bpm": {
             "anyOf": [
               {
-                "type": "boolean"
+                "type": "number"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Beatport Enabled"
+            "title": "Bpm"
           },
-          "bridge_enabled": {
+          "bpm_score": {
+            "title": "Bpm Score",
+            "type": "number"
+          },
+          "cover_url": {
             "anyOf": [
               {
-                "type": "boolean"
+                "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Bridge Enabled"
+            "title": "Cover Url"
           },
-          "human_verification_enforced": {
+          "duration_seconds": {
             "anyOf": [
               {
-                "type": "boolean"
+                "type": "integer"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Human Verification Enforced"
+            "title": "Duration Seconds"
           },
-          "llm_enabled": {
+          "genre": {
             "anyOf": [
               {
-                "type": "boolean"
+                "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Llm Enabled"
+            "title": "Genre"
           },
-          "llm_model": {
+          "genre_score": {
+            "title": "Genre Score",
+            "type": "number"
+          },
+          "key": {
             "anyOf": [
               {
                 "type": "string"
@@ -4717,237 +4994,262 @@
                 "type": "null"
               }
             ],
-            "title": "Llm Model"
+            "title": "Key"
           },
-          "llm_rate_limit_per_minute": {
+          "key_score": {
+            "title": "Key Score",
+            "type": "number"
+          },
+          "mb_verified": {
+            "default": false,
+            "title": "Mb Verified",
+            "type": "boolean"
+          },
+          "score": {
+            "title": "Score",
+            "type": "number"
+          },
+          "source": {
+            "title": "Source",
+            "type": "string"
+          },
+          "title": {
+            "title": "Title",
+            "type": "string"
+          },
+          "track_id": {
             "anyOf": [
               {
-                "maximum": 30.0,
-                "minimum": 1.0,
-                "type": "integer"
+                "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Llm Rate Limit Per Minute"
+            "title": "Track Id"
           },
-          "registration_enabled": {
+          "url": {
             "anyOf": [
               {
-                "type": "boolean"
+                "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Registration Enabled"
+            "title": "Url"
+          }
+        },
+        "required": [
+          "artist",
+          "bpm",
+          "bpm_score",
+          "cover_url",
+          "duration_seconds",
+          "genre",
+          "genre_score",
+          "key",
+          "key_score",
+          "mb_verified",
+          "score",
+          "source",
+          "title",
+          "track_id",
+          "url"
+        ],
+        "title": "RecommendedTrack",
+        "type": "object"
+      },
+      "RegisterRequest": {
+        "properties": {
+          "confirm_password": {
+            "title": "Confirm Password",
+            "type": "string"
           },
-          "search_rate_limit_per_minute": {
+          "email": {
+            "format": "email",
+            "title": "Email",
+            "type": "string"
+          },
+          "password": {
+            "maxLength": 128,
+            "minLength": 8,
+            "title": "Password",
+            "type": "string"
+          },
+          "turnstile_token": {
+            "default": "",
+            "maxLength": 4096,
+            "title": "Turnstile Token",
+            "type": "string"
+          },
+          "username": {
+            "maxLength": 50,
+            "minLength": 3,
+            "title": "Username",
+            "type": "string"
+          }
+        },
+        "required": [
+          "username",
+          "email",
+          "password",
+          "confirm_password"
+        ],
+        "title": "RegisterRequest",
+        "type": "object"
+      },
+      "RequestCreate": {
+        "properties": {
+          "artist": {
+            "maxLength": 255,
+            "minLength": 1,
+            "title": "Artist",
+            "type": "string"
+          },
+          "artwork_url": {
             "anyOf": [
               {
-                "maximum": 100.0,
-                "minimum": 1.0,
-                "type": "integer"
+                "maxLength": 500,
+                "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Search Rate Limit Per Minute"
+            "title": "Artwork Url"
           },
-          "spotify_enabled": {
+          "bpm": {
             "anyOf": [
               {
-                "type": "boolean"
+                "maximum": 999.0,
+                "minimum": 1.0,
+                "type": "number"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Spotify Enabled"
+            "title": "Bpm"
           },
-          "tidal_enabled": {
+          "genre": {
             "anyOf": [
               {
-                "type": "boolean"
+                "maxLength": 100,
+                "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Tidal Enabled"
-          }
-        },
-        "title": "SystemSettingsUpdate",
-        "type": "object"
-      },
-      "SystemStats": {
-        "properties": {
-          "active_events": {
-            "title": "Active Events",
-            "type": "integer"
-          },
-          "active_users": {
-            "title": "Active Users",
-            "type": "integer"
+            "title": "Genre"
           },
-          "pending_users": {
-            "title": "Pending Users",
-            "type": "integer"
-          },
-          "total_events": {
-            "title": "Total Events",
-            "type": "integer"
-          },
-          "total_requests": {
-            "title": "Total Requests",
-            "type": "integer"
-          },
-          "total_users": {
-            "title": "Total Users",
-            "type": "integer"
-          }
-        },
-        "required": [
-          "active_events",
-          "active_users",
-          "pending_users",
-          "total_events",
-          "total_requests",
-          "total_users"
-        ],
-        "title": "SystemStats",
-        "type": "object"
-      },
-      "TemplatePlaylistRequest": {
-        "properties": {
-          "playlist_id": {
-            "maxLength": 200,
-            "minLength": 1,
-            "title": "Playlist Id",
-            "type": "string"
-          },
-          "source": {
-            "pattern": "^(tidal|beatport)$",
-            "title": "Source",
-            "type": "string"
-          }
-        },
-        "required": [
-          "source",
-          "playlist_id"
-        ],
-        "title": "TemplatePlaylistRequest",
-        "type": "object"
-      },
-      "TidalAuthCheckResponse": {
-        "properties": {
-          "complete": {
-            "title": "Complete",
-            "type": "boolean"
-          },
-          "error": {
+          "musical_key": {
             "anyOf": [
               {
+                "maxLength": 20,
                 "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Error"
+            "title": "Musical Key"
           },
-          "pending": {
+          "nickname": {
             "anyOf": [
               {
-                "type": "boolean"
+                "maxLength": 30,
+                "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Pending"
+            "title": "Nickname"
           },
-          "user_code": {
+          "note": {
             "anyOf": [
               {
+                "maxLength": 500,
                 "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "User Code"
+            "title": "Note"
           },
-          "user_id": {
+          "raw_search_query": {
             "anyOf": [
               {
+                "maxLength": 200,
                 "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "User Id"
+            "title": "Raw Search Query"
           },
-          "verification_url": {
+          "source": {
+            "$ref": "#/components/schemas/RequestSource",
+            "default": "manual"
+          },
+          "source_url": {
             "anyOf": [
               {
+                "maxLength": 500,
                 "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Verification Url"
+            "title": "Source Url"
+          },
+          "title": {
+            "maxLength": 255,
+            "minLength": 1,
+            "title": "Title",
+            "type": "string"
           }
         },
         "required": [
-          "complete",
-          "error",
-          "pending",
-          "user_code",
-          "user_id",
-          "verification_url"
+          "artist",
+          "title"
         ],
-        "title": "TidalAuthCheckResponse",
+        "title": "RequestCreate",
         "type": "object"
       },
-      "TidalAuthStartResponse": {
+      "RequestEmailChangeRequest": {
         "properties": {
-          "message": {
-            "title": "Message",
+          "current_password": {
+            "maxLength": 128,
+            "minLength": 1,
+            "title": "Current Password",
             "type": "string"
           },
-          "user_code": {
-            "title": "User Code",
+          "new_email": {
+            "format": "email",
+            "title": "New Email",
             "type": "string"
-          },
-          "verification_url": {
-            "anyOf": [
-              {
-                "type": "string"
-              },
-              {
-                "type": "null"
-              }
-            ],
-            "title": "Verification Url"
           }
         },
         "required": [
-          "message",
-          "user_code",
-          "verification_url"
+          "current_password",
+          "new_email"
         ],
-        "title": "TidalAuthStartResponse",
+        "title": "RequestEmailChangeRequest",
         "type": "object"
       },
-      "TidalEventSettings": {
-        "description": "Tidal sync settings for an event.",
+      "RequestOut": {
         "properties": {
-          "tidal_playlist_id": {
+          "artist": {
+            "title": "Artist",
+            "type": "string"
+          },
+          "artwork_url": {
             "anyOf": [
               {
                 "type": "string"
@@ -4956,81 +5258,48 @@
                 "type": "null"
               }
             ],
-            "title": "Tidal Playlist Id"
+            "title": "Artwork Url"
           },
-          "tidal_sync_enabled": {
-            "title": "Tidal Sync Enabled",
-            "type": "boolean"
-          }
-        },
-        "required": [
-          "tidal_playlist_id",
-          "tidal_sync_enabled"
-        ],
-        "title": "TidalEventSettings",
-        "type": "object"
-      },
-      "TidalEventSettingsUpdate": {
-        "description": "Update Tidal sync settings for an event.",
-        "properties": {
-          "tidal_sync_enabled": {
-            "title": "Tidal Sync Enabled",
-            "type": "boolean"
-          }
-        },
-        "required": [
-          "tidal_sync_enabled"
-        ],
-        "title": "TidalEventSettingsUpdate",
-        "type": "object"
-      },
-      "TidalManualLink": {
-        "description": "Manual track linking request.",
-        "properties": {
-          "tidal_track_id": {
-            "maxLength": 100,
-            "minLength": 1,
-            "pattern": "^[0-9]+$",
-            "title": "Tidal Track Id",
-            "type": "string"
-          }
-        },
-        "required": [
-          "tidal_track_id"
-        ],
-        "title": "TidalManualLink",
-        "type": "object"
-      },
-      "TidalSearchResult": {
-        "description": "Track result from Tidal search.",
-        "properties": {
-          "album": {
+          "bpm": {
             "anyOf": [
               {
-                "type": "string"
+                "type": "number"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Album"
+            "title": "Bpm"
           },
-          "artist": {
-            "title": "Artist",
+          "created_at": {
+            "title": "Created At",
             "type": "string"
           },
-          "bpm": {
+          "event_id": {
+            "title": "Event Id",
+            "type": "integer"
+          },
+          "genre": {
             "anyOf": [
               {
-                "type": "number"
+                "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Bpm"
+            "title": "Genre"
           },
-          "cover_url": {
+          "id": {
+            "title": "Id",
+            "type": "integer"
+          },
+          "is_duplicate": {
+            "default": false,
+            "title": "Is Duplicate",
+            "type": "boolean"
+          },
+          "musical_key": {
             "anyOf": [
               {
                 "type": "string"
@@ -5039,25 +5308,20 @@
                 "type": "null"
               }
             ],
-            "title": "Cover Url"
+            "title": "Musical Key"
           },
-          "duration_seconds": {
+          "nickname": {
             "anyOf": [
               {
-                "type": "integer"
+                "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Duration Seconds"
-          },
-          "explicit": {
-            "default": false,
-            "title": "Explicit",
-            "type": "boolean"
+            "title": "Nickname"
           },
-          "isrc": {
+          "note": {
             "anyOf": [
               {
                 "type": "string"
@@ -5066,25 +5330,20 @@
                 "type": "null"
               }
             ],
-            "title": "Isrc"
+            "title": "Note"
           },
-          "key": {
+          "priority_score": {
             "anyOf": [
               {
-                "type": "string"
+                "type": "number"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Key"
-          },
-          "popularity": {
-            "default": 0,
-            "title": "Popularity",
-            "type": "integer"
+            "title": "Priority Score"
           },
-          "tidal_url": {
+          "raw_search_query": {
             "anyOf": [
               {
                 "type": "string"
@@ -5093,50 +5352,17 @@
                 "type": "null"
               }
             ],
-            "title": "Tidal Url"
+            "title": "Raw Search Query"
           },
-          "title": {
-            "title": "Title",
-            "type": "string"
+          "song_title": {
+            "title": "Song Title",
+            "type": "string"
           },
-          "track_id": {
-            "title": "Track Id",
+          "source": {
+            "title": "Source",
             "type": "string"
           },
-          "version": {
-            "anyOf": [
-              {
-                "type": "string"
-              },
-              {
-                "type": "null"
-              }
-            ],
-            "title": "Version"
-          }
-        },
-        "required": [
-          "album",
-          "artist",
-          "bpm",
-          "cover_url",
-          "duration_seconds",
-          "explicit",
-          "isrc",
-          "key",
-          "popularity",
-          "tidal_url",
-          "title",
-          "track_id",
-          "version"
-        ],
-        "title": "TidalSearchResult",
-        "type": "object"
-      },
-      "TidalStatus": {
-        "description": "Current Tidal account linking status.",
-        "properties": {
-          "expires_at": {
+          "source_url": {
             "anyOf": [
               {
                 "type": "string"
@@ -5145,18 +5371,13 @@
                 "type": "null"
               }
             ],
-            "title": "Expires At"
-          },
-          "integration_enabled": {
-            "default": true,
-            "title": "Integration Enabled",
-            "type": "boolean"
+            "title": "Source Url"
           },
-          "linked": {
-            "title": "Linked",
-            "type": "boolean"
+          "status": {
+            "title": "Status",
+            "type": "string"
           },
-          "user_id": {
+          "sync_results_json": {
             "anyOf": [
               {
                 "type": "string"
@@ -5165,22 +5386,81 @@
                 "type": "null"
               }
             ],
-            "title": "User Id"
+            "title": "Sync Results Json"
+          },
+          "updated_at": {
+            "title": "Updated At",
+            "type": "string"
+          },
+          "vote_count": {
+            "default": 0,
+            "title": "Vote Count",
+            "type": "integer"
           }
         },
         "required": [
-          "expires_at",
-          "integration_enabled",
-          "linked",
-          "user_id"
+          "artist",
+          "artwork_url",
+          "bpm",
+          "created_at",
+          "event_id",
+          "genre",
+          "id",
+          "is_duplicate",
+          "musical_key",
+          "nickname",
+          "note",
+          "priority_score",
+          "raw_search_query",
+          "song_title",
+          "source",
+          "source_url",
+          "status",
+          "sync_results_json",
+          "updated_at",
+          "vote_count"
         ],
-        "title": "TidalStatus",
+        "title": "RequestOut",
         "type": "object"
       },
-      "TidalSyncResult": {
-        "description": "Result of syncing a request to Tidal playlist.",
+      "RequestSource": {
+        "enum": [
+          "manual",
+          "musicbrainz",
+          "spotify",
+          "share_link",
+          "tidal",
+          "beatport"
+        ],
+        "title": "RequestSource",
+        "type": "string"
+      },
+      "RequestStatus": {
+        "enum": [
+          "new",
+          "accepted",
+          "playing",
+          "played",
+          "rejected"
+        ],
+        "title": "RequestStatus",
+        "type": "string"
+      },
+      "RequestUpdate": {
         "properties": {
-          "error": {
+          "status": {
+            "$ref": "#/components/schemas/RequestStatus"
+          }
+        },
+        "required": [
+          "status"
+        ],
+        "title": "RequestUpdate",
+        "type": "object"
+      },
+      "SearchResult": {
+        "properties": {
+          "album": {
             "anyOf": [
               {
                 "type": "string"
@@ -5189,16 +5469,9 @@
                 "type": "null"
               }
             ],
-            "title": "Error"
-          },
-          "request_id": {
-            "title": "Request Id",
-            "type": "integer"
-          },
-          "status": {
-            "$ref": "#/components/schemas/TidalSyncStatus"
+            "title": "Album"
           },
-          "tidal_track_id": {
+          "album_art": {
             "anyOf": [
               {
                 "type": "string"
@@ -5207,135 +5480,93 @@
                 "type": "null"
               }
             ],
-            "title": "Tidal Track Id"
-          }
-        },
-        "required": [
-          "error",
-          "request_id",
-          "status",
-          "tidal_track_id"
-        ],
-        "title": "TidalSyncResult",
-        "type": "object"
-      },
-      "TidalSyncStatus": {
-        "enum": [
-          "pending",
-          "synced",
-          "not_found",
-          "error"
-        ],
-        "title": "TidalSyncStatus",
-        "type": "string"
-      },
-      "Token": {
-        "properties": {
-          "access_token": {
-            "title": "Access Token",
-            "type": "string"
+            "title": "Album Art"
           },
-          "token_type": {
-            "default": "bearer",
-            "title": "Token Type",
+          "artist": {
+            "title": "Artist",
             "type": "string"
-          }
-        },
-        "required": [
-          "access_token",
-          "token_type"
-        ],
-        "title": "Token",
-        "type": "object"
-      },
-      "UpdateCollectionSettings": {
-        "properties": {
-          "collection_opens_at": {
+          },
+          "bpm": {
             "anyOf": [
               {
-                "format": "date-time",
-                "type": "string"
+                "type": "integer"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Collection Opens At"
+            "title": "Bpm"
           },
-          "collection_phase_override": {
+          "genre": {
             "anyOf": [
               {
-                "enum": [
-                  "force_collection",
-                  "force_live"
-                ],
                 "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Collection Phase Override"
+            "title": "Genre"
           },
-          "live_starts_at": {
+          "isrc": {
             "anyOf": [
               {
-                "format": "date-time",
                 "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Live Starts At"
+            "title": "Isrc"
           },
-          "submission_cap_per_guest": {
+          "key": {
             "anyOf": [
               {
-                "maximum": 100.0,
-                "minimum": 0.0,
-                "type": "integer"
+                "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Submission Cap Per Guest"
+            "title": "Key"
           },
-          "tidal_collection_bidirectional": {
+          "popularity": {
+            "default": 0,
+            "title": "Popularity",
+            "type": "integer"
+          },
+          "preview_url": {
             "anyOf": [
               {
-                "type": "boolean"
+                "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Tidal Collection Bidirectional"
+            "title": "Preview Url"
           },
-          "tidal_sync_enabled": {
+          "source": {
+            "default": "spotify",
+            "title": "Source",
+            "type": "string"
+          },
+          "spotify_id": {
             "anyOf": [
               {
-                "type": "boolean"
+                "type": "string"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Tidal Sync Enabled"
-          }
-        },
-        "title": "UpdateCollectionSettings",
-        "type": "object"
-      },
-      "UserOut": {
-        "properties": {
-          "created_at": {
-            "format": "date-time",
-            "title": "Created At",
+            "title": "Spotify Id"
+          },
+          "title": {
+            "title": "Title",
             "type": "string"
           },
-          "email": {
+          "url": {
             "anyOf": [
               {
                 "type": "string"
@@ -5344,291 +5575,2313 @@
                 "type": "null"
               }
             ],
-            "title": "Email"
-          },
-          "frictionless_join_default": {
-            "default": false,
-            "title": "Frictionless Join Default",
-            "type": "boolean"
-          },
-          "help_pages_seen": {
-            "default": [],
-            "items": {
-              "type": "string"
-            },
-            "title": "Help Pages Seen",
-            "type": "array"
-          },
-          "id": {
-            "title": "Id",
-            "type": "integer"
+            "title": "Url"
+          }
+        },
+        "required": [
+          "album",
+          "album_art",
+          "artist",
+          "bpm",
+          "genre",
+          "isrc",
+          "key",
+          "popularity",
+          "preview_url",
+          "source",
+          "spotify_id",
+          "title",
+          "url"
+        ],
+        "title": "SearchResult",
+        "type": "object"
+      },
+      "ServiceCapabilities": {
+        "description": "Capability matrix for a single integration service.",
+        "properties": {
+          "auth": {
+            "$ref": "#/components/schemas/CapabilityStatus"
           },
-          "is_active": {
-            "title": "Is Active",
-            "type": "boolean"
+          "catalog_search": {
+            "$ref": "#/components/schemas/CapabilityStatus"
           },
-          "pending_email": {
+          "playlist_sync": {
+            "$ref": "#/components/schemas/CapabilityStatus"
+          }
+        },
+        "required": [
+          "auth",
+          "catalog_search",
+          "playlist_sync"
+        ],
+        "title": "ServiceCapabilities",
+        "type": "object"
+      },
+      "SetCreate": {
+        "description": "Body for creating a new (empty) set.",
+        "properties": {
+          "event_id": {
             "anyOf": [
               {
-                "type": "string"
+                "type": "integer"
               },
               {
                 "type": "null"
               }
             ],
-            "title": "Pending Email"
-          },
-          "role": {
-            "title": "Role",
-            "type": "string"
+            "title": "Event Id"
           },
-          "username": {
-            "title": "Username",
+          "name": {
+            "maxLength": 120,
+            "minLength": 1,
+            "title": "Name",
             "type": "string"
           }
         },
         "required": [
-          "created_at",
-          "email",
-          "frictionless_join_default",
-          "help_pages_seen",
-          "id",
-          "is_active",
-          "pending_email",
-          "role",
-          "username"
+          "name"
         ],
-        "title": "UserOut",
+        "title": "SetCreate",
         "type": "object"
       },
-      "ValidationError": {
+      "SetDetail": {
+        "description": "Full set record (Phase 0: no slot/curve expansion yet).",
         "properties": {
-          "ctx": {
-            "title": "Context",
-            "type": "object"
-          },
-          "input": {
-            "title": "Input"
+          "bpm_ceiling": {
+            "anyOf": [
+              {
+                "type": "integer"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Bpm Ceiling"
           },
-          "loc": {
-            "items": {
-              "anyOf": [
-                {
-                  "type": "string"
-                },
-                {
-                  "type": "integer"
-                }
-              ]
-            },
-            "title": "Location",
-            "type": "array"
+          "bpm_floor": {
+            "anyOf": [
+              {
+                "type": "integer"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Bpm Floor"
           },
-          "msg": {
-            "title": "Message",
+          "created_at": {
+            "format": "date-time",
+            "title": "Created At",
             "type": "string"
           },
-          "type": {
-            "title": "Error Type",
-            "type": "string"
-          }
-        },
-        "required": [
-          "ctx",
-          "input",
-          "loc",
-          "msg",
-          "type"
-        ],
-        "title": "ValidationError",
-        "type": "object"
-      },
-      "VerifyConfirmResponse": {
-        "properties": {
-          "guest_id": {
-            "title": "Guest Id",
+          "event_id": {
+            "anyOf": [
+              {
+                "type": "integer"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Event Id"
+          },
+          "exported_at": {
+            "anyOf": [
+              {
+                "format": "date-time",
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Exported At"
+          },
+          "id": {
+            "title": "Id",
             "type": "integer"
           },
-          "merged": {
-            "title": "Merged",
-            "type": "boolean"
+          "key_strictness": {
+            "title": "Key Strictness",
+            "type": "number"
           },
-          "verified": {
-            "title": "Verified",
-            "type": "boolean"
-          }
-        },
-        "required": [
-          "guest_id",
-          "merged",
-          "verified"
-        ],
-        "title": "VerifyConfirmResponse",
-        "type": "object"
-      },
-      "VerifyConfirmSchema": {
-        "properties": {
-          "code": {
-            "title": "Code",
+          "name": {
+            "title": "Name",
             "type": "string"
           },
-          "email": {
-            "format": "email",
-            "title": "Email",
+          "sharing_mode": {
+            "enum": [
+              "private",
+              "invite_only"
+            ],
+            "title": "Sharing Mode",
+            "type": "string"
+          },
+          "status": {
+            "enum": [
+              "draft",
+              "locked",
+              "exported"
+            ],
+            "title": "Status",
+            "type": "string"
+          },
+          "target_duration_sec": {
+            "anyOf": [
+              {
+                "type": "integer"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Target Duration Sec"
+          },
+          "tidal_playlist_id": {
+            "anyOf": [
+              {
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Tidal Playlist Id"
+          },
+          "updated_at": {
+            "format": "date-time",
+            "title": "Updated At",
             "type": "string"
+          },
+          "vibe_theme": {
+            "anyOf": [
+              {
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Vibe Theme"
           }
         },
         "required": [
-          "email",
-          "code"
+          "bpm_ceiling",
+          "bpm_floor",
+          "created_at",
+          "event_id",
+          "exported_at",
+          "id",
+          "key_strictness",
+          "name",
+          "sharing_mode",
+          "status",
+          "target_duration_sec",
+          "tidal_playlist_id",
+          "updated_at",
+          "vibe_theme"
         ],
-        "title": "VerifyConfirmSchema",
+        "title": "SetDetail",
         "type": "object"
       },
-      "VerifyHumanRequest": {
+      "SetRename": {
+        "description": "Body for renaming a set.",
         "properties": {
-          "turnstile_token": {
-            "maxLength": 4096,
+          "name": {
+            "maxLength": 120,
             "minLength": 1,
-            "title": "Turnstile Token",
+            "title": "Name",
             "type": "string"
           }
         },
         "required": [
-          "turnstile_token"
+          "name"
         ],
-        "title": "VerifyHumanRequest",
+        "title": "SetRename",
         "type": "object"
       },
-      "VerifyHumanResponse": {
+      "SetSummary": {
+        "description": "Set list item (no children).",
         "properties": {
-          "expires_in": {
-            "title": "Expires In",
+          "created_at": {
+            "format": "date-time",
+            "title": "Created At",
+            "type": "string"
+          },
+          "event_id": {
+            "anyOf": [
+              {
+                "type": "integer"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Event Id"
+          },
+          "id": {
+            "title": "Id",
             "type": "integer"
           },
-          "verified": {
-            "title": "Verified",
-            "type": "boolean"
+          "name": {
+            "title": "Name",
+            "type": "string"
+          },
+          "sharing_mode": {
+            "enum": [
+              "private",
+              "invite_only"
+            ],
+            "title": "Sharing Mode",
+            "type": "string"
+          },
+          "status": {
+            "enum": [
+              "draft",
+              "locked",
+              "exported"
+            ],
+            "title": "Status",
+            "type": "string"
+          },
+          "updated_at": {
+            "format": "date-time",
+            "title": "Updated At",
+            "type": "string"
           }
         },
         "required": [
-          "expires_in",
-          "verified"
+          "created_at",
+          "event_id",
+          "id",
+          "name",
+          "sharing_mode",
+          "status",
+          "updated_at"
         ],
-        "title": "VerifyHumanResponse",
+        "title": "SetSummary",
         "type": "object"
       },
-      "VerifyRequestResponse": {
+      "StatusMessageResponse": {
         "properties": {
-          "sent": {
-            "title": "Sent",
+          "message": {
+            "title": "Message",
+            "type": "string"
+          },
+          "status": {
+            "title": "Status",
+            "type": "string"
+          }
+        },
+        "required": [
+          "message",
+          "status"
+        ],
+        "title": "StatusMessageResponse",
+        "type": "object"
+      },
+      "StatusResponse": {
+        "properties": {
+          "status": {
+            "title": "Status",
+            "type": "string"
+          }
+        },
+        "required": [
+          "status"
+        ],
+        "title": "StatusResponse",
+        "type": "object"
+      },
+      "SystemSettingsOut": {
+        "properties": {
+          "beatport_enabled": {
+            "title": "Beatport Enabled",
+            "type": "boolean"
+          },
+          "bridge_enabled": {
+            "title": "Bridge Enabled",
+            "type": "boolean"
+          },
+          "human_verification_enforced": {
+            "title": "Human Verification Enforced",
+            "type": "boolean"
+          },
+          "llm_enabled": {
+            "title": "Llm Enabled",
+            "type": "boolean"
+          },
+          "llm_model": {
+            "title": "Llm Model",
+            "type": "string"
+          },
+          "llm_rate_limit_per_minute": {
+            "title": "Llm Rate Limit Per Minute",
+            "type": "integer"
+          },
+          "registration_enabled": {
+            "title": "Registration Enabled",
+            "type": "boolean"
+          },
+          "search_rate_limit_per_minute": {
+            "title": "Search Rate Limit Per Minute",
+            "type": "integer"
+          },
+          "spotify_enabled": {
+            "title": "Spotify Enabled",
+            "type": "boolean"
+          },
+          "tidal_enabled": {
+            "title": "Tidal Enabled",
             "type": "boolean"
           }
         },
-        "required": [
-          "sent"
+        "required": [
+          "beatport_enabled",
+          "bridge_enabled",
+          "human_verification_enforced",
+          "llm_enabled",
+          "llm_model",
+          "llm_rate_limit_per_minute",
+          "registration_enabled",
+          "search_rate_limit_per_minute",
+          "spotify_enabled",
+          "tidal_enabled"
+        ],
+        "title": "SystemSettingsOut",
+        "type": "object"
+      },
+      "SystemSettingsUpdate": {
+        "properties": {
+          "beatport_enabled": {
+            "anyOf": [
+              {
+                "type": "boolean"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Beatport Enabled"
+          },
+          "bridge_enabled": {
+            "anyOf": [
+              {
+                "type": "boolean"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Bridge Enabled"
+          },
+          "human_verification_enforced": {
+            "anyOf": [
+              {
+                "type": "boolean"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Human Verification Enforced"
+          },
+          "llm_enabled": {
+            "anyOf": [
+              {
+                "type": "boolean"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Llm Enabled"
+          },
+          "llm_model": {
+            "anyOf": [
+              {
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Llm Model"
+          },
+          "llm_rate_limit_per_minute": {
+            "anyOf": [
+              {
+                "maximum": 30.0,
+                "minimum": 1.0,
+                "type": "integer"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Llm Rate Limit Per Minute"
+          },
+          "registration_enabled": {
+            "anyOf": [
+              {
+                "type": "boolean"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Registration Enabled"
+          },
+          "search_rate_limit_per_minute": {
+            "anyOf": [
+              {
+                "maximum": 100.0,
+                "minimum": 1.0,
+                "type": "integer"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Search Rate Limit Per Minute"
+          },
+          "spotify_enabled": {
+            "anyOf": [
+              {
+                "type": "boolean"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Spotify Enabled"
+          },
+          "tidal_enabled": {
+            "anyOf": [
+              {
+                "type": "boolean"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Tidal Enabled"
+          }
+        },
+        "title": "SystemSettingsUpdate",
+        "type": "object"
+      },
+      "SystemStats": {
+        "properties": {
+          "active_events": {
+            "title": "Active Events",
+            "type": "integer"
+          },
+          "active_users": {
+            "title": "Active Users",
+            "type": "integer"
+          },
+          "pending_users": {
+            "title": "Pending Users",
+            "type": "integer"
+          },
+          "total_events": {
+            "title": "Total Events",
+            "type": "integer"
+          },
+          "total_requests": {
+            "title": "Total Requests",
+            "type": "integer"
+          },
+          "total_users": {
+            "title": "Total Users",
+            "type": "integer"
+          }
+        },
+        "required": [
+          "active_events",
+          "active_users",
+          "pending_users",
+          "total_events",
+          "total_requests",
+          "total_users"
+        ],
+        "title": "SystemStats",
+        "type": "object"
+      },
+      "TemplatePlaylistRequest": {
+        "properties": {
+          "playlist_id": {
+            "maxLength": 200,
+            "minLength": 1,
+            "title": "Playlist Id",
+            "type": "string"
+          },
+          "source": {
+            "pattern": "^(tidal|beatport)$",
+            "title": "Source",
+            "type": "string"
+          }
+        },
+        "required": [
+          "source",
+          "playlist_id"
+        ],
+        "title": "TemplatePlaylistRequest",
+        "type": "object"
+      },
+      "TidalAuthCheckResponse": {
+        "properties": {
+          "complete": {
+            "title": "Complete",
+            "type": "boolean"
+          },
+          "error": {
+            "anyOf": [
+              {
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Error"
+          },
+          "pending": {
+            "anyOf": [
+              {
+                "type": "boolean"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Pending"
+          },
+          "user_code": {
+            "anyOf": [
+              {
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "User Code"
+          },
+          "user_id": {
+            "anyOf": [
+              {
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "User Id"
+          },
+          "verification_url": {
+            "anyOf": [
+              {
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Verification Url"
+          }
+        },
+        "required": [
+          "complete",
+          "error",
+          "pending",
+          "user_code",
+          "user_id",
+          "verification_url"
+        ],
+        "title": "TidalAuthCheckResponse",
+        "type": "object"
+      },
+      "TidalAuthStartResponse": {
+        "properties": {
+          "message": {
+            "title": "Message",
+            "type": "string"
+          },
+          "user_code": {
+            "title": "User Code",
+            "type": "string"
+          },
+          "verification_url": {
+            "anyOf": [
+              {
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Verification Url"
+          }
+        },
+        "required": [
+          "message",
+          "user_code",
+          "verification_url"
+        ],
+        "title": "TidalAuthStartResponse",
+        "type": "object"
+      },
+      "TidalEventSettings": {
+        "description": "Tidal sync settings for an event.",
+        "properties": {
+          "tidal_playlist_id": {
+            "anyOf": [
+              {
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Tidal Playlist Id"
+          },
+          "tidal_sync_enabled": {
+            "title": "Tidal Sync Enabled",
+            "type": "boolean"
+          }
+        },
+        "required": [
+          "tidal_playlist_id",
+          "tidal_sync_enabled"
+        ],
+        "title": "TidalEventSettings",
+        "type": "object"
+      },
+      "TidalEventSettingsUpdate": {
+        "description": "Update Tidal sync settings for an event.",
+        "properties": {
+          "tidal_sync_enabled": {
+            "title": "Tidal Sync Enabled",
+            "type": "boolean"
+          }
+        },
+        "required": [
+          "tidal_sync_enabled"
+        ],
+        "title": "TidalEventSettingsUpdate",
+        "type": "object"
+      },
+      "TidalManualLink": {
+        "description": "Manual track linking request.",
+        "properties": {
+          "tidal_track_id": {
+            "maxLength": 100,
+            "minLength": 1,
+            "pattern": "^[0-9]+$",
+            "title": "Tidal Track Id",
+            "type": "string"
+          }
+        },
+        "required": [
+          "tidal_track_id"
+        ],
+        "title": "TidalManualLink",
+        "type": "object"
+      },
+      "TidalSearchResult": {
+        "description": "Track result from Tidal search.",
+        "properties": {
+          "album": {
+            "anyOf": [
+              {
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Album"
+          },
+          "artist": {
+            "title": "Artist",
+            "type": "string"
+          },
+          "bpm": {
+            "anyOf": [
+              {
+                "type": "number"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Bpm"
+          },
+          "cover_url": {
+            "anyOf": [
+              {
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Cover Url"
+          },
+          "duration_seconds": {
+            "anyOf": [
+              {
+                "type": "integer"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Duration Seconds"
+          },
+          "explicit": {
+            "default": false,
+            "title": "Explicit",
+            "type": "boolean"
+          },
+          "isrc": {
+            "anyOf": [
+              {
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Isrc"
+          },
+          "key": {
+            "anyOf": [
+              {
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Key"
+          },
+          "popularity": {
+            "default": 0,
+            "title": "Popularity",
+            "type": "integer"
+          },
+          "tidal_url": {
+            "anyOf": [
+              {
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Tidal Url"
+          },
+          "title": {
+            "title": "Title",
+            "type": "string"
+          },
+          "track_id": {
+            "title": "Track Id",
+            "type": "string"
+          },
+          "version": {
+            "anyOf": [
+              {
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Version"
+          }
+        },
+        "required": [
+          "album",
+          "artist",
+          "bpm",
+          "cover_url",
+          "duration_seconds",
+          "explicit",
+          "isrc",
+          "key",
+          "popularity",
+          "tidal_url",
+          "title",
+          "track_id",
+          "version"
+        ],
+        "title": "TidalSearchResult",
+        "type": "object"
+      },
+      "TidalStatus": {
+        "description": "Current Tidal account linking status.",
+        "properties": {
+          "expires_at": {
+            "anyOf": [
+              {
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Expires At"
+          },
+          "integration_enabled": {
+            "default": true,
+            "title": "Integration Enabled",
+            "type": "boolean"
+          },
+          "linked": {
+            "title": "Linked",
+            "type": "boolean"
+          },
+          "user_id": {
+            "anyOf": [
+              {
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "User Id"
+          }
+        },
+        "required": [
+          "expires_at",
+          "integration_enabled",
+          "linked",
+          "user_id"
+        ],
+        "title": "TidalStatus",
+        "type": "object"
+      },
+      "TidalSyncResult": {
+        "description": "Result of syncing a request to Tidal playlist.",
+        "properties": {
+          "error": {
+            "anyOf": [
+              {
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Error"
+          },
+          "request_id": {
+            "title": "Request Id",
+            "type": "integer"
+          },
+          "status": {
+            "$ref": "#/components/schemas/TidalSyncStatus"
+          },
+          "tidal_track_id": {
+            "anyOf": [
+              {
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Tidal Track Id"
+          }
+        },
+        "required": [
+          "error",
+          "request_id",
+          "status",
+          "tidal_track_id"
+        ],
+        "title": "TidalSyncResult",
+        "type": "object"
+      },
+      "TidalSyncStatus": {
+        "enum": [
+          "pending",
+          "synced",
+          "not_found",
+          "error"
+        ],
+        "title": "TidalSyncStatus",
+        "type": "string"
+      },
+      "Token": {
+        "properties": {
+          "access_token": {
+            "title": "Access Token",
+            "type": "string"
+          },
+          "token_type": {
+            "default": "bearer",
+            "title": "Token Type",
+            "type": "string"
+          }
+        },
+        "required": [
+          "access_token",
+          "token_type"
+        ],
+        "title": "Token",
+        "type": "object"
+      },
+      "UpdateCollectionSettings": {
+        "properties": {
+          "collection_opens_at": {
+            "anyOf": [
+              {
+                "format": "date-time",
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Collection Opens At"
+          },
+          "collection_phase_override": {
+            "anyOf": [
+              {
+                "enum": [
+                  "force_collection",
+                  "force_live"
+                ],
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Collection Phase Override"
+          },
+          "live_starts_at": {
+            "anyOf": [
+              {
+                "format": "date-time",
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Live Starts At"
+          },
+          "submission_cap_per_guest": {
+            "anyOf": [
+              {
+                "maximum": 100.0,
+                "minimum": 0.0,
+                "type": "integer"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Submission Cap Per Guest"
+          },
+          "tidal_collection_bidirectional": {
+            "anyOf": [
+              {
+                "type": "boolean"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Tidal Collection Bidirectional"
+          },
+          "tidal_sync_enabled": {
+            "anyOf": [
+              {
+                "type": "boolean"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Tidal Sync Enabled"
+          }
+        },
+        "title": "UpdateCollectionSettings",
+        "type": "object"
+      },
+      "UsageRow": {
+        "properties": {
+          "connector_id": {
+            "title": "Connector Id",
+            "type": "integer"
+          },
+          "connector_type": {
+            "enum": [
+              "openai_apikey",
+              "anthropic_apikey",
+              "openai_compatible",
+              "openrouter_apikey",
+              "xai_apikey",
+              "bedrock",
+              "azure_openai",
+              "gemini_apikey"
+            ],
+            "title": "Connector Type",
+            "type": "string"
+          },
+          "display_name": {
+            "title": "Display Name",
+            "type": "string"
+          },
+          "dj_username": {
+            "title": "Dj Username",
+            "type": "string"
+          },
+          "error_count": {
+            "title": "Error Count",
+            "type": "integer"
+          },
+          "error_rate": {
+            "title": "Error Rate",
+            "type": "number"
+          },
+          "total_calls": {
+            "title": "Total Calls",
+            "type": "integer"
+          },
+          "total_tokens_in": {
+            "title": "Total Tokens In",
+            "type": "integer"
+          },
+          "total_tokens_out": {
+            "title": "Total Tokens Out",
+            "type": "integer"
+          }
+        },
+        "required": [
+          "connector_id",
+          "connector_type",
+          "display_name",
+          "dj_username",
+          "error_count",
+          "error_rate",
+          "total_calls",
+          "total_tokens_in",
+          "total_tokens_out"
+        ],
+        "title": "UsageRow",
+        "type": "object"
+      },
+      "UserOut": {
+        "properties": {
+          "created_at": {
+            "format": "date-time",
+            "title": "Created At",
+            "type": "string"
+          },
+          "email": {
+            "anyOf": [
+              {
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Email"
+          },
+          "frictionless_join_default": {
+            "default": false,
+            "title": "Frictionless Join Default",
+            "type": "boolean"
+          },
+          "help_pages_seen": {
+            "default": [],
+            "items": {
+              "type": "string"
+            },
+            "title": "Help Pages Seen",
+            "type": "array"
+          },
+          "id": {
+            "title": "Id",
+            "type": "integer"
+          },
+          "is_active": {
+            "title": "Is Active",
+            "type": "boolean"
+          },
+          "pending_email": {
+            "anyOf": [
+              {
+                "type": "string"
+              },
+              {
+                "type": "null"
+              }
+            ],
+            "title": "Pending Email"
+          },
+          "role": {
+            "title": "Role",
+            "type": "string"
+          },
+          "username": {
+            "title": "Username",
+            "type": "string"
+          }
+        },
+        "required": [
+          "created_at",
+          "email",
+          "frictionless_join_default",
+          "help_pages_seen",
+          "id",
+          "is_active",
+          "pending_email",
+          "role",
+          "username"
+        ],
+        "title": "UserOut",
+        "type": "object"
+      },
+      "ValidationError": {
+        "properties": {
+          "ctx": {
+            "title": "Context",
+            "type": "object"
+          },
+          "input": {
+            "title": "Input"
+          },
+          "loc": {
+            "items": {
+              "anyOf": [
+                {
+                  "type": "string"
+                },
+                {
+                  "type": "integer"
+                }
+              ]
+            },
+            "title": "Location",
+            "type": "array"
+          },
+          "msg": {
+            "title": "Message",
+            "type": "string"
+          },
+          "type": {
+            "title": "Error Type",
+            "type": "string"
+          }
+        },
+        "required": [
+          "ctx",
+          "input",
+          "loc",
+          "msg",
+          "type"
+        ],
+        "title": "ValidationError",
+        "type": "object"
+      },
+      "VerifyConfirmResponse": {
+        "properties": {
+          "guest_id": {
+            "title": "Guest Id",
+            "type": "integer"
+          },
+          "merged": {
+            "title": "Merged",
+            "type": "boolean"
+          },
+          "verified": {
+            "title": "Verified",
+            "type": "boolean"
+          }
+        },
+        "required": [
+          "guest_id",
+          "merged",
+          "verified"
+        ],
+        "title": "VerifyConfirmResponse",
+        "type": "object"
+      },
+      "VerifyConfirmSchema": {
+        "properties": {
+          "code": {
+            "title": "Code",
+            "type": "string"
+          },
+          "email": {
+            "format": "email",
+            "title": "Email",
+            "type": "string"
+          }
+        },
+        "required": [
+          "email",
+          "code"
+        ],
+        "title": "VerifyConfirmSchema",
+        "type": "object"
+      },
+      "VerifyHumanRequest": {
+        "properties": {
+          "turnstile_token": {
+            "maxLength": 4096,
+            "minLength": 1,
+            "title": "Turnstile Token",
+            "type": "string"
+          }
+        },
+        "required": [
+          "turnstile_token"
+        ],
+        "title": "VerifyHumanRequest",
+        "type": "object"
+      },
+      "VerifyHumanResponse": {
+        "properties": {
+          "expires_in": {
+            "title": "Expires In",
+            "type": "integer"
+          },
+          "verified": {
+            "title": "Verified",
+            "type": "boolean"
+          }
+        },
+        "required": [
+          "expires_in",
+          "verified"
+        ],
+        "title": "VerifyHumanResponse",
+        "type": "object"
+      },
+      "VerifyRequestResponse": {
+        "properties": {
+          "sent": {
+            "title": "Sent",
+            "type": "boolean"
+          }
+        },
+        "required": [
+          "sent"
+        ],
+        "title": "VerifyRequestResponse",
+        "type": "object"
+      },
+      "VerifyRequestSchema": {
+        "properties": {
+          "email": {
+            "format": "email",
+            "title": "Email",
+            "type": "string"
+          },
+          "turnstile_token": {
+            "maxLength": 4096,
+            "minLength": 1,
+            "title": "Turnstile Token",
+            "type": "string"
+          }
+        },
+        "required": [
+          "email",
+          "turnstile_token"
+        ],
+        "title": "VerifyRequestSchema",
+        "type": "object"
+      },
+      "VerifyStatusResponse": {
+        "description": "Reports whether the caller has a valid wrzdj_human cookie.",
+        "properties": {
+          "expires_in": {
+            "default": 0,
+            "title": "Expires In",
+            "type": "integer"
+          },
+          "verified": {
+            "title": "Verified",
+            "type": "boolean"
+          }
+        },
+        "required": [
+          "expires_in",
+          "verified"
+        ],
+        "title": "VerifyStatusResponse",
+        "type": "object"
+      },
+      "VoteResponse": {
+        "properties": {
+          "has_voted": {
+            "title": "Has Voted",
+            "type": "boolean"
+          },
+          "status": {
+            "title": "Status",
+            "type": "string"
+          },
+          "vote_count": {
+            "title": "Vote Count",
+            "type": "integer"
+          }
+        },
+        "required": [
+          "has_voted",
+          "status",
+          "vote_count"
+        ],
+        "title": "VoteResponse",
+        "type": "object"
+      }
+    },
+    "securitySchemes": {
+      "OAuth2PasswordBearer": {
+        "flows": {
+          "password": {
+            "scopes": {},
+            "tokenUrl": "/api/auth/login"
+          }
+        },
+        "type": "oauth2"
+      }
+    }
+  },
+  "info": {
+    "description": "Song request system for DJs",
+    "title": "WrzDJ API",
+    "version": "0.1.0"
+  },
+  "openapi": "3.1.0",
+  "paths": {
+    "/api/admin/ai/models": {
+      "get": {
+        "description": "List available AI models.",
+        "operationId": "admin_get_ai_models_api_admin_ai_models_get",
+        "responses": {
+          "200": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/AIModelsResponse"
+                }
+              }
+            },
+            "description": "Successful Response"
+          }
+        },
+        "security": [
+          {
+            "OAuth2PasswordBearer": []
+          }
+        ],
+        "summary": "Admin Get Ai Models",
+        "tags": [
+          "admin"
+        ]
+      }
+    },
+    "/api/admin/ai/settings": {
+      "get": {
+        "description": "Get AI/LLM configuration.",
+        "operationId": "admin_get_ai_settings_api_admin_ai_settings_get",
+        "responses": {
+          "200": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/AISettingsOut"
+                }
+              }
+            },
+            "description": "Successful Response"
+          }
+        },
+        "security": [
+          {
+            "OAuth2PasswordBearer": []
+          }
+        ],
+        "summary": "Admin Get Ai Settings",
+        "tags": [
+          "admin"
+        ]
+      },
+      "put": {
+        "description": "Update AI/LLM configuration.",
+        "operationId": "admin_update_ai_settings_api_admin_ai_settings_put",
+        "requestBody": {
+          "content": {
+            "application/json": {
+              "schema": {
+                "$ref": "#/components/schemas/AISettingsUpdate"
+              }
+            }
+          },
+          "required": true
+        },
+        "responses": {
+          "200": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/AISettingsOut"
+                }
+              }
+            },
+            "description": "Successful Response"
+          },
+          "422": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/HTTPValidationError"
+                }
+              }
+            },
+            "description": "Validation Error"
+          }
+        },
+        "security": [
+          {
+            "OAuth2PasswordBearer": []
+          }
+        ],
+        "summary": "Admin Update Ai Settings",
+        "tags": [
+          "admin"
+        ]
+      }
+    },
+    "/api/admin/events": {
+      "get": {
+        "operationId": "admin_list_events_api_admin_events_get",
+        "parameters": [
+          {
+            "in": "query",
+            "name": "page",
+            "required": false,
+            "schema": {
+              "default": 1,
+              "maximum": 1000,
+              "minimum": 1,
+              "title": "Page",
+              "type": "integer"
+            }
+          },
+          {
+            "in": "query",
+            "name": "limit",
+            "required": false,
+            "schema": {
+              "default": 20,
+              "maximum": 100,
+              "minimum": 1,
+              "title": "Limit",
+              "type": "integer"
+            }
+          }
+        ],
+        "responses": {
+          "200": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/PaginatedResponse"
+                }
+              }
+            },
+            "description": "Successful Response"
+          },
+          "422": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/HTTPValidationError"
+                }
+              }
+            },
+            "description": "Validation Error"
+          }
+        },
+        "security": [
+          {
+            "OAuth2PasswordBearer": []
+          }
+        ],
+        "summary": "Admin List Events",
+        "tags": [
+          "admin"
+        ]
+      }
+    },
+    "/api/admin/events/bulk-delete": {
+      "post": {
+        "description": "Admin can bulk delete events from any owner.",
+        "operationId": "admin_bulk_delete_events_api_admin_events_bulk_delete_post",
+        "requestBody": {
+          "content": {
+            "application/json": {
+              "schema": {
+                "$ref": "#/components/schemas/BulkDeleteEventsRequest"
+              }
+            }
+          },
+          "required": true
+        },
+        "responses": {
+          "200": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/BulkActionResponse"
+                }
+              }
+            },
+            "description": "Successful Response"
+          },
+          "422": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/HTTPValidationError"
+                }
+              }
+            },
+            "description": "Validation Error"
+          }
+        },
+        "security": [
+          {
+            "OAuth2PasswordBearer": []
+          }
+        ],
+        "summary": "Admin Bulk Delete Events",
+        "tags": [
+          "admin"
+        ]
+      }
+    },
+    "/api/admin/events/{code}": {
+      "delete": {
+        "description": "Admin can delete any event.",
+        "operationId": "admin_delete_event_api_admin_events__code__delete",
+        "parameters": [
+          {
+            "in": "path",
+            "name": "code",
+            "required": true,
+            "schema": {
+              "title": "Code",
+              "type": "string"
+            }
+          }
+        ],
+        "responses": {
+          "204": {
+            "description": "Successful Response"
+          },
+          "422": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/HTTPValidationError"
+                }
+              }
+            },
+            "description": "Validation Error"
+          }
+        },
+        "security": [
+          {
+            "OAuth2PasswordBearer": []
+          }
+        ],
+        "summary": "Admin Delete Event",
+        "tags": [
+          "admin"
+        ]
+      },
+      "patch": {
+        "description": "Admin can edit any event (not just their own).",
+        "operationId": "admin_update_event_api_admin_events__code__patch",
+        "parameters": [
+          {
+            "in": "path",
+            "name": "code",
+            "required": true,
+            "schema": {
+              "title": "Code",
+              "type": "string"
+            }
+          }
+        ],
+        "requestBody": {
+          "content": {
+            "application/json": {
+              "schema": {
+                "$ref": "#/components/schemas/EventUpdate"
+              }
+            }
+          },
+          "required": true
+        },
+        "responses": {
+          "200": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/AdminEventOut"
+                }
+              }
+            },
+            "description": "Successful Response"
+          },
+          "422": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/HTTPValidationError"
+                }
+              }
+            },
+            "description": "Validation Error"
+          }
+        },
+        "security": [
+          {
+            "OAuth2PasswordBearer": []
+          }
+        ],
+        "summary": "Admin Update Event",
+        "tags": [
+          "admin"
+        ]
+      }
+    },
+    "/api/admin/integrations": {
+      "get": {
+        "description": "Get status of all external integrations (no active health checks).",
+        "operationId": "admin_get_integrations_api_admin_integrations_get",
+        "responses": {
+          "200": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/IntegrationHealthResponse"
+                }
+              }
+            },
+            "description": "Successful Response"
+          }
+        },
+        "security": [
+          {
+            "OAuth2PasswordBearer": []
+          }
+        ],
+        "summary": "Admin Get Integrations",
+        "tags": [
+          "admin"
+        ]
+      }
+    },
+    "/api/admin/integrations/{service}": {
+      "patch": {
+        "description": "Enable or disable a specific integration.",
+        "operationId": "admin_toggle_integration_api_admin_integrations__service__patch",
+        "parameters": [
+          {
+            "in": "path",
+            "name": "service",
+            "required": true,
+            "schema": {
+              "title": "Service",
+              "type": "string"
+            }
+          }
+        ],
+        "requestBody": {
+          "content": {
+            "application/json": {
+              "schema": {
+                "$ref": "#/components/schemas/IntegrationToggleRequest"
+              }
+            }
+          },
+          "required": true
+        },
+        "responses": {
+          "200": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/IntegrationToggleResponse"
+                }
+              }
+            },
+            "description": "Successful Response"
+          },
+          "422": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/HTTPValidationError"
+                }
+              }
+            },
+            "description": "Validation Error"
+          }
+        },
+        "security": [
+          {
+            "OAuth2PasswordBearer": []
+          }
+        ],
+        "summary": "Admin Toggle Integration",
+        "tags": [
+          "admin"
+        ]
+      }
+    },
+    "/api/admin/integrations/{service}/check": {
+      "post": {
+        "description": "Run an active health check for a specific service (rate limited).",
+        "operationId": "admin_check_integration_api_admin_integrations__service__check_post",
+        "parameters": [
+          {
+            "in": "path",
+            "name": "service",
+            "required": true,
+            "schema": {
+              "title": "Service",
+              "type": "string"
+            }
+          }
+        ],
+        "responses": {
+          "200": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/IntegrationCheckResponse"
+                }
+              }
+            },
+            "description": "Successful Response"
+          },
+          "422": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/HTTPValidationError"
+                }
+              }
+            },
+            "description": "Validation Error"
+          }
+        },
+        "security": [
+          {
+            "OAuth2PasswordBearer": []
+          }
+        ],
+        "summary": "Admin Check Integration",
+        "tags": [
+          "admin"
+        ]
+      }
+    },
+    "/api/admin/llm/audit": {
+      "get": {
+        "description": "Browse the LLM audit trail (admin-only).\n\nRead-only view over ``llm_audit_event`` with optional filters and\npagination. The target connector's display name is joined in \u2014 credential\nmaterial is never read or returned.",
+        "operationId": "list_audit_events_api_admin_llm_audit_get",
+        "parameters": [
+          {
+            "in": "query",
+            "name": "event_type",
+            "required": false,
+            "schema": {
+              "anyOf": [
+                {
+                  "maxLength": 60,
+                  "type": "string"
+                },
+                {
+                  "type": "null"
+                }
+              ],
+              "title": "Event Type"
+            }
+          },
+          {
+            "in": "query",
+            "name": "actor_user_id",
+            "required": false,
+            "schema": {
+              "anyOf": [
+                {
+                  "minimum": 1,
+                  "type": "integer"
+                },
+                {
+                  "type": "null"
+                }
+              ],
+              "title": "Actor User Id"
+            }
+          },
+          {
+            "in": "query",
+            "name": "target_connector_id",
+            "required": false,
+            "schema": {
+              "anyOf": [
+                {
+                  "minimum": 1,
+                  "type": "integer"
+                },
+                {
+                  "type": "null"
+                }
+              ],
+              "title": "Target Connector Id"
+            }
+          },
+          {
+            "in": "query",
+            "name": "days",
+            "required": false,
+            "schema": {
+              "default": 30,
+              "maximum": 3650,
+              "minimum": 1,
+              "title": "Days",
+              "type": "integer"
+            }
+          },
+          {
+            "in": "query",
+            "name": "limit",
+            "required": false,
+            "schema": {
+              "default": 50,
+              "maximum": 200,
+              "minimum": 1,
+              "title": "Limit",
+              "type": "integer"
+            }
+          },
+          {
+            "in": "query",
+            "name": "offset",
+            "required": false,
+            "schema": {
+              "default": 0,
+              "minimum": 0,
+              "title": "Offset",
+              "type": "integer"
+            }
+          }
+        ],
+        "responses": {
+          "200": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/AdminAuditOut"
+                }
+              }
+            },
+            "description": "Successful Response"
+          },
+          "422": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/HTTPValidationError"
+                }
+              }
+            },
+            "description": "Validation Error"
+          }
+        },
+        "security": [
+          {
+            "OAuth2PasswordBearer": []
+          }
+        ],
+        "summary": "List Audit Events",
+        "tags": [
+          "admin",
+          "llm"
+        ]
+      }
+    },
+    "/api/admin/llm/audit.csv": {
+      "get": {
+        "description": "Export the (filtered) audit trail as CSV (admin-only).\n\nHonors the same filters as ``GET /audit``. Capped at\n``_AUDIT_CSV_ROW_CAP`` rows to avoid unbounded streaming. Columns:\ntimestamp, actor, event_type, target_connector, notes. Never includes\ncredential material.",
+        "operationId": "export_audit_events_csv_api_admin_llm_audit_csv_get",
+        "parameters": [
+          {
+            "in": "query",
+            "name": "event_type",
+            "required": false,
+            "schema": {
+              "anyOf": [
+                {
+                  "maxLength": 60,
+                  "type": "string"
+                },
+                {
+                  "type": "null"
+                }
+              ],
+              "title": "Event Type"
+            }
+          },
+          {
+            "in": "query",
+            "name": "actor_user_id",
+            "required": false,
+            "schema": {
+              "anyOf": [
+                {
+                  "minimum": 1,
+                  "type": "integer"
+                },
+                {
+                  "type": "null"
+                }
+              ],
+              "title": "Actor User Id"
+            }
+          },
+          {
+            "in": "query",
+            "name": "target_connector_id",
+            "required": false,
+            "schema": {
+              "anyOf": [
+                {
+                  "minimum": 1,
+                  "type": "integer"
+                },
+                {
+                  "type": "null"
+                }
+              ],
+              "title": "Target Connector Id"
+            }
+          },
+          {
+            "in": "query",
+            "name": "days",
+            "required": false,
+            "schema": {
+              "default": 30,
+              "maximum": 3650,
+              "minimum": 1,
+              "title": "Days",
+              "type": "integer"
+            }
+          }
+        ],
+        "responses": {
+          "200": {
+            "content": {
+              "text/csv": {
+                "schema": {
+                  "format": "binary",
+                  "type": "string"
+                }
+              }
+            },
+            "description": "CSV export of the filtered audit trail."
+          },
+          "422": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/HTTPValidationError"
+                }
+              }
+            },
+            "description": "Validation Error"
+          }
+        },
+        "security": [
+          {
+            "OAuth2PasswordBearer": []
+          }
+        ],
+        "summary": "Export Audit Events Csv",
+        "tags": [
+          "admin",
+          "llm"
+        ]
+      }
+    },
+    "/api/admin/llm/connectors": {
+      "get": {
+        "operationId": "list_connectors_admin_api_admin_llm_connectors_get",
+        "responses": {
+          "200": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "items": {
+                    "$ref": "#/components/schemas/AdminConnectorOut"
+                  },
+                  "title": "Response List Connectors Admin Api Admin Llm Connectors Get",
+                  "type": "array"
+                }
+              }
+            },
+            "description": "Successful Response"
+          }
+        },
+        "security": [
+          {
+            "OAuth2PasswordBearer": []
+          }
+        ],
+        "summary": "List Connectors Admin",
+        "tags": [
+          "admin",
+          "llm"
+        ]
+      }
+    },
+    "/api/admin/llm/connectors/{connector_id}/cap": {
+      "patch": {
+        "description": "Set or clear a connector's monthly token cap (admin-only, issue #339).\n\n``monthly_token_cap = null`` clears the cap (unlimited). The change is\npre-flight only: an in-flight gateway call already past its cap check is\nunaffected. Pydantic enforces the non-negative bound (``ge=0``); the\nservice layer re-validates defensively.",
+        "operationId": "set_connector_cap_admin_api_admin_llm_connectors__connector_id__cap_patch",
+        "parameters": [
+          {
+            "in": "path",
+            "name": "connector_id",
+            "required": true,
+            "schema": {
+              "title": "Connector Id",
+              "type": "integer"
+            }
+          }
+        ],
+        "requestBody": {
+          "content": {
+            "application/json": {
+              "schema": {
+                "$ref": "#/components/schemas/AdminConnectorCapPatch"
+              }
+            }
+          },
+          "required": true
+        },
+        "responses": {
+          "200": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/AdminConnectorOut"
+                }
+              }
+            },
+            "description": "Successful Response"
+          },
+          "422": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/HTTPValidationError"
+                }
+              }
+            },
+            "description": "Validation Error"
+          }
+        },
+        "security": [
+          {
+            "OAuth2PasswordBearer": []
+          }
         ],
-        "title": "VerifyRequestResponse",
-        "type": "object"
-      },
-      "VerifyRequestSchema": {
-        "properties": {
-          "email": {
-            "format": "email",
-            "title": "Email",
-            "type": "string"
+        "summary": "Set Connector Cap Admin",
+        "tags": [
+          "admin",
+          "llm"
+        ]
+      }
+    },
+    "/api/admin/llm/connectors/{connector_id}/revoke": {
+      "post": {
+        "operationId": "revoke_connector_admin_api_admin_llm_connectors__connector_id__revoke_post",
+        "parameters": [
+          {
+            "in": "path",
+            "name": "connector_id",
+            "required": true,
+            "schema": {
+              "title": "Connector Id",
+              "type": "integer"
+            }
+          }
+        ],
+        "responses": {
+          "200": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/AdminConnectorOut"
+                }
+              }
+            },
+            "description": "Successful Response"
           },
-          "turnstile_token": {
-            "maxLength": 4096,
-            "minLength": 1,
-            "title": "Turnstile Token",
-            "type": "string"
+          "422": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/HTTPValidationError"
+                }
+              }
+            },
+            "description": "Validation Error"
           }
         },
-        "required": [
-          "email",
-          "turnstile_token"
+        "security": [
+          {
+            "OAuth2PasswordBearer": []
+          }
         ],
-        "title": "VerifyRequestSchema",
-        "type": "object"
-      },
-      "VerifyStatusResponse": {
-        "description": "Reports whether the caller has a valid wrzdj_human cookie.",
-        "properties": {
-          "expires_in": {
-            "default": 0,
-            "title": "Expires In",
-            "type": "integer"
-          },
-          "verified": {
-            "title": "Verified",
-            "type": "boolean"
+        "summary": "Revoke Connector Admin",
+        "tags": [
+          "admin",
+          "llm"
+        ]
+      }
+    },
+    "/api/admin/llm/policy": {
+      "get": {
+        "operationId": "get_policy_api_admin_llm_policy_get",
+        "responses": {
+          "200": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/AdminPolicyOut"
+                }
+              }
+            },
+            "description": "Successful Response"
           }
         },
-        "required": [
-          "expires_in",
-          "verified"
+        "security": [
+          {
+            "OAuth2PasswordBearer": []
+          }
         ],
-        "title": "VerifyStatusResponse",
-        "type": "object"
+        "summary": "Get Policy",
+        "tags": [
+          "admin",
+          "llm"
+        ]
       },
-      "VoteResponse": {
-        "properties": {
-          "has_voted": {
-            "title": "Has Voted",
-            "type": "boolean"
+      "patch": {
+        "operationId": "patch_policy_api_admin_llm_policy_patch",
+        "requestBody": {
+          "content": {
+            "application/json": {
+              "schema": {
+                "$ref": "#/components/schemas/AdminPolicyPatch"
+              }
+            }
           },
-          "status": {
-            "title": "Status",
-            "type": "string"
+          "required": true
+        },
+        "responses": {
+          "200": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/AdminPolicyOut"
+                }
+              }
+            },
+            "description": "Successful Response"
           },
-          "vote_count": {
-            "title": "Vote Count",
-            "type": "integer"
+          "422": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/HTTPValidationError"
+                }
+              }
+            },
+            "description": "Validation Error"
           }
         },
-        "required": [
-          "has_voted",
-          "status",
-          "vote_count"
+        "security": [
+          {
+            "OAuth2PasswordBearer": []
+          }
         ],
-        "title": "VoteResponse",
-        "type": "object"
+        "summary": "Patch Policy",
+        "tags": [
+          "admin",
+          "llm"
+        ]
       }
     },
-    "securitySchemes": {
-      "OAuth2PasswordBearer": {
-        "flows": {
-          "password": {
-            "scopes": {},
-            "tokenUrl": "/api/auth/login"
-          }
-        },
-        "type": "oauth2"
-      }
-    }
-  },
-  "info": {
-    "description": "Song request system for DJs",
-    "title": "WrzDJ API",
-    "version": "0.1.0"
-  },
-  "openapi": "3.1.0",
-  "paths": {
-    "/api/admin/ai/models": {
+    "/api/admin/llm/usage": {
       "get": {
-        "description": "List available AI models.",
-        "operationId": "admin_get_ai_models_api_admin_ai_models_get",
+        "operationId": "get_usage_api_admin_llm_usage_get",
+        "parameters": [
+          {
+            "in": "query",
+            "name": "days",
+            "required": false,
+            "schema": {
+              "default": 30,
+              "maximum": 180,
+              "minimum": 1,
+              "title": "Days",
+              "type": "integer"
+            }
+          }
+        ],
         "responses": {
           "200": {
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/AIModelsResponse"
+                  "$ref": "#/components/schemas/AdminUsageOut"
                 }
               }
             },
             "description": "Successful Response"
+          },
+          "422": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/HTTPValidationError"
+                }
+              }
+            },
+            "description": "Validation Error"
           }
         },
         "security": [
@@ -5636,22 +7889,22 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Admin Get Ai Models",
+        "summary": "Get Usage",
         "tags": [
-          "admin"
+          "admin",
+          "llm"
         ]
       }
     },
-    "/api/admin/ai/settings": {
+    "/api/admin/settings": {
       "get": {
-        "description": "Get AI/LLM configuration.",
-        "operationId": "admin_get_ai_settings_api_admin_ai_settings_get",
+        "operationId": "admin_get_settings_api_admin_settings_get",
         "responses": {
           "200": {
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/AISettingsOut"
+                  "$ref": "#/components/schemas/SystemSettingsOut"
                 }
               }
             },
@@ -5663,19 +7916,18 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Admin Get Ai Settings",
+        "summary": "Admin Get Settings",
         "tags": [
           "admin"
         ]
       },
-      "put": {
-        "description": "Update AI/LLM configuration.",
-        "operationId": "admin_update_ai_settings_api_admin_ai_settings_put",
+      "patch": {
+        "operationId": "admin_update_settings_api_admin_settings_patch",
         "requestBody": {
           "content": {
             "application/json": {
               "schema": {
-                "$ref": "#/components/schemas/AISettingsUpdate"
+                "$ref": "#/components/schemas/SystemSettingsUpdate"
               }
             }
           },
@@ -5686,7 +7938,7 @@
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/AISettingsOut"
+                  "$ref": "#/components/schemas/SystemSettingsOut"
                 }
               }
             },
@@ -5708,15 +7960,41 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Admin Update Ai Settings",
+        "summary": "Admin Update Settings",
         "tags": [
           "admin"
         ]
       }
     },
-    "/api/admin/events": {
+    "/api/admin/stats": {
       "get": {
-        "operationId": "admin_list_events_api_admin_events_get",
+        "operationId": "admin_stats_api_admin_stats_get",
+        "responses": {
+          "200": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/SystemStats"
+                }
+              }
+            },
+            "description": "Successful Response"
+          }
+        },
+        "security": [
+          {
+            "OAuth2PasswordBearer": []
+          }
+        ],
+        "summary": "Admin Stats",
+        "tags": [
+          "admin"
+        ]
+      }
+    },
+    "/api/admin/users": {
+      "get": {
+        "operationId": "admin_list_users_api_admin_users_get",
         "parameters": [
           {
             "in": "query",
@@ -5735,11 +8013,27 @@
             "name": "limit",
             "required": false,
             "schema": {
-              "default": 20,
-              "maximum": 100,
-              "minimum": 1,
-              "title": "Limit",
-              "type": "integer"
+              "default": 20,
+              "maximum": 100,
+              "minimum": 1,
+              "title": "Limit",
+              "type": "integer"
+            }
+          },
+          {
+            "in": "query",
+            "name": "role",
+            "required": false,
+            "schema": {
+              "anyOf": [
+                {
+                  "type": "string"
+                },
+                {
+                  "type": "null"
+                }
+              ],
+              "title": "Role"
             }
           }
         ],
@@ -5770,32 +8064,29 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Admin List Events",
+        "summary": "Admin List Users",
         "tags": [
           "admin"
         ]
-      }
-    },
-    "/api/admin/events/bulk-delete": {
+      },
       "post": {
-        "description": "Admin can bulk delete events from any owner.",
-        "operationId": "admin_bulk_delete_events_api_admin_events_bulk_delete_post",
+        "operationId": "admin_create_user_api_admin_users_post",
         "requestBody": {
           "content": {
             "application/json": {
               "schema": {
-                "$ref": "#/components/schemas/BulkDeleteEventsRequest"
+                "$ref": "#/components/schemas/AdminUserCreate"
               }
             }
           },
           "required": true
         },
         "responses": {
-          "200": {
+          "201": {
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/BulkActionResponse"
+                  "$ref": "#/components/schemas/AdminUserOut"
                 }
               }
             },
@@ -5817,24 +8108,23 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Admin Bulk Delete Events",
+        "summary": "Admin Create User",
         "tags": [
           "admin"
         ]
       }
     },
-    "/api/admin/events/{code}": {
+    "/api/admin/users/{user_id}": {
       "delete": {
-        "description": "Admin can delete any event.",
-        "operationId": "admin_delete_event_api_admin_events__code__delete",
+        "operationId": "admin_delete_user_api_admin_users__user_id__delete",
         "parameters": [
           {
             "in": "path",
-            "name": "code",
+            "name": "user_id",
             "required": true,
             "schema": {
-              "title": "Code",
-              "type": "string"
+              "title": "User Id",
+              "type": "integer"
             }
           }
         ],
@@ -5858,22 +8148,21 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Admin Delete Event",
+        "summary": "Admin Delete User",
         "tags": [
           "admin"
         ]
       },
       "patch": {
-        "description": "Admin can edit any event (not just their own).",
-        "operationId": "admin_update_event_api_admin_events__code__patch",
+        "operationId": "admin_update_user_api_admin_users__user_id__patch",
         "parameters": [
           {
             "in": "path",
-            "name": "code",
+            "name": "user_id",
             "required": true,
             "schema": {
-              "title": "Code",
-              "type": "string"
+              "title": "User Id",
+              "type": "integer"
             }
           }
         ],
@@ -5881,7 +8170,7 @@
           "content": {
             "application/json": {
               "schema": {
-                "$ref": "#/components/schemas/EventUpdate"
+                "$ref": "#/components/schemas/AdminUserUpdate"
               }
             }
           },
@@ -5892,7 +8181,7 @@
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/AdminEventOut"
+                  "$ref": "#/components/schemas/AdminUserOut"
                 }
               }
             },
@@ -5914,70 +8203,32 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Admin Update Event",
+        "summary": "Admin Update User",
         "tags": [
           "admin"
         ]
       }
     },
-    "/api/admin/integrations": {
+    "/api/auth/email/confirm": {
       "get": {
-        "description": "Get status of all external integrations (no active health checks).",
-        "operationId": "admin_get_integrations_api_admin_integrations_get",
-        "responses": {
-          "200": {
-            "content": {
-              "application/json": {
-                "schema": {
-                  "$ref": "#/components/schemas/IntegrationHealthResponse"
-                }
-              }
-            },
-            "description": "Successful Response"
-          }
-        },
-        "security": [
-          {
-            "OAuth2PasswordBearer": []
-          }
-        ],
-        "summary": "Admin Get Integrations",
-        "tags": [
-          "admin"
-        ]
-      }
-    },
-    "/api/admin/integrations/{service}": {
-      "patch": {
-        "description": "Enable or disable a specific integration.",
-        "operationId": "admin_toggle_integration_api_admin_integrations__service__patch",
+        "operationId": "confirm_email_change_api_auth_email_confirm_get",
         "parameters": [
           {
-            "in": "path",
-            "name": "service",
+            "in": "query",
+            "name": "token",
             "required": true,
             "schema": {
-              "title": "Service",
+              "title": "Token",
               "type": "string"
             }
           }
         ],
-        "requestBody": {
-          "content": {
-            "application/json": {
-              "schema": {
-                "$ref": "#/components/schemas/IntegrationToggleRequest"
-              }
-            }
-          },
-          "required": true
-        },
         "responses": {
           "200": {
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/IntegrationToggleResponse"
+                  "$ref": "#/components/schemas/StatusMessageResponse"
                 }
               }
             },
@@ -5994,38 +8245,32 @@
             "description": "Validation Error"
           }
         },
-        "security": [
-          {
-            "OAuth2PasswordBearer": []
-          }
-        ],
-        "summary": "Admin Toggle Integration",
+        "summary": "Confirm Email Change",
         "tags": [
-          "admin"
+          "auth"
         ]
       }
     },
-    "/api/admin/integrations/{service}/check": {
+    "/api/auth/help-seen": {
       "post": {
-        "description": "Run an active health check for a specific service (rate limited).",
-        "operationId": "admin_check_integration_api_admin_integrations__service__check_post",
-        "parameters": [
-          {
-            "in": "path",
-            "name": "service",
-            "required": true,
-            "schema": {
-              "title": "Service",
-              "type": "string"
+        "description": "Mark a help page as seen for the current user.",
+        "operationId": "mark_help_page_seen_api_auth_help_seen_post",
+        "requestBody": {
+          "content": {
+            "application/json": {
+              "schema": {
+                "$ref": "#/components/schemas/HelpPageSeenRequest"
+              }
             }
-          }
-        ],
+          },
+          "required": true
+        },
         "responses": {
           "200": {
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/IntegrationCheckResponse"
+                  "$ref": "#/components/schemas/StatusMessageResponse"
                 }
               }
             },
@@ -6047,44 +8292,20 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Admin Check Integration",
+        "summary": "Mark Help Page Seen",
         "tags": [
-          "admin"
+          "auth"
         ]
       }
     },
-    "/api/admin/settings": {
-      "get": {
-        "operationId": "admin_get_settings_api_admin_settings_get",
-        "responses": {
-          "200": {
-            "content": {
-              "application/json": {
-                "schema": {
-                  "$ref": "#/components/schemas/SystemSettingsOut"
-                }
-              }
-            },
-            "description": "Successful Response"
-          }
-        },
-        "security": [
-          {
-            "OAuth2PasswordBearer": []
-          }
-        ],
-        "summary": "Admin Get Settings",
-        "tags": [
-          "admin"
-        ]
-      },
-      "patch": {
-        "operationId": "admin_update_settings_api_admin_settings_patch",
+    "/api/auth/login": {
+      "post": {
+        "operationId": "login_api_auth_login_post",
         "requestBody": {
           "content": {
-            "application/json": {
+            "application/x-www-form-urlencoded": {
               "schema": {
-                "$ref": "#/components/schemas/SystemSettingsUpdate"
+                "$ref": "#/components/schemas/Body_login_api_auth_login_post"
               }
             }
           },
@@ -6095,7 +8316,7 @@
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/SystemSettingsOut"
+                  "$ref": "#/components/schemas/Token"
                 }
               }
             },
@@ -6112,26 +8333,22 @@
             "description": "Validation Error"
           }
         },
-        "security": [
-          {
-            "OAuth2PasswordBearer": []
-          }
-        ],
-        "summary": "Admin Update Settings",
+        "summary": "Login",
         "tags": [
-          "admin"
+          "auth"
         ]
       }
     },
-    "/api/admin/stats": {
-      "get": {
-        "operationId": "admin_stats_api_admin_stats_get",
+    "/api/auth/logout": {
+      "post": {
+        "description": "Invalidate all outstanding JWTs for the current user.\n\nSECURITY (CRIT-2): bumps token_version so every previously-issued JWT\nfor this user fails the version check in get_current_user.",
+        "operationId": "logout_api_auth_logout_post",
         "responses": {
           "200": {
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/SystemStats"
+                  "$ref": "#/components/schemas/StatusMessageResponse"
                 }
               }
             },
@@ -6143,77 +8360,25 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Admin Stats",
-        "tags": [
-          "admin"
-        ]
-      }
-    },
-    "/api/admin/users": {
-      "get": {
-        "operationId": "admin_list_users_api_admin_users_get",
-        "parameters": [
-          {
-            "in": "query",
-            "name": "page",
-            "required": false,
-            "schema": {
-              "default": 1,
-              "maximum": 1000,
-              "minimum": 1,
-              "title": "Page",
-              "type": "integer"
-            }
-          },
-          {
-            "in": "query",
-            "name": "limit",
-            "required": false,
-            "schema": {
-              "default": 20,
-              "maximum": 100,
-              "minimum": 1,
-              "title": "Limit",
-              "type": "integer"
-            }
-          },
-          {
-            "in": "query",
-            "name": "role",
-            "required": false,
-            "schema": {
-              "anyOf": [
-                {
-                  "type": "string"
-                },
-                {
-                  "type": "null"
-                }
-              ],
-              "title": "Role"
-            }
-          }
-        ],
+        "summary": "Logout",
+        "tags": [
+          "auth"
+        ]
+      }
+    },
+    "/api/auth/me": {
+      "get": {
+        "operationId": "get_me_api_auth_me_get",
         "responses": {
           "200": {
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/PaginatedResponse"
+                  "$ref": "#/components/schemas/UserOut"
                 }
               }
             },
             "description": "Successful Response"
-          },
-          "422": {
-            "content": {
-              "application/json": {
-                "schema": {
-                  "$ref": "#/components/schemas/HTTPValidationError"
-                }
-              }
-            },
-            "description": "Validation Error"
           }
         },
         "security": [
@@ -6221,29 +8386,31 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Admin List Users",
+        "summary": "Get Me",
         "tags": [
-          "admin"
+          "auth"
         ]
-      },
+      }
+    },
+    "/api/auth/me/email/request": {
       "post": {
-        "operationId": "admin_create_user_api_admin_users_post",
+        "operationId": "request_email_change_api_auth_me_email_request_post",
         "requestBody": {
           "content": {
             "application/json": {
               "schema": {
-                "$ref": "#/components/schemas/AdminUserCreate"
+                "$ref": "#/components/schemas/RequestEmailChangeRequest"
               }
             }
           },
           "required": true
         },
         "responses": {
-          "201": {
+          "200": {
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/AdminUserOut"
+                  "$ref": "#/components/schemas/StatusMessageResponse"
                 }
               }
             },
@@ -6265,28 +8432,34 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Admin Create User",
+        "summary": "Request Email Change",
         "tags": [
-          "admin"
+          "auth"
         ]
       }
     },
-    "/api/admin/users/{user_id}": {
-      "delete": {
-        "operationId": "admin_delete_user_api_admin_users__user_id__delete",
-        "parameters": [
-          {
-            "in": "path",
-            "name": "user_id",
-            "required": true,
-            "schema": {
-              "title": "User Id",
-              "type": "integer"
+    "/api/auth/me/password": {
+      "patch": {
+        "operationId": "change_password_api_auth_me_password_patch",
+        "requestBody": {
+          "content": {
+            "application/json": {
+              "schema": {
+                "$ref": "#/components/schemas/ChangePasswordRequest"
+              }
             }
-          }
-        ],
+          },
+          "required": true
+        },
         "responses": {
-          "204": {
+          "200": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/StatusMessageResponse"
+                }
+              }
+            },
             "description": "Successful Response"
           },
           "422": {
@@ -6305,29 +8478,20 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Admin Delete User",
+        "summary": "Change Password",
         "tags": [
-          "admin"
+          "auth"
         ]
-      },
+      }
+    },
+    "/api/auth/me/preferences": {
       "patch": {
-        "operationId": "admin_update_user_api_admin_users__user_id__patch",
-        "parameters": [
-          {
-            "in": "path",
-            "name": "user_id",
-            "required": true,
-            "schema": {
-              "title": "User Id",
-              "type": "integer"
-            }
-          }
-        ],
+        "operationId": "update_me_preferences_api_auth_me_preferences_patch",
         "requestBody": {
           "content": {
             "application/json": {
               "schema": {
-                "$ref": "#/components/schemas/AdminUserUpdate"
+                "$ref": "#/components/schemas/MePreferencesUpdate"
               }
             }
           },
@@ -6338,7 +8502,7 @@
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/AdminUserOut"
+                  "$ref": "#/components/schemas/UserOut"
                 }
               }
             },
@@ -6360,26 +8524,26 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Admin Update User",
+        "summary": "Update Me Preferences",
         "tags": [
-          "admin"
+          "auth"
         ]
       }
     },
-    "/api/auth/email/confirm": {
-      "get": {
-        "operationId": "confirm_email_change_api_auth_email_confirm_get",
-        "parameters": [
-          {
-            "in": "query",
-            "name": "token",
-            "required": true,
-            "schema": {
-              "title": "Token",
-              "type": "string"
+    "/api/auth/register": {
+      "post": {
+        "description": "Register a new user (pending approval).",
+        "operationId": "register_api_auth_register_post",
+        "requestBody": {
+          "content": {
+            "application/json": {
+              "schema": {
+                "$ref": "#/components/schemas/RegisterRequest"
+              }
             }
-          }
-        ],
+          },
+          "required": true
+        },
         "responses": {
           "200": {
             "content": {
@@ -6402,21 +8566,43 @@
             "description": "Validation Error"
           }
         },
-        "summary": "Confirm Email Change",
+        "summary": "Register",
         "tags": [
           "auth"
         ]
       }
     },
-    "/api/auth/help-seen": {
+    "/api/auth/settings": {
+      "get": {
+        "description": "Public endpoint returning registration status and Turnstile site key.",
+        "operationId": "get_public_settings_api_auth_settings_get",
+        "responses": {
+          "200": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/PublicSettings"
+                }
+              }
+            },
+            "description": "Successful Response"
+          }
+        },
+        "summary": "Get Public Settings",
+        "tags": [
+          "auth"
+        ]
+      }
+    },
+    "/api/beatport/auth/login": {
       "post": {
-        "description": "Mark a help page as seen for the current user.",
-        "operationId": "mark_help_page_seen_api_auth_help_seen_post",
+        "description": "Authenticate with Beatport using username/password.\n\nThe backend logs in to Beatport server-side, obtains an authorization\ncode, exchanges it for tokens, and stores them on the user.",
+        "operationId": "login_beatport_api_beatport_auth_login_post",
         "requestBody": {
           "content": {
             "application/json": {
               "schema": {
-                "$ref": "#/components/schemas/HelpPageSeenRequest"
+                "$ref": "#/components/schemas/BeatportLogin"
               }
             }
           },
@@ -6449,31 +8635,60 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Mark Help Page Seen",
+        "summary": "Login Beatport",
         "tags": [
-          "auth"
+          "beatport"
         ]
       }
     },
-    "/api/auth/login": {
+    "/api/beatport/disconnect": {
       "post": {
-        "operationId": "login_api_auth_login_post",
-        "requestBody": {
-          "content": {
-            "application/x-www-form-urlencoded": {
-              "schema": {
-                "$ref": "#/components/schemas/Body_login_api_auth_login_post"
+        "description": "Unlink Beatport account from current user.",
+        "operationId": "disconnect_api_beatport_disconnect_post",
+        "responses": {
+          "200": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/StatusMessageResponse"
+                }
               }
-            }
-          },
-          "required": true
+            },
+            "description": "Successful Response"
+          }
         },
+        "security": [
+          {
+            "OAuth2PasswordBearer": []
+          }
+        ],
+        "summary": "Disconnect",
+        "tags": [
+          "beatport"
+        ]
+      }
+    },
+    "/api/beatport/events/{event_id}/settings": {
+      "get": {
+        "description": "Get Beatport sync settings for an event.",
+        "operationId": "get_event_settings_api_beatport_events__event_id__settings_get",
+        "parameters": [
+          {
+            "in": "path",
+            "name": "event_id",
+            "required": true,
+            "schema": {
+              "title": "Event Id",
+              "type": "integer"
+            }
+          }
+        ],
         "responses": {
           "200": {
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/Token"
+                  "$ref": "#/components/schemas/BeatportEventSettings"
                 }
               }
             },
@@ -6490,52 +8705,60 @@
             "description": "Validation Error"
           }
         },
-        "summary": "Login",
+        "security": [
+          {
+            "OAuth2PasswordBearer": []
+          }
+        ],
+        "summary": "Get Event Settings",
         "tags": [
-          "auth"
+          "beatport"
         ]
-      }
-    },
-    "/api/auth/logout": {
-      "post": {
-        "description": "Invalidate all outstanding JWTs for the current user.\n\nSECURITY (CRIT-2): bumps token_version so every previously-issued JWT\nfor this user fails the version check in get_current_user.",
-        "operationId": "logout_api_auth_logout_post",
+      },
+      "put": {
+        "description": "Update Beatport sync settings for an event.",
+        "operationId": "update_event_settings_api_beatport_events__event_id__settings_put",
+        "parameters": [
+          {
+            "in": "path",
+            "name": "event_id",
+            "required": true,
+            "schema": {
+              "title": "Event Id",
+              "type": "integer"
+            }
+          }
+        ],
+        "requestBody": {
+          "content": {
+            "application/json": {
+              "schema": {
+                "$ref": "#/components/schemas/BeatportEventSettingsUpdate"
+              }
+            }
+          },
+          "required": true
+        },
         "responses": {
           "200": {
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/StatusMessageResponse"
+                  "$ref": "#/components/schemas/BeatportEventSettings"
                 }
               }
             },
             "description": "Successful Response"
-          }
-        },
-        "security": [
-          {
-            "OAuth2PasswordBearer": []
-          }
-        ],
-        "summary": "Logout",
-        "tags": [
-          "auth"
-        ]
-      }
-    },
-    "/api/auth/me": {
-      "get": {
-        "operationId": "get_me_api_auth_me_get",
-        "responses": {
-          "200": {
+          },
+          "422": {
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/UserOut"
+                  "$ref": "#/components/schemas/HTTPValidationError"
                 }
               }
             },
-            "description": "Successful Response"
+            "description": "Validation Error"
           }
         },
         "security": [
@@ -6543,20 +8766,32 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Get Me",
+        "summary": "Update Event Settings",
         "tags": [
-          "auth"
+          "beatport"
         ]
       }
     },
-    "/api/auth/me/email/request": {
+    "/api/beatport/requests/{request_id}/link": {
       "post": {
-        "operationId": "request_email_change_api_auth_me_email_request_post",
+        "description": "Manually link a Beatport track to a request.\n\nVerifies the track exists on Beatport, then stores the\nBeatport URL and metadata in sync_results_json.",
+        "operationId": "link_track_api_beatport_requests__request_id__link_post",
+        "parameters": [
+          {
+            "in": "path",
+            "name": "request_id",
+            "required": true,
+            "schema": {
+              "title": "Request Id",
+              "type": "integer"
+            }
+          }
+        ],
         "requestBody": {
           "content": {
             "application/json": {
               "schema": {
-                "$ref": "#/components/schemas/RequestEmailChangeRequest"
+                "$ref": "#/components/schemas/BeatportManualLink"
               }
             }
           },
@@ -6589,31 +8824,51 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Request Email Change",
+        "summary": "Link Track",
         "tags": [
-          "auth"
+          "beatport"
         ]
       }
     },
-    "/api/auth/me/password": {
-      "patch": {
-        "operationId": "change_password_api_auth_me_password_patch",
-        "requestBody": {
-          "content": {
-            "application/json": {
-              "schema": {
-                "$ref": "#/components/schemas/ChangePasswordRequest"
-              }
+    "/api/beatport/search": {
+      "get": {
+        "description": "Search Beatport for tracks.",
+        "operationId": "search_api_beatport_search_get",
+        "parameters": [
+          {
+            "in": "query",
+            "name": "q",
+            "required": true,
+            "schema": {
+              "maxLength": 200,
+              "minLength": 1,
+              "title": "Q",
+              "type": "string"
             }
           },
-          "required": true
-        },
+          {
+            "in": "query",
+            "name": "limit",
+            "required": false,
+            "schema": {
+              "default": 10,
+              "maximum": 50,
+              "minimum": 1,
+              "title": "Limit",
+              "type": "integer"
+            }
+          }
+        ],
         "responses": {
           "200": {
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/StatusMessageResponse"
+                  "items": {
+                    "$ref": "#/components/schemas/BeatportSearchResult"
+                  },
+                  "title": "Response Search Api Beatport Search Get",
+                  "type": "array"
                 }
               }
             },
@@ -6635,45 +8890,53 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Change Password",
+        "summary": "Search",
         "tags": [
-          "auth"
+          "beatport"
         ]
       }
     },
-    "/api/auth/me/preferences": {
-      "patch": {
-        "operationId": "update_me_preferences_api_auth_me_preferences_patch",
-        "requestBody": {
-          "content": {
-            "application/json": {
-              "schema": {
-                "$ref": "#/components/schemas/MePreferencesUpdate"
-              }
-            }
-          },
-          "required": true
-        },
+    "/api/beatport/status": {
+      "get": {
+        "description": "Check if current user has linked Beatport account.",
+        "operationId": "get_status_api_beatport_status_get",
         "responses": {
           "200": {
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/UserOut"
+                  "$ref": "#/components/schemas/BeatportStatus"
                 }
               }
             },
             "description": "Successful Response"
-          },
-          "422": {
+          }
+        },
+        "security": [
+          {
+            "OAuth2PasswordBearer": []
+          }
+        ],
+        "summary": "Get Status",
+        "tags": [
+          "beatport"
+        ]
+      }
+    },
+    "/api/bridge/apikey": {
+      "get": {
+        "description": "Return the server's bridge API key to an admin user.\n\nThe GUI uses this so the DJ doesn't have to manually paste the key.\nRestricted to admins to prevent non-owners from impersonating the bridge.",
+        "operationId": "get_bridge_api_key_api_bridge_apikey_get",
+        "responses": {
+          "200": {
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/HTTPValidationError"
+                  "$ref": "#/components/schemas/BridgeApiKeyResponse"
                 }
               }
             },
-            "description": "Validation Error"
+            "description": "Successful Response"
           }
         },
         "security": [
@@ -6681,32 +8944,44 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Update Me Preferences",
+        "summary": "Get Bridge Api Key",
         "tags": [
-          "auth"
+          "bridge"
         ]
       }
     },
-    "/api/auth/register": {
-      "post": {
-        "description": "Register a new user (pending approval).",
-        "operationId": "register_api_auth_register_post",
-        "requestBody": {
-          "content": {
-            "application/json": {
-              "schema": {
-                "$ref": "#/components/schemas/RegisterRequest"
-              }
+    "/api/bridge/commands/{code}": {
+      "get": {
+        "description": "Poll and clear pending commands for the bridge.\n\nRequires bridge API key auth. Returns all pending commands and clears the queue.\nRate limited to 30 requests per minute.",
+        "operationId": "get_bridge_commands_api_bridge_commands__code__get",
+        "parameters": [
+          {
+            "in": "path",
+            "name": "code",
+            "required": true,
+            "schema": {
+              "maxLength": 10,
+              "minLength": 1,
+              "title": "Code",
+              "type": "string"
             }
           },
-          "required": true
-        },
+          {
+            "in": "header",
+            "name": "x-bridge-api-key",
+            "required": true,
+            "schema": {
+              "title": "X-Bridge-Api-Key",
+              "type": "string"
+            }
+          }
+        ],
         "responses": {
           "200": {
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/StatusMessageResponse"
+                  "$ref": "#/components/schemas/BridgeCommandsPollResponse"
                 }
               }
             },
@@ -6723,43 +8998,90 @@
             "description": "Validation Error"
           }
         },
-        "summary": "Register",
+        "summary": "Get Bridge Commands",
         "tags": [
-          "auth"
+          "bridge"
         ]
-      }
-    },
-    "/api/auth/settings": {
-      "get": {
-        "description": "Public endpoint returning registration status and Turnstile site key.",
-        "operationId": "get_public_settings_api_auth_settings_get",
+      },
+      "post": {
+        "description": "Queue a command for the bridge to pick up.\n\nRequires JWT auth. The user must own the event or be an admin.\nRate limited to 10 requests per minute.",
+        "operationId": "post_bridge_command_api_bridge_commands__code__post",
+        "parameters": [
+          {
+            "in": "path",
+            "name": "code",
+            "required": true,
+            "schema": {
+              "maxLength": 10,
+              "minLength": 1,
+              "title": "Code",
+              "type": "string"
+            }
+          }
+        ],
+        "requestBody": {
+          "content": {
+            "application/json": {
+              "schema": {
+                "$ref": "#/components/schemas/BridgeCommandRequest"
+              }
+            }
+          },
+          "required": true
+        },
         "responses": {
           "200": {
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/PublicSettings"
+                  "$ref": "#/components/schemas/BridgeCommandResponse"
                 }
               }
             },
             "description": "Successful Response"
+          },
+          "422": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/HTTPValidationError"
+                }
+              }
+            },
+            "description": "Validation Error"
           }
         },
-        "summary": "Get Public Settings",
+        "security": [
+          {
+            "OAuth2PasswordBearer": []
+          }
+        ],
+        "summary": "Post Bridge Command",
         "tags": [
-          "auth"
+          "bridge"
         ]
       }
     },
-    "/api/beatport/auth/login": {
+    "/api/bridge/nowplaying": {
       "post": {
-        "description": "Authenticate with Beatport using username/password.\n\nThe backend logs in to Beatport server-side, obtains an authorization\ncode, exchanges it for tokens, and stores them on the user.",
-        "operationId": "login_beatport_api_beatport_auth_login_post",
+        "description": "Bridge reports a new track playing.\n\nCalled when the DJ loads/plays a new track on their equipment.\nArchives the previous track to play history and updates now_playing.\nRate limited to 60 requests per minute.",
+        "operationId": "post_now_playing_api_bridge_nowplaying_post",
+        "parameters": [
+          {
+            "in": "header",
+            "name": "x-bridge-api-key",
+            "required": true,
+            "schema": {
+              "title": "X-Bridge-Api-Key",
+              "type": "string"
+            }
+          }
+        ],
         "requestBody": {
           "content": {
             "application/json": {
               "schema": {
-                "$ref": "#/components/schemas/BeatportLogin"
+                "$ref": "#/components/schemas/NowPlayingBridgePayload"
               }
             }
           },
@@ -6770,7 +9092,7 @@
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/StatusMessageResponse"
+                  "$ref": "#/components/schemas/StatusResponse"
                 }
               }
             },
@@ -6787,56 +9109,35 @@
             "description": "Validation Error"
           }
         },
-        "security": [
-          {
-            "OAuth2PasswordBearer": []
-          }
-        ],
-        "summary": "Login Beatport",
-        "tags": [
-          "beatport"
-        ]
-      }
-    },
-    "/api/beatport/disconnect": {
-      "post": {
-        "description": "Unlink Beatport account from current user.",
-        "operationId": "disconnect_api_beatport_disconnect_post",
-        "responses": {
-          "200": {
-            "content": {
-              "application/json": {
-                "schema": {
-                  "$ref": "#/components/schemas/StatusMessageResponse"
-                }
-              }
-            },
-            "description": "Successful Response"
-          }
-        },
-        "security": [
-          {
-            "OAuth2PasswordBearer": []
-          }
-        ],
-        "summary": "Disconnect",
+        "summary": "Post Now Playing",
         "tags": [
-          "beatport"
+          "bridge"
         ]
       }
     },
-    "/api/beatport/events/{event_id}/settings": {
-      "get": {
-        "description": "Get Beatport sync settings for an event.",
-        "operationId": "get_event_settings_api_beatport_events__event_id__settings_get",
+    "/api/bridge/nowplaying/{code}": {
+      "delete": {
+        "description": "Bridge signals track ended / deck cleared.\n\nArchives current track to history and clears now_playing.\nRate limited to 60 requests per minute.",
+        "operationId": "delete_now_playing_api_bridge_nowplaying__code__delete",
         "parameters": [
           {
             "in": "path",
-            "name": "event_id",
+            "name": "code",
             "required": true,
             "schema": {
-              "title": "Event Id",
-              "type": "integer"
+              "maxLength": 10,
+              "minLength": 1,
+              "title": "Code",
+              "type": "string"
+            }
+          },
+          {
+            "in": "header",
+            "name": "x-bridge-api-key",
+            "required": true,
+            "schema": {
+              "title": "X-Bridge-Api-Key",
+              "type": "string"
             }
           }
         ],
@@ -6845,7 +9146,7 @@
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/BeatportEventSettings"
+                  "$ref": "#/components/schemas/StatusResponse"
                 }
               }
             },
@@ -6862,27 +9163,24 @@
             "description": "Validation Error"
           }
         },
-        "security": [
-          {
-            "OAuth2PasswordBearer": []
-          }
-        ],
-        "summary": "Get Event Settings",
+        "summary": "Delete Now Playing",
         "tags": [
-          "beatport"
+          "bridge"
         ]
-      },
-      "put": {
-        "description": "Update Beatport sync settings for an event.",
-        "operationId": "update_event_settings_api_beatport_events__event_id__settings_put",
+      }
+    },
+    "/api/bridge/status": {
+      "post": {
+        "description": "Bridge reports connection status.\n\nCalled when bridge connects/disconnects from DJ equipment.\nRate limited to 30 requests per minute.",
+        "operationId": "post_bridge_status_api_bridge_status_post",
         "parameters": [
           {
-            "in": "path",
-            "name": "event_id",
+            "in": "header",
+            "name": "x-bridge-api-key",
             "required": true,
             "schema": {
-              "title": "Event Id",
-              "type": "integer"
+              "title": "X-Bridge-Api-Key",
+              "type": "string"
             }
           }
         ],
@@ -6890,7 +9188,7 @@
           "content": {
             "application/json": {
               "schema": {
-                "$ref": "#/components/schemas/BeatportEventSettingsUpdate"
+                "$ref": "#/components/schemas/BridgeStatusPayload"
               }
             }
           },
@@ -6901,7 +9199,7 @@
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/BeatportEventSettings"
+                  "$ref": "#/components/schemas/StatusResponse"
                 }
               }
             },
@@ -6918,48 +9216,59 @@
             "description": "Validation Error"
           }
         },
+        "summary": "Post Bridge Status",
+        "tags": [
+          "bridge"
+        ]
+      }
+    },
+    "/api/events": {
+      "get": {
+        "operationId": "list_events_api_events_get",
+        "responses": {
+          "200": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "items": {
+                    "$ref": "#/components/schemas/EventOut"
+                  },
+                  "title": "Response List Events Api Events Get",
+                  "type": "array"
+                }
+              }
+            },
+            "description": "Successful Response"
+          }
+        },
         "security": [
           {
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Update Event Settings",
+        "summary": "List Events",
         "tags": [
-          "beatport"
+          "events"
         ]
-      }
-    },
-    "/api/beatport/requests/{request_id}/link": {
+      },
       "post": {
-        "description": "Manually link a Beatport track to a request.\n\nVerifies the track exists on Beatport, then stores the\nBeatport URL and metadata in sync_results_json.",
-        "operationId": "link_track_api_beatport_requests__request_id__link_post",
-        "parameters": [
-          {
-            "in": "path",
-            "name": "request_id",
-            "required": true,
-            "schema": {
-              "title": "Request Id",
-              "type": "integer"
-            }
-          }
-        ],
+        "operationId": "create_new_event_api_events_post",
         "requestBody": {
           "content": {
             "application/json": {
               "schema": {
-                "$ref": "#/components/schemas/BeatportManualLink"
+                "$ref": "#/components/schemas/EventCreate"
               }
             }
           },
           "required": true
         },
         "responses": {
-          "200": {
+          "201": {
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/StatusMessageResponse"
+                  "$ref": "#/components/schemas/EventOut"
                 }
               }
             },
@@ -6981,26 +9290,31 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Link Track",
+        "summary": "Create New Event",
         "tags": [
-          "beatport"
+          "events"
         ]
       }
     },
-    "/api/beatport/search": {
+    "/api/events/activity": {
       "get": {
-        "description": "Search Beatport for tracks.",
-        "operationId": "search_api_beatport_search_get",
+        "description": "Get recent activity log entries for the current user's events.",
+        "operationId": "get_activity_log_api_events_activity_get",
         "parameters": [
           {
             "in": "query",
-            "name": "q",
-            "required": true,
+            "name": "event_code",
+            "required": false,
             "schema": {
-              "maxLength": 200,
-              "minLength": 1,
-              "title": "Q",
-              "type": "string"
+              "anyOf": [
+                {
+                  "type": "string"
+                },
+                {
+                  "type": "null"
+                }
+              ],
+              "title": "Event Code"
             }
           },
           {
@@ -7008,8 +9322,8 @@
             "name": "limit",
             "required": false,
             "schema": {
-              "default": 10,
-              "maximum": 50,
+              "default": 50,
+              "maximum": 200,
               "minimum": 1,
               "title": "Limit",
               "type": "integer"
@@ -7022,9 +9336,9 @@
               "application/json": {
                 "schema": {
                   "items": {
-                    "$ref": "#/components/schemas/BeatportSearchResult"
+                    "$ref": "#/components/schemas/ActivityLogEntry"
                   },
-                  "title": "Response Search Api Beatport Search Get",
+                  "title": "Response Get Activity Log Api Events Activity Get",
                   "type": "array"
                 }
               }
@@ -7047,22 +9361,26 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Search",
+        "summary": "Get Activity Log",
         "tags": [
-          "beatport"
+          "events"
         ]
       }
     },
-    "/api/beatport/status": {
+    "/api/events/archived": {
       "get": {
-        "description": "Check if current user has linked Beatport account.",
-        "operationId": "get_status_api_beatport_status_get",
+        "description": "List all archived and expired events for the current user.",
+        "operationId": "list_archived_events_api_events_archived_get",
         "responses": {
           "200": {
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/BeatportStatus"
+                  "items": {
+                    "$ref": "#/components/schemas/EventOut"
+                  },
+                  "title": "Response List Archived Events Api Events Archived Get",
+                  "type": "array"
                 }
               }
             },
@@ -7074,26 +9392,87 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Get Status",
+        "summary": "List Archived Events",
+        "tags": [
+          "events"
+        ]
+      }
+    },
+    "/api/events/bulk-delete": {
+      "post": {
+        "description": "Bulk delete multiple events owned by the current user.",
+        "operationId": "bulk_delete_events_endpoint_api_events_bulk_delete_post",
+        "requestBody": {
+          "content": {
+            "application/json": {
+              "schema": {
+                "$ref": "#/components/schemas/BulkDeleteEventsRequest"
+              }
+            }
+          },
+          "required": true
+        },
+        "responses": {
+          "200": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/BulkActionResponse"
+                }
+              }
+            },
+            "description": "Successful Response"
+          },
+          "422": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/HTTPValidationError"
+                }
+              }
+            },
+            "description": "Validation Error"
+          }
+        },
+        "security": [
+          {
+            "OAuth2PasswordBearer": []
+          }
+        ],
+        "summary": "Bulk Delete Events Endpoint",
         "tags": [
-          "beatport"
+          "events"
         ]
       }
     },
-    "/api/bridge/apikey": {
-      "get": {
-        "description": "Return the server's bridge API key to an admin user.\n\nThe GUI uses this so the DJ doesn't have to manually paste the key.\nRestricted to admins to prevent non-owners from impersonating the bridge.",
-        "operationId": "get_bridge_api_key_api_bridge_apikey_get",
+    "/api/events/{code}": {
+      "delete": {
+        "description": "Delete an event and all its requests.",
+        "operationId": "delete_event_endpoint_api_events__code__delete",
+        "parameters": [
+          {
+            "in": "path",
+            "name": "code",
+            "required": true,
+            "schema": {
+              "title": "Code",
+              "type": "string"
+            }
+          }
+        ],
         "responses": {
-          "200": {
+          "204": {
+            "description": "Successful Response"
+          },
+          "422": {
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/BridgeApiKeyResponse"
+                  "$ref": "#/components/schemas/HTTPValidationError"
                 }
               }
             },
-            "description": "Successful Response"
+            "description": "Validation Error"
           }
         },
         "security": [
@@ -7101,36 +9480,22 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Get Bridge Api Key",
+        "summary": "Delete Event Endpoint",
         "tags": [
-          "bridge"
+          "events"
         ]
-      }
-    },
-    "/api/bridge/commands/{code}": {
+      },
       "get": {
-        "description": "Poll and clear pending commands for the bridge.\n\nRequires bridge API key auth. Returns all pending commands and clears the queue.\nRate limited to 30 requests per minute.",
-        "operationId": "get_bridge_commands_api_bridge_commands__code__get",
+        "operationId": "get_event_api_events__code__get",
         "parameters": [
           {
             "in": "path",
             "name": "code",
             "required": true,
             "schema": {
-              "maxLength": 10,
-              "minLength": 1,
               "title": "Code",
               "type": "string"
             }
-          },
-          {
-            "in": "header",
-            "name": "x-bridge-api-key",
-            "required": true,
-            "schema": {
-              "title": "X-Bridge-Api-Key",
-              "type": "string"
-            }
           }
         ],
         "responses": {
@@ -7138,7 +9503,7 @@
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/BridgeCommandsPollResponse"
+                  "$ref": "#/components/schemas/EventOut"
                 }
               }
             },
@@ -7155,22 +9520,24 @@
             "description": "Validation Error"
           }
         },
-        "summary": "Get Bridge Commands",
+        "security": [
+          {
+            "OAuth2PasswordBearer": []
+          }
+        ],
+        "summary": "Get Event",
         "tags": [
-          "bridge"
+          "events"
         ]
       },
-      "post": {
-        "description": "Queue a command for the bridge to pick up.\n\nRequires JWT auth. The user must own the event or be an admin.\nRate limited to 10 requests per minute.",
-        "operationId": "post_bridge_command_api_bridge_commands__code__post",
+      "patch": {
+        "operationId": "update_event_endpoint_api_events__code__patch",
         "parameters": [
           {
             "in": "path",
             "name": "code",
             "required": true,
             "schema": {
-              "maxLength": 10,
-              "minLength": 1,
               "title": "Code",
               "type": "string"
             }
@@ -7180,7 +9547,7 @@
           "content": {
             "application/json": {
               "schema": {
-                "$ref": "#/components/schemas/BridgeCommandRequest"
+                "$ref": "#/components/schemas/EventUpdate"
               }
             }
           },
@@ -7191,7 +9558,7 @@
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/BridgeCommandResponse"
+                  "$ref": "#/components/schemas/EventOut"
                 }
               }
             },
@@ -7213,43 +9580,33 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Post Bridge Command",
+        "summary": "Update Event Endpoint",
         "tags": [
-          "bridge"
+          "events"
         ]
       }
     },
-    "/api/bridge/nowplaying": {
+    "/api/events/{code}/archive": {
       "post": {
-        "description": "Bridge reports a new track playing.\n\nCalled when the DJ loads/plays a new track on their equipment.\nArchives the previous track to play history and updates now_playing.\nRate limited to 60 requests per minute.",
-        "operationId": "post_now_playing_api_bridge_nowplaying_post",
+        "description": "Archive an event.",
+        "operationId": "archive_event_endpoint_api_events__code__archive_post",
         "parameters": [
           {
-            "in": "header",
-            "name": "x-bridge-api-key",
+            "in": "path",
+            "name": "code",
             "required": true,
             "schema": {
-              "title": "X-Bridge-Api-Key",
+              "title": "Code",
               "type": "string"
             }
           }
         ],
-        "requestBody": {
-          "content": {
-            "application/json": {
-              "schema": {
-                "$ref": "#/components/schemas/NowPlayingBridgePayload"
-              }
-            }
-          },
-          "required": true
-        },
         "responses": {
           "200": {
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/StatusResponse"
+                  "$ref": "#/components/schemas/EventOut"
                 }
               }
             },
@@ -7266,44 +9623,94 @@
             "description": "Validation Error"
           }
         },
-        "summary": "Post Now Playing",
+        "security": [
+          {
+            "OAuth2PasswordBearer": []
+          }
+        ],
+        "summary": "Archive Event Endpoint",
         "tags": [
-          "bridge"
+          "events"
         ]
       }
     },
-    "/api/bridge/nowplaying/{code}": {
+    "/api/events/{code}/banner": {
       "delete": {
-        "description": "Bridge signals track ended / deck cleared.\n\nArchives current track to history and clears now_playing.\nRate limited to 60 requests per minute.",
-        "operationId": "delete_now_playing_api_bridge_nowplaying__code__delete",
+        "description": "Delete the event's custom banner image.",
+        "operationId": "delete_banner_api_events__code__banner_delete",
         "parameters": [
           {
             "in": "path",
             "name": "code",
             "required": true,
             "schema": {
-              "maxLength": 10,
-              "minLength": 1,
               "title": "Code",
               "type": "string"
             }
+          }
+        ],
+        "responses": {
+          "200": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/EventOut"
+                }
+              }
+            },
+            "description": "Successful Response"
           },
+          "422": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/HTTPValidationError"
+                }
+              }
+            },
+            "description": "Validation Error"
+          }
+        },
+        "security": [
           {
-            "in": "header",
-            "name": "x-bridge-api-key",
+            "OAuth2PasswordBearer": []
+          }
+        ],
+        "summary": "Delete Banner",
+        "tags": [
+          "events"
+        ]
+      },
+      "post": {
+        "description": "Upload a custom banner image for the event.",
+        "operationId": "upload_banner_api_events__code__banner_post",
+        "parameters": [
+          {
+            "in": "path",
+            "name": "code",
             "required": true,
             "schema": {
-              "title": "X-Bridge-Api-Key",
+              "title": "Code",
               "type": "string"
             }
           }
         ],
+        "requestBody": {
+          "content": {
+            "multipart/form-data": {
+              "schema": {
+                "$ref": "#/components/schemas/Body_upload_banner_api_events__code__banner_post"
+              }
+            }
+          },
+          "required": true
+        },
         "responses": {
           "200": {
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/StatusResponse"
+                  "$ref": "#/components/schemas/EventOut"
                 }
               }
             },
@@ -7320,23 +9727,27 @@
             "description": "Validation Error"
           }
         },
-        "summary": "Delete Now Playing",
+        "security": [
+          {
+            "OAuth2PasswordBearer": []
+          }
+        ],
+        "summary": "Upload Banner",
         "tags": [
-          "bridge"
+          "events"
         ]
       }
     },
-    "/api/bridge/status": {
+    "/api/events/{code}/bulk-review": {
       "post": {
-        "description": "Bridge reports connection status.\n\nCalled when bridge connects/disconnects from DJ equipment.\nRate limited to 30 requests per minute.",
-        "operationId": "post_bridge_status_api_bridge_status_post",
+        "operationId": "bulk_review_api_events__code__bulk_review_post",
         "parameters": [
           {
-            "in": "header",
-            "name": "x-bridge-api-key",
+            "in": "path",
+            "name": "code",
             "required": true,
             "schema": {
-              "title": "X-Bridge-Api-Key",
+              "title": "Code",
               "type": "string"
             }
           }
@@ -7345,7 +9756,7 @@
           "content": {
             "application/json": {
               "schema": {
-                "$ref": "#/components/schemas/BridgeStatusPayload"
+                "$ref": "#/components/schemas/BulkReviewRequest"
               }
             }
           },
@@ -7356,7 +9767,7 @@
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/StatusResponse"
+                  "$ref": "#/components/schemas/BulkReviewResponse"
                 }
               }
             },
@@ -7373,29 +9784,54 @@
             "description": "Validation Error"
           }
         },
-        "summary": "Post Bridge Status",
+        "security": [
+          {
+            "OAuth2PasswordBearer": []
+          }
+        ],
+        "summary": "Bulk Review",
         "tags": [
-          "bridge"
+          "events"
         ]
       }
     },
-    "/api/events": {
+    "/api/events/{code}/collection": {
       "get": {
-        "operationId": "list_events_api_events_get",
+        "description": "Get pre-event collection scheduling settings.",
+        "operationId": "get_collection_settings_api_events__code__collection_get",
+        "parameters": [
+          {
+            "in": "path",
+            "name": "code",
+            "required": true,
+            "schema": {
+              "title": "Code",
+              "type": "string"
+            }
+          }
+        ],
         "responses": {
           "200": {
             "content": {
               "application/json": {
                 "schema": {
-                  "items": {
-                    "$ref": "#/components/schemas/EventOut"
-                  },
-                  "title": "Response List Events Api Events Get",
-                  "type": "array"
+                  "additionalProperties": true,
+                  "title": "Response Get Collection Settings Api Events  Code  Collection Get",
+                  "type": "object"
                 }
               }
             },
             "description": "Successful Response"
+          },
+          "422": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/HTTPValidationError"
+                }
+              }
+            },
+            "description": "Validation Error"
           }
         },
         "security": [
@@ -7403,29 +9839,43 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "List Events",
-        "tags": [
-          "events"
-        ]
-      },
-      "post": {
-        "operationId": "create_new_event_api_events_post",
+        "summary": "Get Collection Settings",
+        "tags": [
+          "events"
+        ]
+      },
+      "patch": {
+        "description": "Update pre-event collection scheduling settings.",
+        "operationId": "update_collection_settings_endpoint_api_events__code__collection_patch",
+        "parameters": [
+          {
+            "in": "path",
+            "name": "code",
+            "required": true,
+            "schema": {
+              "title": "Code",
+              "type": "string"
+            }
+          }
+        ],
         "requestBody": {
           "content": {
             "application/json": {
               "schema": {
-                "$ref": "#/components/schemas/EventCreate"
+                "$ref": "#/components/schemas/UpdateCollectionSettings"
               }
             }
           },
           "required": true
         },
         "responses": {
-          "201": {
+          "200": {
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/EventOut"
+                  "additionalProperties": true,
+                  "title": "Response Update Collection Settings Endpoint Api Events  Code  Collection Patch",
+                  "type": "object"
                 }
               }
             },
@@ -7447,43 +9897,24 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Create New Event",
+        "summary": "Update Collection Settings Endpoint",
         "tags": [
           "events"
         ]
       }
     },
-    "/api/events/activity": {
-      "get": {
-        "description": "Get recent activity log entries for the current user's events.",
-        "operationId": "get_activity_log_api_events_activity_get",
+    "/api/events/{code}/collection/sync-tidal": {
+      "post": {
+        "description": "Sync all non-rejected collection-phase requests to the DJ's Tidal playlist.\n\nIncludes pending (new) and accepted requests so the DJ can listen to guest\nsuggestions on Tidal before the review step.  Already-synced tracks are\nsilently skipped inside sync_requests_batch.",
+        "operationId": "sync_collection_to_tidal_api_events__code__collection_sync_tidal_post",
         "parameters": [
           {
-            "in": "query",
-            "name": "event_code",
-            "required": false,
-            "schema": {
-              "anyOf": [
-                {
-                  "type": "string"
-                },
-                {
-                  "type": "null"
-                }
-              ],
-              "title": "Event Code"
-            }
-          },
-          {
-            "in": "query",
-            "name": "limit",
-            "required": false,
+            "in": "path",
+            "name": "code",
+            "required": true,
             "schema": {
-              "default": 50,
-              "maximum": 200,
-              "minimum": 1,
-              "title": "Limit",
-              "type": "integer"
+              "title": "Code",
+              "type": "string"
             }
           }
         ],
@@ -7491,13 +9922,7 @@
           "200": {
             "content": {
               "application/json": {
-                "schema": {
-                  "items": {
-                    "$ref": "#/components/schemas/ActivityLogEntry"
-                  },
-                  "title": "Response Get Activity Log Api Events Activity Get",
-                  "type": "array"
-                }
+                "schema": {}
               }
             },
             "description": "Successful Response"
@@ -7518,30 +9943,47 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Get Activity Log",
+        "summary": "Sync Collection To Tidal",
         "tags": [
           "events"
         ]
       }
     },
-    "/api/events/archived": {
+    "/api/events/{code}/display-settings": {
       "get": {
-        "description": "List all archived and expired events for the current user.",
-        "operationId": "list_archived_events_api_events_archived_get",
+        "description": "Get current display settings for an event.",
+        "operationId": "get_display_settings_api_events__code__display_settings_get",
+        "parameters": [
+          {
+            "in": "path",
+            "name": "code",
+            "required": true,
+            "schema": {
+              "title": "Code",
+              "type": "string"
+            }
+          }
+        ],
         "responses": {
           "200": {
             "content": {
               "application/json": {
                 "schema": {
-                  "items": {
-                    "$ref": "#/components/schemas/EventOut"
-                  },
-                  "title": "Response List Archived Events Api Events Archived Get",
-                  "type": "array"
+                  "$ref": "#/components/schemas/DisplaySettingsResponse"
                 }
               }
             },
             "description": "Successful Response"
+          },
+          "422": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/HTTPValidationError"
+                }
+              }
+            },
+            "description": "Validation Error"
           }
         },
         "security": [
@@ -7549,21 +9991,30 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "List Archived Events",
+        "summary": "Get Display Settings",
         "tags": [
           "events"
         ]
-      }
-    },
-    "/api/events/bulk-delete": {
-      "post": {
-        "description": "Bulk delete multiple events owned by the current user.",
-        "operationId": "bulk_delete_events_endpoint_api_events_bulk_delete_post",
+      },
+      "patch": {
+        "description": "Update display settings for an event (e.g., hide/show now playing on kiosk).",
+        "operationId": "update_display_settings_api_events__code__display_settings_patch",
+        "parameters": [
+          {
+            "in": "path",
+            "name": "code",
+            "required": true,
+            "schema": {
+              "title": "Code",
+              "type": "string"
+            }
+          }
+        ],
         "requestBody": {
           "content": {
             "application/json": {
               "schema": {
-                "$ref": "#/components/schemas/BulkDeleteEventsRequest"
+                "$ref": "#/components/schemas/DisplaySettingsUpdate"
               }
             }
           },
@@ -7574,7 +10025,7 @@
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/BulkActionResponse"
+                  "$ref": "#/components/schemas/DisplaySettingsResponse"
                 }
               }
             },
@@ -7596,16 +10047,16 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Bulk Delete Events Endpoint",
+        "summary": "Update Display Settings",
         "tags": [
           "events"
         ]
       }
     },
-    "/api/events/{code}": {
-      "delete": {
-        "description": "Delete an event and all its requests.",
-        "operationId": "delete_event_endpoint_api_events__code__delete",
+    "/api/events/{code}/enrich-all": {
+      "post": {
+        "description": "Queue enrichment for up to ENRICH_ALL_BATCH_LIMIT requests missing BPM, key, or genre.\n\nBatched to avoid exhausting the connection pool when many tracks need enrichment.\nReturns `remaining` so the caller can re-invoke until 0.",
+        "operationId": "enrich_all_requests_api_events__code__enrich_all_post",
         "parameters": [
           {
             "in": "path",
@@ -7618,7 +10069,12 @@
           }
         ],
         "responses": {
-          "204": {
+          "200": {
+            "content": {
+              "application/json": {
+                "schema": {}
+              }
+            },
             "description": "Successful Response"
           },
           "422": {
@@ -7637,13 +10093,16 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Delete Event Endpoint",
+        "summary": "Enrich All Requests",
         "tags": [
           "events"
         ]
-      },
+      }
+    },
+    "/api/events/{code}/export/csv": {
       "get": {
-        "operationId": "get_event_api_events__code__get",
+        "description": "Export event requests as CSV. Owner can export regardless of event status.",
+        "operationId": "export_event_csv_api_events__code__export_csv_get",
         "parameters": [
           {
             "in": "path",
@@ -7659,9 +10118,7 @@
           "200": {
             "content": {
               "application/json": {
-                "schema": {
-                  "$ref": "#/components/schemas/EventOut"
-                }
+                "schema": {}
               }
             },
             "description": "Successful Response"
@@ -7682,13 +10139,16 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Get Event",
+        "summary": "Export Event Csv",
         "tags": [
           "events"
         ]
-      },
-      "patch": {
-        "operationId": "update_event_endpoint_api_events__code__patch",
+      }
+    },
+    "/api/events/{code}/export/play-history/csv": {
+      "get": {
+        "description": "Export play history as CSV. Owner can export regardless of event status.",
+        "operationId": "export_play_history_csv_api_events__code__export_play_history_csv_get",
         "parameters": [
           {
             "in": "path",
@@ -7700,22 +10160,58 @@
             }
           }
         ],
-        "requestBody": {
-          "content": {
-            "application/json": {
-              "schema": {
-                "$ref": "#/components/schemas/EventUpdate"
+        "responses": {
+          "200": {
+            "content": {
+              "application/json": {
+                "schema": {}
               }
-            }
+            },
+            "description": "Successful Response"
           },
-          "required": true
+          "422": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/HTTPValidationError"
+                }
+              }
+            },
+            "description": "Validation Error"
+          }
         },
+        "security": [
+          {
+            "OAuth2PasswordBearer": []
+          }
+        ],
+        "summary": "Export Play History Csv",
+        "tags": [
+          "events"
+        ]
+      }
+    },
+    "/api/events/{code}/pending-review": {
+      "get": {
+        "description": "Get pending review data source for DJ bulk-review.",
+        "operationId": "pending_review_api_events__code__pending_review_get",
+        "parameters": [
+          {
+            "in": "path",
+            "name": "code",
+            "required": true,
+            "schema": {
+              "title": "Code",
+              "type": "string"
+            }
+          }
+        ],
         "responses": {
           "200": {
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/EventOut"
+                  "$ref": "#/components/schemas/PendingReviewResponse"
                 }
               }
             },
@@ -7737,16 +10233,16 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Update Event Endpoint",
+        "summary": "Pending Review",
         "tags": [
           "events"
         ]
       }
     },
-    "/api/events/{code}/archive": {
-      "post": {
-        "description": "Archive an event.",
-        "operationId": "archive_event_endpoint_api_events__code__archive_post",
+    "/api/events/{code}/playlists": {
+      "get": {
+        "description": "List the DJ's playlists from connected music services.",
+        "operationId": "get_playlists_api_events__code__playlists_get",
         "parameters": [
           {
             "in": "path",
@@ -7762,9 +10258,7 @@
           "200": {
             "content": {
               "application/json": {
-                "schema": {
-                  "$ref": "#/components/schemas/EventOut"
-                }
+                "schema": {}
               }
             },
             "description": "Successful Response"
@@ -7785,16 +10279,16 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Archive Event Endpoint",
+        "summary": "Get Playlists",
         "tags": [
           "events"
         ]
       }
     },
-    "/api/events/{code}/banner": {
-      "delete": {
-        "description": "Delete the event's custom banner image.",
-        "operationId": "delete_banner_api_events__code__banner_delete",
+    "/api/events/{code}/recommendations": {
+      "post": {
+        "description": "Generate song recommendations based on the event's musical profile.",
+        "operationId": "get_recommendations_api_events__code__recommendations_post",
         "parameters": [
           {
             "in": "path",
@@ -7811,7 +10305,7 @@
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/EventOut"
+                  "$ref": "#/components/schemas/RecommendationResponse"
                 }
               }
             },
@@ -7833,14 +10327,16 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Delete Banner",
+        "summary": "Get Recommendations",
         "tags": [
           "events"
         ]
-      },
-      "post": {
-        "description": "Upload a custom banner image for the event.",
-        "operationId": "upload_banner_api_events__code__banner_post",
+      }
+    },
+    "/api/events/{code}/recommendations/from-template": {
+      "post": {
+        "description": "Generate recommendations using a template playlist.",
+        "operationId": "get_recommendations_from_template_api_events__code__recommendations_from_template_post",
         "parameters": [
           {
             "in": "path",
@@ -7854,9 +10350,9 @@
         ],
         "requestBody": {
           "content": {
-            "multipart/form-data": {
+            "application/json": {
               "schema": {
-                "$ref": "#/components/schemas/Body_upload_banner_api_events__code__banner_post"
+                "$ref": "#/components/schemas/TemplatePlaylistRequest"
               }
             }
           },
@@ -7867,7 +10363,7 @@
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/EventOut"
+                  "$ref": "#/components/schemas/RecommendationResponse"
                 }
               }
             },
@@ -7889,15 +10385,16 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Upload Banner",
+        "summary": "Get Recommendations From Template",
         "tags": [
           "events"
         ]
       }
     },
-    "/api/events/{code}/bulk-review": {
+    "/api/events/{code}/recommendations/llm": {
       "post": {
-        "operationId": "bulk_review_api_events__code__bulk_review_post",
+        "description": "Generate song recommendations from an LLM-interpreted DJ prompt.",
+        "operationId": "get_llm_recommendations_api_events__code__recommendations_llm_post",
         "parameters": [
           {
             "in": "path",
@@ -7913,7 +10410,7 @@
           "content": {
             "application/json": {
               "schema": {
-                "$ref": "#/components/schemas/BulkReviewRequest"
+                "$ref": "#/components/schemas/LLMPromptRequest"
               }
             }
           },
@@ -7923,9 +10420,7 @@
           "200": {
             "content": {
               "application/json": {
-                "schema": {
-                  "$ref": "#/components/schemas/BulkReviewResponse"
-                }
+                "schema": {}
               }
             },
             "description": "Successful Response"
@@ -7946,16 +10441,15 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Bulk Review",
+        "summary": "Get Llm Recommendations",
         "tags": [
           "events"
         ]
       }
     },
-    "/api/events/{code}/collection": {
+    "/api/events/{code}/requests": {
       "get": {
-        "description": "Get pre-event collection scheduling settings.",
-        "operationId": "get_collection_settings_api_events__code__collection_get",
+        "operationId": "get_event_requests_api_events__code__requests_get",
         "parameters": [
           {
             "in": "path",
@@ -7965,6 +10459,65 @@
               "title": "Code",
               "type": "string"
             }
+          },
+          {
+            "in": "query",
+            "name": "status",
+            "required": false,
+            "schema": {
+              "anyOf": [
+                {
+                  "$ref": "#/components/schemas/RequestStatus"
+                },
+                {
+                  "type": "null"
+                }
+              ],
+              "title": "Status"
+            }
+          },
+          {
+            "in": "query",
+            "name": "since",
+            "required": false,
+            "schema": {
+              "anyOf": [
+                {
+                  "format": "date-time",
+                  "type": "string"
+                },
+                {
+                  "type": "null"
+                }
+              ],
+              "title": "Since"
+            }
+          },
+          {
+            "in": "query",
+            "name": "limit",
+            "required": false,
+            "schema": {
+              "default": 100,
+              "maximum": 500,
+              "minimum": 1,
+              "title": "Limit",
+              "type": "integer"
+            }
+          },
+          {
+            "in": "query",
+            "name": "sort",
+            "required": false,
+            "schema": {
+              "default": "chronological",
+              "enum": [
+                "chronological",
+                "priority"
+              ],
+              "title": "Sort",
+              "type": "string"
+            }
           }
         ],
         "responses": {
@@ -7972,9 +10525,11 @@
             "content": {
               "application/json": {
                 "schema": {
-                  "additionalProperties": true,
-                  "title": "Response Get Collection Settings Api Events  Code  Collection Get",
-                  "type": "object"
+                  "items": {
+                    "$ref": "#/components/schemas/RequestOut"
+                  },
+                  "title": "Response Get Event Requests Api Events  Code  Requests Get",
+                  "type": "array"
                 }
               }
             },
@@ -7996,14 +10551,13 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Get Collection Settings",
+        "summary": "Get Event Requests",
         "tags": [
           "events"
         ]
       },
-      "patch": {
-        "description": "Update pre-event collection scheduling settings.",
-        "operationId": "update_collection_settings_endpoint_api_events__code__collection_patch",
+      "post": {
+        "operationId": "submit_request_api_events__code__requests_post",
         "parameters": [
           {
             "in": "path",
@@ -8019,7 +10573,7 @@
           "content": {
             "application/json": {
               "schema": {
-                "$ref": "#/components/schemas/UpdateCollectionSettings"
+                "$ref": "#/components/schemas/RequestCreate"
               }
             }
           },
@@ -8030,9 +10584,7 @@
             "content": {
               "application/json": {
                 "schema": {
-                  "additionalProperties": true,
-                  "title": "Response Update Collection Settings Endpoint Api Events  Code  Collection Patch",
-                  "type": "object"
+                  "$ref": "#/components/schemas/RequestOut"
                 }
               }
             },
@@ -8049,21 +10601,16 @@
             "description": "Validation Error"
           }
         },
-        "security": [
-          {
-            "OAuth2PasswordBearer": []
-          }
-        ],
-        "summary": "Update Collection Settings Endpoint",
+        "summary": "Submit Request",
         "tags": [
           "events"
         ]
       }
     },
-    "/api/events/{code}/collection/sync-tidal": {
+    "/api/events/{code}/requests/accept-all": {
       "post": {
-        "description": "Sync all non-rejected collection-phase requests to the DJ's Tidal playlist.\n\nIncludes pending (new) and accepted requests so the DJ can listen to guest\nsuggestions on Tidal before the review step.  Already-synced tracks are\nsilently skipped inside sync_requests_batch.",
-        "operationId": "sync_collection_to_tidal_api_events__code__collection_sync_tidal_post",
+        "description": "Accept all NEW requests for an event in one operation.",
+        "operationId": "accept_all_requests_endpoint_api_events__code__requests_accept_all_post",
         "parameters": [
           {
             "in": "path",
@@ -8079,7 +10626,9 @@
           "200": {
             "content": {
               "application/json": {
-                "schema": {}
+                "schema": {
+                  "$ref": "#/components/schemas/AcceptAllResponse"
+                }
               }
             },
             "description": "Successful Response"
@@ -8100,16 +10649,16 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Sync Collection To Tidal",
+        "summary": "Accept All Requests Endpoint",
         "tags": [
           "events"
         ]
       }
     },
-    "/api/events/{code}/display-settings": {
-      "get": {
-        "description": "Get current display settings for an event.",
-        "operationId": "get_display_settings_api_events__code__display_settings_get",
+    "/api/events/{code}/requests/bulk": {
+      "delete": {
+        "description": "Bulk delete requests for an event, optionally filtered by status.",
+        "operationId": "bulk_delete_requests_endpoint_api_events__code__requests_bulk_delete",
         "parameters": [
           {
             "in": "path",
@@ -8119,6 +10668,22 @@
               "title": "Code",
               "type": "string"
             }
+          },
+          {
+            "in": "query",
+            "name": "status",
+            "required": false,
+            "schema": {
+              "anyOf": [
+                {
+                  "type": "string"
+                },
+                {
+                  "type": "null"
+                }
+              ],
+              "title": "Status"
+            }
           }
         ],
         "responses": {
@@ -8126,7 +10691,7 @@
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/DisplaySettingsResponse"
+                  "$ref": "#/components/schemas/BulkActionResponse"
                 }
               }
             },
@@ -8148,14 +10713,16 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Get Display Settings",
+        "summary": "Bulk Delete Requests Endpoint",
         "tags": [
           "events"
         ]
-      },
-      "patch": {
-        "description": "Update display settings for an event (e.g., hide/show now playing on kiosk).",
-        "operationId": "update_display_settings_api_events__code__display_settings_patch",
+      }
+    },
+    "/api/events/{code}/requests/reject-all": {
+      "post": {
+        "description": "Reject all NEW requests for an event in one operation.",
+        "operationId": "reject_all_requests_endpoint_api_events__code__requests_reject_all_post",
         "parameters": [
           {
             "in": "path",
@@ -8167,22 +10734,12 @@
             }
           }
         ],
-        "requestBody": {
-          "content": {
-            "application/json": {
-              "schema": {
-                "$ref": "#/components/schemas/DisplaySettingsUpdate"
-              }
-            }
-          },
-          "required": true
-        },
         "responses": {
           "200": {
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/DisplaySettingsResponse"
+                  "$ref": "#/components/schemas/BulkActionResponse"
                 }
               }
             },
@@ -8204,16 +10761,16 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Update Display Settings",
+        "summary": "Reject All Requests Endpoint",
         "tags": [
           "events"
         ]
       }
     },
-    "/api/events/{code}/enrich-all": {
-      "post": {
-        "description": "Queue enrichment for up to ENRICH_ALL_BATCH_LIMIT requests missing BPM, key, or genre.\n\nBatched to avoid exhausting the connection pool when many tracks need enrichment.\nReturns `remaining` so the caller can re-invoke until 0.",
-        "operationId": "enrich_all_requests_api_events__code__enrich_all_post",
+    "/api/events/{code}/search": {
+      "get": {
+        "description": "Public search endpoint for event guests.\n\nPriority: Tidal (primary) \u2192 Spotify (fallback) \u2192 Beatport (event toggle).\nResults are filtered for junk, deduplicated by ISRC, and sorted by popularity.",
+        "operationId": "event_search_api_events__code__search_get",
         "parameters": [
           {
             "in": "path",
@@ -8223,13 +10780,30 @@
               "title": "Code",
               "type": "string"
             }
+          },
+          {
+            "in": "query",
+            "name": "q",
+            "required": true,
+            "schema": {
+              "maxLength": 200,
+              "minLength": 2,
+              "title": "Q",
+              "type": "string"
+            }
           }
         ],
         "responses": {
           "200": {
             "content": {
               "application/json": {
-                "schema": {}
+                "schema": {
+                  "items": {
+                    "$ref": "#/components/schemas/SearchResult"
+                  },
+                  "title": "Response Event Search Api Events  Code  Search Get",
+                  "type": "array"
+                }
               }
             },
             "description": "Successful Response"
@@ -8245,21 +10819,16 @@
             "description": "Validation Error"
           }
         },
-        "security": [
-          {
-            "OAuth2PasswordBearer": []
-          }
-        ],
-        "summary": "Enrich All Requests",
+        "summary": "Event Search",
         "tags": [
           "events"
         ]
       }
     },
-    "/api/events/{code}/export/csv": {
-      "get": {
-        "description": "Export event requests as CSV. Owner can export regardless of event status.",
-        "operationId": "export_event_csv_api_events__code__export_csv_get",
+    "/api/events/{code}/unarchive": {
+      "post": {
+        "description": "Unarchive an event.",
+        "operationId": "unarchive_event_endpoint_api_events__code__unarchive_post",
         "parameters": [
           {
             "in": "path",
@@ -8275,7 +10844,9 @@
           "200": {
             "content": {
               "application/json": {
-                "schema": {}
+                "schema": {
+                  "$ref": "#/components/schemas/EventOut"
+                }
               }
             },
             "description": "Successful Response"
@@ -8296,27 +10867,16 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Export Event Csv",
+        "summary": "Unarchive Event Endpoint",
         "tags": [
           "events"
         ]
       }
     },
-    "/api/events/{code}/export/play-history/csv": {
+    "/api/health": {
       "get": {
-        "description": "Export play history as CSV. Owner can export regardless of event status.",
-        "operationId": "export_play_history_csv_api_events__code__export_play_history_csv_get",
-        "parameters": [
-          {
-            "in": "path",
-            "name": "code",
-            "required": true,
-            "schema": {
-              "title": "Code",
-              "type": "string"
-            }
-          }
-        ],
+        "description": "Health check endpoint for monitoring and load balancers.",
+        "operationId": "api_health_check_api_health_get",
         "responses": {
           "200": {
             "content": {
@@ -8324,65 +10884,33 @@
                 "schema": {}
               }
             },
-            "description": "Successful Response"
-          },
-          "422": {
-            "content": {
-              "application/json": {
-                "schema": {
-                  "$ref": "#/components/schemas/HTTPValidationError"
-                }
-              }
-            },
-            "description": "Validation Error"
+            "description": "Successful Response"
           }
         },
-        "security": [
-          {
-            "OAuth2PasswordBearer": []
-          }
-        ],
-        "summary": "Export Play History Csv",
+        "summary": "Api Health Check",
         "tags": [
-          "events"
+          "health"
         ]
       }
     },
-    "/api/events/{code}/pending-review": {
+    "/api/kiosk/mine": {
       "get": {
-        "description": "Get pending review data source for DJ bulk-review.",
-        "operationId": "pending_review_api_events__code__pending_review_get",
-        "parameters": [
-          {
-            "in": "path",
-            "name": "code",
-            "required": true,
-            "schema": {
-              "title": "Code",
-              "type": "string"
-            }
-          }
-        ],
+        "description": "List all kiosks paired by the current user.",
+        "operationId": "list_my_kiosks_api_kiosk_mine_get",
         "responses": {
           "200": {
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/PendingReviewResponse"
+                  "items": {
+                    "$ref": "#/components/schemas/KioskOut"
+                  },
+                  "title": "Response List My Kiosks Api Kiosk Mine Get",
+                  "type": "array"
                 }
               }
             },
             "description": "Successful Response"
-          },
-          "422": {
-            "content": {
-              "application/json": {
-                "schema": {
-                  "$ref": "#/components/schemas/HTTPValidationError"
-                }
-              }
-            },
-            "description": "Validation Error"
           }
         },
         "security": [
@@ -8390,32 +10918,44 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Pending Review",
+        "summary": "List My Kiosks",
         "tags": [
-          "events"
+          "kiosk"
         ]
       }
     },
-    "/api/events/{code}/playlists": {
-      "get": {
-        "description": "List the DJ's playlists from connected music services.",
-        "operationId": "get_playlists_api_events__code__playlists_get",
+    "/api/kiosk/pair/{pair_code}/complete": {
+      "post": {
+        "description": "Complete a kiosk pairing by assigning an event.",
+        "operationId": "complete_kiosk_pairing_api_kiosk_pair__pair_code__complete_post",
         "parameters": [
           {
             "in": "path",
-            "name": "code",
+            "name": "pair_code",
             "required": true,
             "schema": {
-              "title": "Code",
+              "title": "Pair Code",
               "type": "string"
             }
           }
         ],
+        "requestBody": {
+          "content": {
+            "application/json": {
+              "schema": {
+                "$ref": "#/components/schemas/KioskCompletePairingRequest"
+              }
+            }
+          },
+          "required": true
+        },
         "responses": {
           "200": {
             "content": {
               "application/json": {
-                "schema": {}
+                "schema": {
+                  "$ref": "#/components/schemas/KioskOut"
+                }
               }
             },
             "description": "Successful Response"
@@ -8436,36 +10976,29 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Get Playlists",
+        "summary": "Complete Kiosk Pairing",
         "tags": [
-          "events"
+          "kiosk"
         ]
       }
     },
-    "/api/events/{code}/recommendations": {
-      "post": {
-        "description": "Generate song recommendations based on the event's musical profile.",
-        "operationId": "get_recommendations_api_events__code__recommendations_post",
+    "/api/kiosk/{kiosk_id}": {
+      "delete": {
+        "description": "Unpair and delete a kiosk.",
+        "operationId": "delete_kiosk_endpoint_api_kiosk__kiosk_id__delete",
         "parameters": [
           {
             "in": "path",
-            "name": "code",
+            "name": "kiosk_id",
             "required": true,
             "schema": {
-              "title": "Code",
-              "type": "string"
+              "title": "Kiosk Id",
+              "type": "integer"
             }
           }
         ],
         "responses": {
-          "200": {
-            "content": {
-              "application/json": {
-                "schema": {
-                  "$ref": "#/components/schemas/RecommendationResponse"
-                }
-              }
-            },
+          "204": {
             "description": "Successful Response"
           },
           "422": {
@@ -8484,24 +11017,22 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Get Recommendations",
+        "summary": "Delete Kiosk Endpoint",
         "tags": [
-          "events"
+          "kiosk"
         ]
-      }
-    },
-    "/api/events/{code}/recommendations/from-template": {
-      "post": {
-        "description": "Generate recommendations using a template playlist.",
-        "operationId": "get_recommendations_from_template_api_events__code__recommendations_from_template_post",
+      },
+      "patch": {
+        "description": "Rename a kiosk.",
+        "operationId": "rename_kiosk_endpoint_api_kiosk__kiosk_id__patch",
         "parameters": [
           {
             "in": "path",
-            "name": "code",
+            "name": "kiosk_id",
             "required": true,
             "schema": {
-              "title": "Code",
-              "type": "string"
+              "title": "Kiosk Id",
+              "type": "integer"
             }
           }
         ],
@@ -8509,7 +11040,7 @@
           "content": {
             "application/json": {
               "schema": {
-                "$ref": "#/components/schemas/TemplatePlaylistRequest"
+                "$ref": "#/components/schemas/KioskRenameRequest"
               }
             }
           },
@@ -8520,7 +11051,7 @@
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/RecommendationResponse"
+                  "$ref": "#/components/schemas/KioskOut"
                 }
               }
             },
@@ -8542,24 +11073,24 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Get Recommendations From Template",
+        "summary": "Rename Kiosk Endpoint",
         "tags": [
-          "events"
+          "kiosk"
         ]
       }
     },
-    "/api/events/{code}/recommendations/llm": {
-      "post": {
-        "description": "Generate song recommendations from an LLM-interpreted DJ prompt.",
-        "operationId": "get_llm_recommendations_api_events__code__recommendations_llm_post",
+    "/api/kiosk/{kiosk_id}/assign": {
+      "patch": {
+        "description": "Change which event a kiosk displays.",
+        "operationId": "assign_kiosk_api_kiosk__kiosk_id__assign_patch",
         "parameters": [
           {
             "in": "path",
-            "name": "code",
+            "name": "kiosk_id",
             "required": true,
             "schema": {
-              "title": "Code",
-              "type": "string"
+              "title": "Kiosk Id",
+              "type": "integer"
             }
           }
         ],
@@ -8567,7 +11098,7 @@
           "content": {
             "application/json": {
               "schema": {
-                "$ref": "#/components/schemas/LLMPromptRequest"
+                "$ref": "#/components/schemas/KioskAssignRequest"
               }
             }
           },
@@ -8577,7 +11108,9 @@
           "200": {
             "content": {
               "application/json": {
-                "schema": {}
+                "schema": {
+                  "$ref": "#/components/schemas/KioskOut"
+                }
               }
             },
             "description": "Successful Response"
@@ -8598,98 +11131,102 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Get Llm Recommendations",
+        "summary": "Assign Kiosk",
         "tags": [
-          "events"
+          "kiosk"
         ]
       }
     },
-    "/api/events/{code}/requests": {
+    "/api/llm/connectors": {
       "get": {
-        "operationId": "get_event_requests_api_events__code__requests_get",
-        "parameters": [
-          {
-            "in": "path",
-            "name": "code",
-            "required": true,
-            "schema": {
-              "title": "Code",
-              "type": "string"
-            }
-          },
-          {
-            "in": "query",
-            "name": "status",
-            "required": false,
-            "schema": {
-              "anyOf": [
-                {
-                  "$ref": "#/components/schemas/RequestStatus"
-                },
-                {
-                  "type": "null"
-                }
-              ],
-              "title": "Status"
-            }
-          },
-          {
-            "in": "query",
-            "name": "since",
-            "required": false,
-            "schema": {
-              "anyOf": [
-                {
-                  "format": "date-time",
-                  "type": "string"
-                },
-                {
-                  "type": "null"
+        "operationId": "list_connectors_api_llm_connectors_get",
+        "responses": {
+          "200": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "items": {
+                    "$ref": "#/components/schemas/ConnectorOut"
+                  },
+                  "title": "Response List Connectors Api Llm Connectors Get",
+                  "type": "array"
                 }
-              ],
-              "title": "Since"
-            }
-          },
-          {
-            "in": "query",
-            "name": "limit",
-            "required": false,
-            "schema": {
-              "default": 100,
-              "maximum": 500,
-              "minimum": 1,
-              "title": "Limit",
-              "type": "integer"
-            }
-          },
+              }
+            },
+            "description": "Successful Response"
+          }
+        },
+        "security": [
           {
-            "in": "query",
-            "name": "sort",
-            "required": false,
-            "schema": {
-              "default": "chronological",
-              "enum": [
-                "chronological",
-                "priority"
-              ],
-              "title": "Sort",
-              "type": "string"
-            }
+            "OAuth2PasswordBearer": []
           }
         ],
+        "summary": "List Connectors",
+        "tags": [
+          "llm"
+        ]
+      },
+      "post": {
+        "operationId": "create_connector_endpoint_api_llm_connectors_post",
+        "requestBody": {
+          "content": {
+            "application/json": {
+              "schema": {
+                "$ref": "#/components/schemas/ConnectorCreate"
+              }
+            }
+          },
+          "required": true
+        },
         "responses": {
-          "200": {
+          "201": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/ConnectorOut"
+                }
+              }
+            },
+            "description": "Successful Response"
+          },
+          "422": {
             "content": {
               "application/json": {
                 "schema": {
-                  "items": {
-                    "$ref": "#/components/schemas/RequestOut"
-                  },
-                  "title": "Response Get Event Requests Api Events  Code  Requests Get",
-                  "type": "array"
+                  "$ref": "#/components/schemas/HTTPValidationError"
                 }
               }
             },
+            "description": "Validation Error"
+          }
+        },
+        "security": [
+          {
+            "OAuth2PasswordBearer": []
+          }
+        ],
+        "summary": "Create Connector Endpoint",
+        "tags": [
+          "llm"
+        ]
+      }
+    },
+    "/api/llm/connectors/{connector_id}": {
+      "delete": {
+        "operationId": "delete_connector_endpoint_api_llm_connectors__connector_id__delete",
+        "parameters": [
+          {
+            "in": "path",
+            "name": "connector_id",
+            "required": true,
+            "schema": {
+              "title": "Connector Id",
+              "type": "integer"
+            }
+          }
+        ],
+        "responses": {
+          "204": {
             "description": "Successful Response"
           },
           "422": {
@@ -8708,21 +11245,21 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Get Event Requests",
+        "summary": "Delete Connector Endpoint",
         "tags": [
-          "events"
+          "llm"
         ]
       },
-      "post": {
-        "operationId": "submit_request_api_events__code__requests_post",
+      "patch": {
+        "operationId": "update_connector_metadata_api_llm_connectors__connector_id__patch",
         "parameters": [
           {
             "in": "path",
-            "name": "code",
+            "name": "connector_id",
             "required": true,
             "schema": {
-              "title": "Code",
-              "type": "string"
+              "title": "Connector Id",
+              "type": "integer"
             }
           }
         ],
@@ -8730,7 +11267,7 @@
           "content": {
             "application/json": {
               "schema": {
-                "$ref": "#/components/schemas/RequestCreate"
+                "$ref": "#/components/schemas/ConnectorPatch"
               }
             }
           },
@@ -8741,7 +11278,7 @@
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/RequestOut"
+                  "$ref": "#/components/schemas/ConnectorOut"
                 }
               }
             },
@@ -8758,33 +11295,47 @@
             "description": "Validation Error"
           }
         },
-        "summary": "Submit Request",
+        "security": [
+          {
+            "OAuth2PasswordBearer": []
+          }
+        ],
+        "summary": "Update Connector Metadata",
         "tags": [
-          "events"
+          "llm"
         ]
       }
     },
-    "/api/events/{code}/requests/accept-all": {
-      "post": {
-        "description": "Accept all NEW requests for an event in one operation.",
-        "operationId": "accept_all_requests_endpoint_api_events__code__requests_accept_all_post",
+    "/api/llm/connectors/{connector_id}/credentials": {
+      "put": {
+        "operationId": "rotate_connector_credentials_api_llm_connectors__connector_id__credentials_put",
         "parameters": [
           {
             "in": "path",
-            "name": "code",
+            "name": "connector_id",
             "required": true,
             "schema": {
-              "title": "Code",
-              "type": "string"
+              "title": "Connector Id",
+              "type": "integer"
             }
           }
         ],
+        "requestBody": {
+          "content": {
+            "application/json": {
+              "schema": {
+                "$ref": "#/components/schemas/ConnectorCredentialsRotate"
+              }
+            }
+          },
+          "required": true
+        },
         "responses": {
           "200": {
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/AcceptAllResponse"
+                  "$ref": "#/components/schemas/ConnectorOut"
                 }
               }
             },
@@ -8806,40 +11357,24 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Accept All Requests Endpoint",
+        "summary": "Rotate Connector Credentials",
         "tags": [
-          "events"
+          "llm"
         ]
       }
     },
-    "/api/events/{code}/requests/bulk": {
+    "/api/llm/connectors/{connector_id}/default": {
       "delete": {
-        "description": "Bulk delete requests for an event, optionally filtered by status.",
-        "operationId": "bulk_delete_requests_endpoint_api_events__code__requests_bulk_delete",
+        "description": "Clear the explicit default \u2014 gateway resolution falls back to MRU.",
+        "operationId": "unset_connector_as_default_api_llm_connectors__connector_id__default_delete",
         "parameters": [
           {
             "in": "path",
-            "name": "code",
+            "name": "connector_id",
             "required": true,
             "schema": {
-              "title": "Code",
-              "type": "string"
-            }
-          },
-          {
-            "in": "query",
-            "name": "status",
-            "required": false,
-            "schema": {
-              "anyOf": [
-                {
-                  "type": "string"
-                },
-                {
-                  "type": "null"
-                }
-              ],
-              "title": "Status"
+              "title": "Connector Id",
+              "type": "integer"
             }
           }
         ],
@@ -8848,12 +11383,15 @@
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/BulkActionResponse"
+                  "$ref": "#/components/schemas/ConnectorOut"
                 }
               }
             },
             "description": "Successful Response"
           },
+          "404": {
+            "description": "Connector not found for current user."
+          },
           "422": {
             "content": {
               "application/json": {
@@ -8870,24 +11408,22 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Bulk Delete Requests Endpoint",
+        "summary": "Unset Connector As Default",
         "tags": [
-          "events"
+          "llm"
         ]
-      }
-    },
-    "/api/events/{code}/requests/reject-all": {
+      },
       "post": {
-        "description": "Reject all NEW requests for an event in one operation.",
-        "operationId": "reject_all_requests_endpoint_api_events__code__requests_reject_all_post",
+        "description": "Pin this connector as the DJ's explicit default (issue #336).\n\nAtomically clears any other defaults the DJ owns before flipping this row,\nso the partial unique index never sees two True rows for the same user.\n\nSetting a disabled / auth_invalid connector as default is rejected with 400\nso DJs don't silently break their own routing \u2014 a default that the gateway\nwould skip anyway is a footgun.",
+        "operationId": "set_connector_as_default_api_llm_connectors__connector_id__default_post",
         "parameters": [
           {
             "in": "path",
-            "name": "code",
+            "name": "connector_id",
             "required": true,
             "schema": {
-              "title": "Code",
-              "type": "string"
+              "title": "Connector Id",
+              "type": "integer"
             }
           }
         ],
@@ -8896,12 +11432,18 @@
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/BulkActionResponse"
+                  "$ref": "#/components/schemas/ConnectorOut"
                 }
               }
             },
             "description": "Successful Response"
           },
+          "400": {
+            "description": "Connector cannot be set as default (e.g. disabled or auth_invalid)."
+          },
+          "404": {
+            "description": "Connector not found for current user."
+          },
           "422": {
             "content": {
               "application/json": {
@@ -8918,35 +11460,24 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Reject All Requests Endpoint",
+        "summary": "Set Connector As Default",
         "tags": [
-          "events"
+          "llm"
         ]
       }
     },
-    "/api/events/{code}/search": {
-      "get": {
-        "description": "Public search endpoint for event guests.\n\nPriority: Tidal (primary) \u2192 Spotify (fallback) \u2192 Beatport (event toggle).\nResults are filtered for junk, deduplicated by ISRC, and sorted by popularity.",
-        "operationId": "event_search_api_events__code__search_get",
+    "/api/llm/connectors/{connector_id}/stream-test": {
+      "post": {
+        "description": "Stream a short sentence through the connector as ``text/event-stream``.\n\nValidates ownership up front (404 for connectors the DJ doesn't own \u2014 never\nleaks existence). Each SSE ``data:`` frame is a JSON ``ChatResponseChunk``.\nOn a typed gateway error an ``event: error`` frame is emitted carrying only a\nsanitised code (never the upstream payload), then the stream ends. Client\ndisconnect cancels the upstream provider request \u2014 the gateway generator's\n``finally`` writes the counts-only call log and closes the adapter.\n\nUnlike the public guest SSE stream (``api/sse.py``), this endpoint is\nauthenticated, rate-limited (10/min), and strictly bounded (max 64 output\ntokens), so it holds the request-scoped DB session for the brief stream\nlifetime rather than opening a detached ``SessionLocal`` \u2014 the pool-pinning\nconcern that drove ``api/sse.py``'s pattern applies to unauthenticated,\nindefinitely-open guest connections, not a short admin health probe.",
+        "operationId": "stream_test_connector_api_llm_connectors__connector_id__stream_test_post",
         "parameters": [
           {
             "in": "path",
-            "name": "code",
-            "required": true,
-            "schema": {
-              "title": "Code",
-              "type": "string"
-            }
-          },
-          {
-            "in": "query",
-            "name": "q",
+            "name": "connector_id",
             "required": true,
             "schema": {
-              "maxLength": 200,
-              "minLength": 2,
-              "title": "Q",
-              "type": "string"
+              "title": "Connector Id",
+              "type": "integer"
             }
           }
         ],
@@ -8954,13 +11485,7 @@
           "200": {
             "content": {
               "application/json": {
-                "schema": {
-                  "items": {
-                    "$ref": "#/components/schemas/SearchResult"
-                  },
-                  "title": "Response Event Search Api Events  Code  Search Get",
-                  "type": "array"
-                }
+                "schema": {}
               }
             },
             "description": "Successful Response"
@@ -8976,24 +11501,29 @@
             "description": "Validation Error"
           }
         },
-        "summary": "Event Search",
+        "security": [
+          {
+            "OAuth2PasswordBearer": []
+          }
+        ],
+        "summary": "Stream Test Connector",
         "tags": [
-          "events"
+          "llm"
         ]
       }
     },
-    "/api/events/{code}/unarchive": {
+    "/api/llm/connectors/{connector_id}/test": {
       "post": {
-        "description": "Unarchive an event.",
-        "operationId": "unarchive_event_endpoint_api_events__code__unarchive_post",
+        "description": "Run a health check and return a sanitised result.\n\nBehaviour identical to the background monitor (issue #340), so the\n``last_health_check_at`` / ``last_health_check_status`` columns and audit\nrows are written the same way on every invocation regardless of trigger\nsource. See ``services/llm/health_check.py`` for the shared helper.",
+        "operationId": "test_connector_api_llm_connectors__connector_id__test_post",
         "parameters": [
           {
             "in": "path",
-            "name": "code",
+            "name": "connector_id",
             "required": true,
             "schema": {
-              "title": "Code",
-              "type": "string"
+              "title": "Connector Id",
+              "type": "integer"
             }
           }
         ],
@@ -9002,7 +11532,7 @@
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/EventOut"
+                  "$ref": "#/components/schemas/ConnectorTestResult"
                 }
               }
             },
@@ -9024,46 +11554,22 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Unarchive Event Endpoint",
-        "tags": [
-          "events"
-        ]
-      }
-    },
-    "/api/health": {
-      "get": {
-        "description": "Health check endpoint for monitoring and load balancers.",
-        "operationId": "api_health_check_api_health_get",
-        "responses": {
-          "200": {
-            "content": {
-              "application/json": {
-                "schema": {}
-              }
-            },
-            "description": "Successful Response"
-          }
-        },
-        "summary": "Api Health Check",
+        "summary": "Test Connector",
         "tags": [
-          "health"
+          "llm"
         ]
       }
     },
-    "/api/kiosk/mine": {
+    "/api/llm/feature-preferences": {
       "get": {
-        "description": "List all kiosks paired by the current user.",
-        "operationId": "list_my_kiosks_api_kiosk_mine_get",
+        "description": "List the DJ's per-feature connector pins (issue #337).",
+        "operationId": "list_feature_preferences_api_llm_feature_preferences_get",
         "responses": {
           "200": {
             "content": {
               "application/json": {
                 "schema": {
-                  "items": {
-                    "$ref": "#/components/schemas/KioskOut"
-                  },
-                  "title": "Response List My Kiosks Api Kiosk Mine Get",
-                  "type": "array"
+                  "$ref": "#/components/schemas/FeaturePreferencesListOut"
                 }
               }
             },
@@ -9075,32 +11581,19 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "List My Kiosks",
+        "summary": "List Feature Preferences",
         "tags": [
-          "kiosk"
+          "llm"
         ]
-      }
-    },
-    "/api/kiosk/pair/{pair_code}/complete": {
+      },
       "post": {
-        "description": "Complete a kiosk pairing by assigning an event.",
-        "operationId": "complete_kiosk_pairing_api_kiosk_pair__pair_code__complete_post",
-        "parameters": [
-          {
-            "in": "path",
-            "name": "pair_code",
-            "required": true,
-            "schema": {
-              "title": "Pair Code",
-              "type": "string"
-            }
-          }
-        ],
+        "description": "Pin (or re-pin) a connector to a feature for the current DJ.\n\nValidates connector ownership server-side (404 for IDs the DJ doesn't own,\nso another DJ's connector existence is never leaked) and rejects pinning a\nnon-active connector (400) \u2014 the gateway would skip it anyway, so silently\naccepting it is a footgun.",
+        "operationId": "set_feature_preference_endpoint_api_llm_feature_preferences_post",
         "requestBody": {
           "content": {
             "application/json": {
               "schema": {
-                "$ref": "#/components/schemas/KioskCompletePairingRequest"
+                "$ref": "#/components/schemas/FeaturePreferenceSet"
               }
             }
           },
@@ -9111,52 +11604,17 @@
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/KioskOut"
+                  "$ref": "#/components/schemas/FeaturePreferencesListOut"
                 }
               }
             },
             "description": "Successful Response"
           },
-          "422": {
-            "content": {
-              "application/json": {
-                "schema": {
-                  "$ref": "#/components/schemas/HTTPValidationError"
-                }
-              }
-            },
-            "description": "Validation Error"
-          }
-        },
-        "security": [
-          {
-            "OAuth2PasswordBearer": []
-          }
-        ],
-        "summary": "Complete Kiosk Pairing",
-        "tags": [
-          "kiosk"
-        ]
-      }
-    },
-    "/api/kiosk/{kiosk_id}": {
-      "delete": {
-        "description": "Unpair and delete a kiosk.",
-        "operationId": "delete_kiosk_endpoint_api_kiosk__kiosk_id__delete",
-        "parameters": [
-          {
-            "in": "path",
-            "name": "kiosk_id",
-            "required": true,
-            "schema": {
-              "title": "Kiosk Id",
-              "type": "integer"
-            }
-          }
-        ],
-        "responses": {
-          "204": {
-            "description": "Successful Response"
+          "400": {
+            "description": "Connector is not active and cannot be pinned."
+          },
+          "404": {
+            "description": "Connector not found for current user."
           },
           "422": {
             "content": {
@@ -9174,41 +11632,37 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Delete Kiosk Endpoint",
+        "summary": "Set Feature Preference Endpoint",
         "tags": [
-          "kiosk"
+          "llm"
         ]
-      },
-      "patch": {
-        "description": "Rename a kiosk.",
-        "operationId": "rename_kiosk_endpoint_api_kiosk__kiosk_id__patch",
+      }
+    },
+    "/api/llm/feature-preferences/{feature}": {
+      "delete": {
+        "description": "Clear the DJ's pin for ``feature`` (no-op if unset). Returns the new list.",
+        "operationId": "clear_feature_preference_endpoint_api_llm_feature_preferences__feature__delete",
         "parameters": [
           {
             "in": "path",
-            "name": "kiosk_id",
+            "name": "feature",
             "required": true,
             "schema": {
-              "title": "Kiosk Id",
-              "type": "integer"
+              "enum": [
+                "recommendation",
+                "set_builder"
+              ],
+              "title": "Feature",
+              "type": "string"
             }
           }
         ],
-        "requestBody": {
-          "content": {
-            "application/json": {
-              "schema": {
-                "$ref": "#/components/schemas/KioskRenameRequest"
-              }
-            }
-          },
-          "required": true
-        },
         "responses": {
           "200": {
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/KioskOut"
+                  "$ref": "#/components/schemas/FeaturePreferencesListOut"
                 }
               }
             },
@@ -9230,57 +11684,59 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Rename Kiosk Endpoint",
+        "summary": "Clear Feature Preference Endpoint",
         "tags": [
-          "kiosk"
+          "llm"
         ]
       }
     },
-    "/api/kiosk/{kiosk_id}/assign": {
-      "patch": {
-        "description": "Change which event a kiosk displays.",
-        "operationId": "assign_kiosk_api_kiosk__kiosk_id__assign_patch",
-        "parameters": [
-          {
-            "in": "path",
-            "name": "kiosk_id",
-            "required": true,
-            "schema": {
-              "title": "Kiosk Id",
-              "type": "integer"
-            }
-          }
-        ],
-        "requestBody": {
-          "content": {
-            "application/json": {
-              "schema": {
-                "$ref": "#/components/schemas/KioskAssignRequest"
-              }
-            }
-          },
-          "required": true
-        },
+    "/api/llm/openrouter/models": {
+      "get": {
+        "description": "Return the OpenRouter model catalogue for the model-hint dropdown.\n\nServed from a process-wide TTL cache (refreshed hourly). The OpenRouter\n``/models`` endpoint is public, so no connector credentials are required.\nReturns an empty list if the catalogue is unavailable \u2014 the frontend then\nfalls back to a free-text model input.",
+        "operationId": "list_openrouter_models_api_llm_openrouter_models_get",
         "responses": {
           "200": {
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/KioskOut"
+                  "$ref": "#/components/schemas/AIModelsResponse"
                 }
               }
             },
             "description": "Successful Response"
-          },
-          "422": {
+          }
+        },
+        "security": [
+          {
+            "OAuth2PasswordBearer": []
+          }
+        ],
+        "summary": "List Openrouter Models",
+        "tags": [
+          "llm"
+        ]
+      }
+    },
+    "/api/llm/policy": {
+      "get": {
+        "description": "DJ-readable connector policy (non-sensitive subset).\n\nThe settings/ai page consumes this to fail *closed* \u2014 hiding connector\ntypes the admin has disabled rather than showing every provider and only\ndiscovering the block when the create call returns 403. Admin-only fields\n(e.g. ``llm_default_connector_id``) are intentionally excluded.",
+        "operationId": "get_dj_policy_api_llm_policy_get",
+        "responses": {
+          "200": {
             "content": {
               "application/json": {
                 "schema": {
-                  "$ref": "#/components/schemas/HTTPValidationError"
+                  "$ref": "#/components/schemas/DjPolicyOut"
                 }
               }
             },
-            "description": "Validation Error"
+            "description": "Successful Response"
+          },
+          "401": {
+            "description": "Not authenticated (missing or invalid bearer token)."
+          },
+          "403": {
+            "description": "Authenticated but not an active DJ (e.g. pending approval)."
           }
         },
         "security": [
@@ -9288,9 +11744,9 @@
             "OAuth2PasswordBearer": []
           }
         ],
-        "summary": "Assign Kiosk",
+        "summary": "Get Dj Policy",
         "tags": [
-          "kiosk"
+          "llm"
         ]
       }
     },
@@ -10292,7 +12748,7 @@
     },
     "/api/public/events/{code}/stream": {
       "get": {
-        "description": "Public SSE endpoint for real-time event updates.\n\nSECURITY (CRIT-5): rate-limited and existence-checked. Before this fix,\nthe endpoint had no rate limit and no existence check, allowing\nunauthenticated DoS (unlimited long-lived connections exhausting FDs)\nand passive eavesdropping via 6-char event-code brute force.\n\nEvent types:\n- request_created: New request submitted\n- request_status_changed: Request status update\n- now_playing_changed: Now-playing track update\n- requests_bulk_update: Batch accept/reject\n- bridge_status_changed: Bridge connect/disconnect",
+        "description": "Public SSE endpoint for real-time event updates.\n\nSECURITY (CRIT-5): rate-limited and existence-checked. Before this fix,\nthe endpoint had no rate limit and no existence check, allowing\nunauthenticated DoS (unlimited long-lived connections exhausting FDs)\nand passive eavesdropping via 6-char event-code brute force.\n\nPOOL SAFETY (issue #356): the one-shot existence/auth check runs inside a\nshort-lived ``with SessionLocal()`` block whose pooled connection is\nreturned BEFORE the EventSourceResponse is returned. An EventSource\nconnection can stay open indefinitely, so we must NOT hold a\nrequest-scoped ``get_db`` session across the stream lifetime \u2014 doing so\npinned one pooled connection per open stream and exhausted the QueuePool\n(size 5 + overflow 10 = 15 connections) under modest guest load.\n\nEvent types:\n- request_created: New request submitted\n- request_status_changed: Request status update\n- now_playing_changed: Now-playing track update\n- requests_bulk_update: Batch accept/reject\n- bridge_status_changed: Bridge connect/disconnect",
         "operationId": "event_stream_api_public_events__code__stream_get",
         "parameters": [
           {
@@ -10941,6 +13397,225 @@
         ]
       }
     },
+    "/api/setbuilder/sets": {
+      "get": {
+        "description": "List the current DJ's sets, newest first.",
+        "operationId": "list_sets_api_setbuilder_sets_get",
+        "responses": {
+          "200": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "items": {
+                    "$ref": "#/components/schemas/SetSummary"
+                  },
+                  "title": "Response List Sets Api Setbuilder Sets Get",
+                  "type": "array"
+                }
+              }
+            },
+            "description": "Successful Response"
+          }
+        },
+        "security": [
+          {
+            "OAuth2PasswordBearer": []
+          }
+        ],
+        "summary": "List Sets",
+        "tags": [
+          "setbuilder"
+        ]
+      },
+      "post": {
+        "description": "Create a new empty set owned by the current DJ.",
+        "operationId": "create_set_api_setbuilder_sets_post",
+        "requestBody": {
+          "content": {
+            "application/json": {
+              "schema": {
+                "$ref": "#/components/schemas/SetCreate"
+              }
+            }
+          },
+          "required": true
+        },
+        "responses": {
+          "201": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/SetDetail"
+                }
+              }
+            },
+            "description": "Successful Response"
+          },
+          "422": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/HTTPValidationError"
+                }
+              }
+            },
+            "description": "Validation Error"
+          }
+        },
+        "security": [
+          {
+            "OAuth2PasswordBearer": []
+          }
+        ],
+        "summary": "Create Set",
+        "tags": [
+          "setbuilder"
+        ]
+      }
+    },
+    "/api/setbuilder/sets/{set_id}": {
+      "delete": {
+        "description": "Delete one of the current DJ's sets, or 404.",
+        "operationId": "delete_set_api_setbuilder_sets__set_id__delete",
+        "parameters": [
+          {
+            "in": "path",
+            "name": "set_id",
+            "required": true,
+            "schema": {
+              "title": "Set Id",
+              "type": "integer"
+            }
+          }
+        ],
+        "responses": {
+          "204": {
+            "description": "Successful Response"
+          },
+          "422": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/HTTPValidationError"
+                }
+              }
+            },
+            "description": "Validation Error"
+          }
+        },
+        "security": [
+          {
+            "OAuth2PasswordBearer": []
+          }
+        ],
+        "summary": "Delete Set",
+        "tags": [
+          "setbuilder"
+        ]
+      },
+      "get": {
+        "description": "Get one of the current DJ's sets, or 404.",
+        "operationId": "get_set_api_setbuilder_sets__set_id__get",
+        "parameters": [
+          {
+            "in": "path",
+            "name": "set_id",
+            "required": true,
+            "schema": {
+              "title": "Set Id",
+              "type": "integer"
+            }
+          }
+        ],
+        "responses": {
+          "200": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/SetDetail"
+                }
+              }
+            },
+            "description": "Successful Response"
+          },
+          "422": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/HTTPValidationError"
+                }
+              }
+            },
+            "description": "Validation Error"
+          }
+        },
+        "security": [
+          {
+            "OAuth2PasswordBearer": []
+          }
+        ],
+        "summary": "Get Set",
+        "tags": [
+          "setbuilder"
+        ]
+      },
+      "patch": {
+        "description": "Rename one of the current DJ's sets, or 404.",
+        "operationId": "rename_set_api_setbuilder_sets__set_id__patch",
+        "parameters": [
+          {
+            "in": "path",
+            "name": "set_id",
+            "required": true,
+            "schema": {
+              "title": "Set Id",
+              "type": "integer"
+            }
+          }
+        ],
+        "requestBody": {
+          "content": {
+            "application/json": {
+              "schema": {
+                "$ref": "#/components/schemas/SetRename"
+              }
+            }
+          },
+          "required": true
+        },
+        "responses": {
+          "200": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/SetDetail"
+                }
+              }
+            },
+            "description": "Successful Response"
+          },
+          "422": {
+            "content": {
+              "application/json": {
+                "schema": {
+                  "$ref": "#/components/schemas/HTTPValidationError"
+                }
+              }
+            },
+            "description": "Validation Error"
+          }
+        },
+        "security": [
+          {
+            "OAuth2PasswordBearer": []
+          }
+        ],
+        "summary": "Rename Set",
+        "tags": [
+          "setbuilder"
+        ]
+      }
+    },
     "/api/tidal/auth/cancel": {
       "post": {
         "description": "Cancel pending device login.",
diff --git a/server/scripts/export_openapi.py b/server/scripts/export_openapi.py
index 7c06c88e..a8e3b994 100644
--- a/server/scripts/export_openapi.py
+++ b/server/scripts/export_openapi.py
@@ -84,6 +84,10 @@ def _promote_response_fields_to_required(spec: dict[str, Any]) -> None:
 
 def export() -> Path:
     output = Path(__file__).resolve().parent.parent / "openapi.json"
+    # Force fresh generation — FastAPI caches the schema on `app.openapi_schema`,
+    # which can hide newly-added routes when this script is invoked from a
+    # long-running process.
+    app.openapi_schema = None
     spec = app.openapi()
     _promote_response_fields_to_required(spec)
     output.write_text(json.dumps(spec, indent=2, sort_keys=True) + "\n")
diff --git a/server/tests/conftest.py b/server/tests/conftest.py
index e65d91de..1a569250 100644
--- a/server/tests/conftest.py
+++ b/server/tests/conftest.py
@@ -9,6 +9,7 @@
 from sqlalchemy.orm import Session, sessionmaker
 from sqlalchemy.pool import StaticPool
 
+from app.api import sse as _sse_module
 from app.api.deps import get_db
 from app.core.time import utcnow
 from app.main import app
@@ -29,6 +30,16 @@
 )
 TestingSessionLocal = sessionmaker(autocommit=False, autoflush=False, bind=engine)
 
+# The SSE endpoint (``app.api.sse``) opens its own short-lived
+# ``with SessionLocal() as db:`` block for the existence check, bypassing the
+# FastAPI ``get_db`` dependency that other endpoints use. The
+# ``app.dependency_overrides[get_db]`` swap below never reaches it, so the SSE
+# handler would hit the real ``DATABASE_URL`` (Postgres in CI) instead of the
+# in-memory SQLite test DB and fail with "relation does not exist". Swap only
+# the SSE module's ``SessionLocal`` reference — scoped so we don't disturb
+# other modules that also import the production ``SessionLocal``.
+_sse_module.SessionLocal = TestingSessionLocal
+
 
 @pytest.fixture(scope="function")
 def db() -> Generator[Session, None, None]:
diff --git a/server/tests/test_export.py b/server/tests/test_export.py
index 6ec794ee..c8fafa24 100644
--- a/server/tests/test_export.py
+++ b/server/tests/test_export.py
@@ -320,6 +320,16 @@ def test_sanitizes_carriage_return(self):
         result = sanitize_csv_value("\rmalicious")
         assert result.startswith("'")
 
+    def test_sanitizes_line_feed(self):
+        """Leading LF is escaped — importers may strip it then evaluate the formula."""
+        result = sanitize_csv_value("\n=cmd|' /C calc'!A0")
+        assert result.startswith("'")
+
+    def test_sanitizes_leading_space(self):
+        """Leading space is escaped — importers trim it then evaluate the formula."""
+        result = sanitize_csv_value(" =cmd|' /C calc'!A0")
+        assert result.startswith("'")
+
     def test_preserves_normal_values(self):
         """Test that normal values are not modified."""
         assert sanitize_csv_value("Normal Song Title") == "Normal Song Title"
diff --git a/server/tests/test_llm_adapter_contract.py b/server/tests/test_llm_adapter_contract.py
new file mode 100644
index 00000000..a90f7220
--- /dev/null
+++ b/server/tests/test_llm_adapter_contract.py
@@ -0,0 +1,256 @@
+"""Adapter contract tests — parametrised over every registered adapter.
+
+This test file defines the *public extension surface* for LLM adapters. Any
+adapter (built-in or third-party plug-in) that subclasses ``LlmAdapter`` and
+registers via :func:`register_adapter` must pass every test here.
+
+The contract intentionally tests structural and exception-mapping invariants
+only — it never makes network calls. Provider-specific HTTP and parsing
+behaviour belongs in per-adapter test files (e.g. ``test_llm_adapters.py``,
+``test_llm_bedrock_adapter.py``).
+
+If you are adding a new adapter:
+
+1. Register it via ``register_adapter("<connector_type>", YourClass)``.
+2. Run this file: ``pytest tests/test_llm_adapter_contract.py``.
+3. Every test must pass without modification.
+
+If a test does *not* apply to your adapter, the right answer is to discuss it
+in a PR — not to silently skip the contract. The contract is what lets the
+gateway dispatch generically.
+"""
+
+from __future__ import annotations
+
+import inspect
+from types import SimpleNamespace
+
+import pytest
+
+from app.services.llm.base import ChatRequest, LlmAdapter, Message
+from app.services.llm.exceptions import AuthInvalid, LlmError
+from app.services.llm.registry import get_adapter_class, list_connector_types
+
+
+# ---------------------------------------------------------------------------
+# Parametrisation — runs against every registered connector_type.
+# ---------------------------------------------------------------------------
+def _all_connector_types() -> list[str]:
+    """Snapshot the registry at collection time.
+
+    The registry is populated by ``app.services.llm.registry._bootstrap()``
+    which eagerly imports the built-in adapters package. Any third-party
+    adapter loaded via ``LLM_PLUGIN_DIR`` is also discovered here.
+    """
+    return list_connector_types()
+
+
+@pytest.fixture
+def malformed_connector():
+    """A connector row whose ``credentials`` blob is not valid JSON.
+
+    Every adapter must reject this without crashing, raising :class:`AuthInvalid`
+    rather than leaking a ``JSONDecodeError`` or hitting the network.
+    """
+    return SimpleNamespace(
+        connector_type="contract-test",
+        credentials="this is not valid json",
+        model_hint=None,
+        base_url_plain=None,
+    )
+
+
+# ---------------------------------------------------------------------------
+# Structural contract — class-level guarantees.
+# ---------------------------------------------------------------------------
+@pytest.mark.parametrize("connector_type", _all_connector_types())
+def test_adapter_subclasses_llm_adapter(connector_type: str):
+    """Every registered adapter must subclass the ``LlmAdapter`` ABC."""
+    cls = get_adapter_class(connector_type)
+    assert issubclass(cls, LlmAdapter), (
+        f"{cls.__name__} is registered as {connector_type!r} but does not subclass LlmAdapter"
+    )
+
+
+@pytest.mark.parametrize("connector_type", _all_connector_types())
+def test_adapter_declares_connector_type(connector_type: str):
+    """Each adapter class must declare a non-empty ``connector_type`` attr.
+
+    The registry uses this string to dispatch; an empty value would shadow
+    every other adapter or fail in surprising ways.
+    """
+    cls = get_adapter_class(connector_type)
+    assert getattr(cls, "connector_type", ""), (
+        f"{cls.__name__} must set a class-level connector_type attribute"
+    )
+    # The class attribute must match the registration key. Otherwise an admin
+    # toggling per-DJ MRU lookup will pull the wrong adapter for the row.
+    assert cls.connector_type == connector_type, (
+        f"{cls.__name__}.connector_type is {cls.connector_type!r} but "
+        f"registered as {connector_type!r}"
+    )
+
+
+@pytest.mark.parametrize("connector_type", _all_connector_types())
+def test_adapter_defines_chat_and_health_check(connector_type: str):
+    """Both abstract methods must be implemented as async callables."""
+    cls = get_adapter_class(connector_type)
+    chat = getattr(cls, "chat", None)
+    health = getattr(cls, "health_check", None)
+    assert callable(chat), f"{cls.__name__}.chat must be defined"
+    assert callable(health), f"{cls.__name__}.health_check must be defined"
+    assert inspect.iscoroutinefunction(chat), (
+        f"{cls.__name__}.chat must be `async def` — the gateway awaits it"
+    )
+    assert inspect.iscoroutinefunction(health), f"{cls.__name__}.health_check must be `async def`"
+
+
+@pytest.mark.parametrize("connector_type", _all_connector_types())
+def test_adapter_constructor_accepts_connector(connector_type: str):
+    """Adapters are instantiated as ``cls(connector)`` by the gateway."""
+    cls = get_adapter_class(connector_type)
+    connector = SimpleNamespace(
+        connector_type=connector_type,
+        credentials="{}",
+        model_hint=None,
+        base_url_plain=None,
+    )
+    # Must not raise — credential decoding is deferred until chat()/health().
+    instance = cls(connector)
+    assert instance.connector is connector
+
+
+# ---------------------------------------------------------------------------
+# Exception contract — typed errors only, no provider leakage.
+# ---------------------------------------------------------------------------
+@pytest.mark.parametrize("connector_type", _all_connector_types())
+async def test_adapter_raises_typed_error_on_malformed_credentials(
+    connector_type: str, malformed_connector
+):
+    """An adapter handed a malformed credential blob must raise a typed
+    :class:`LlmError` (specifically :class:`AuthInvalid`) — never a bare
+    :class:`json.JSONDecodeError`, :class:`KeyError`, or a network exception.
+
+    This is the boundary that keeps provider internals from leaking into
+    API error responses.
+    """
+    cls = get_adapter_class(connector_type)
+    adapter = cls(malformed_connector)
+    request = ChatRequest(
+        messages=[Message(role="user", content="ping")],
+        max_tokens=1,
+    )
+
+    # We expect AuthInvalid (the most specific subtype). Some adapters with
+    # additional credential fields might raise a different LlmError subclass —
+    # accept any of them, but never a non-LlmError. The pytest.raises(LlmError)
+    # context manager is the only assertion needed: a non-LlmError exception
+    # would propagate out and fail the test.
+    with pytest.raises(LlmError):
+        await adapter.chat(request)
+
+
+# ---------------------------------------------------------------------------
+# Registry contract — third-party adapters reach the gateway via this path.
+# ---------------------------------------------------------------------------
+def test_registry_returns_classes_not_instances():
+    """``get_adapter_class`` must return a *class*, not an instance.
+
+    The gateway calls ``cls(connector)`` per dispatch; returning an instance
+    here would silently share state across DJs.
+    """
+    for connector_type in _all_connector_types():
+        cls = get_adapter_class(connector_type)
+        assert inspect.isclass(cls), (
+            f"Registry returned a non-class for {connector_type!r}: {cls!r}"
+        )
+
+
+def test_registry_lookup_raises_keyerror_for_unknown():
+    """Unknown ``connector_type`` lookups raise :class:`KeyError`.
+
+    The gateway relies on this to surface ``NoLlmConfigured`` cleanly.
+    """
+    with pytest.raises(KeyError):
+        get_adapter_class("definitely-not-a-real-connector-type")
+
+
+# ---------------------------------------------------------------------------
+# Skeleton contract — proves the documented reference adapter satisfies the
+# same surface as the built-in providers.
+# ---------------------------------------------------------------------------
+def _import_echo_adapter():
+    """Import the docs-tree skeleton adapter as a regular module.
+
+    The skeleton lives outside the ``app`` package (``docs/examples/``), so we
+    register a one-off path entry to import it. We do this *inside* the test
+    rather than at module load time so the registry stays clean for parametrised
+    runs above (the skeleton is also asserted to register cleanly on import).
+    """
+    import importlib
+    import os
+    import sys
+
+    repo_root = os.path.abspath(os.path.join(os.path.dirname(__file__), "..", ".."))
+    if repo_root not in sys.path:
+        sys.path.insert(0, repo_root)
+    return importlib.import_module("docs.examples.echo_adapter")
+
+
+def test_skeleton_echo_adapter_satisfies_contract():
+    """The documented skeleton must pass the same structural contract above.
+
+    This is what guarantees the ``docs/LLM-PLUGIN.md`` "quick start" actually
+    works — a third-party author copying the skeleton gets a registered,
+    contract-compliant adapter without modifying any core file.
+    """
+    module = _import_echo_adapter()
+    echo_cls = module.EchoAdapter
+
+    # Same structural checks the parametrised tests above run, applied directly
+    # so this test still fires when the skeleton is not pre-registered.
+    assert issubclass(echo_cls, LlmAdapter)
+    assert echo_cls.connector_type == "echo"
+    assert inspect.iscoroutinefunction(echo_cls.chat)
+    assert inspect.iscoroutinefunction(echo_cls.health_check)
+
+    # Registry hit via the public surface.
+    assert get_adapter_class("echo") is echo_cls
+
+
+async def test_skeleton_echo_adapter_round_trip():
+    """Smoke-test the echo skeleton end-to-end through ``chat()``.
+
+    Importantly this avoids any network call — proving that the skeleton can
+    be used as a deterministic stand-in for gateway tests.
+    """
+    module = _import_echo_adapter()
+    connector = SimpleNamespace(
+        connector_type="echo",
+        credentials="{}",
+        model_hint="echo-1",
+        base_url_plain=None,
+    )
+    adapter = module.EchoAdapter(connector)
+    request = ChatRequest(
+        messages=[Message(role="user", content="hello world")],
+        max_tokens=8,
+    )
+    response = await adapter.chat(request)
+    assert response.text == "hello world"
+    assert response.stop_reason == "end_turn"
+    assert response.model == "echo-1"
+
+
+async def test_skeleton_echo_adapter_health_check_validates_credentials():
+    """``health_check()`` must raise :class:`AuthInvalid` for malformed creds."""
+    module = _import_echo_adapter()
+    connector = SimpleNamespace(
+        connector_type="echo",
+        credentials="not-json",
+        model_hint=None,
+        base_url_plain=None,
+    )
+    adapter = module.EchoAdapter(connector)
+    with pytest.raises(AuthInvalid):
+        await adapter.health_check()
diff --git a/server/tests/test_llm_adapters.py b/server/tests/test_llm_adapters.py
new file mode 100644
index 00000000..cebfa81a
--- /dev/null
+++ b/server/tests/test_llm_adapters.py
@@ -0,0 +1,1309 @@
+"""Tests for the OpenAI / OpenAI-compatible / Anthropic adapters.
+
+Each adapter is mocked at the HTTP boundary (httpx for OpenAI, anthropic SDK
+for Anthropic) so we exercise the adapter logic without real network calls.
+"""
+
+from __future__ import annotations
+
+import json
+from types import SimpleNamespace
+from unittest.mock import AsyncMock, patch
+
+import httpx
+import pytest
+
+from app.services.llm.adapters._httpx_openai import build_healthcheck_request
+from app.services.llm.adapters.anthropic_apikey import AnthropicApiKeyAdapter
+from app.services.llm.adapters.azure_openai import AzureOpenAIAdapter, _build_azure_endpoint
+from app.services.llm.adapters.gemini_apikey import GeminiApiKeyAdapter
+from app.services.llm.adapters.openai_apikey import OpenAIApiKeyAdapter
+from app.services.llm.adapters.openai_compatible import OpenAICompatibleAdapter
+from app.services.llm.adapters.openrouter_apikey import (
+    OPENROUTER_BASE_URL,
+    OpenRouterApiKeyAdapter,
+)
+from app.services.llm.adapters.xai_apikey import XAI_BASE_URL, XaiApiKeyAdapter
+from app.services.llm.base import ChatRequest, ContentBlock, Message, ToolSpec
+from app.services.llm.exceptions import (
+    AuthInvalid,
+    ProviderUnavailable,
+    QuotaExceeded,
+    RateLimited,
+    ToolTranslationError,
+)
+
+_HTTPX_PATH = "app.services.llm.adapters._httpx_openai.httpx.AsyncClient"
+_AZURE_HTTPX_PATH = "app.services.llm.adapters.azure_openai.httpx.AsyncClient"
+_GEMINI_HTTPX_PATH = "app.services.llm.adapters.gemini_apikey.httpx.AsyncClient"
+
+
+class _FakeAsyncClient:
+    """Wrap a fake Anthropic client so it works with ``async with``.
+
+    The real ``AsyncAnthropic`` client is an async context manager; the adapter
+    uses ``async with self._client(...) as client`` to release HTTP resources.
+    """
+
+    def __init__(self, client):
+        self._client = client
+
+    async def __aenter__(self):
+        return self._client
+
+    async def __aexit__(self, *exc):
+        return False
+
+
+# ---------------------------------------------------------------------------
+# Shared healthcheck request
+# ---------------------------------------------------------------------------
+def test_healthcheck_request_imposes_no_tiny_output_cap():
+    # A 1-token cap is consumed entirely by reasoning models' internal tokens,
+    # producing zero output and an HTTP 400. The probe must leave the budget
+    # to the provider's default.
+    req = build_healthcheck_request()
+    assert req.max_tokens is None
+
+
+# ---------------------------------------------------------------------------
+# Helpers
+# ---------------------------------------------------------------------------
+def _make_openai_connector():
+    return SimpleNamespace(
+        connector_type="openai_apikey",
+        credentials=json.dumps({"api_key": "sk-test-key-123456789012"}),
+        model_hint="gpt-5-mini",
+        base_url_plain=None,
+    )
+
+
+def _make_compatible_connector(base_url="http://127.0.0.1:11434/v1", bearer=None):
+    creds = {"base_url": base_url, "bearer": bearer}
+    return SimpleNamespace(
+        connector_type="openai_compatible",
+        credentials=json.dumps(creds),
+        model_hint="llama3",
+        base_url_plain=base_url,
+    )
+
+
+def _make_azure_connector(
+    api_key="azure-secret-key",
+    resource="my-resource",
+    deployment="gpt4o",
+    api_version="2024-06-01",
+):
+    creds = {
+        "api_key": api_key,
+        "azure_resource_name": resource,
+        "azure_deployment_name": deployment,
+        "azure_api_version": api_version,
+    }
+    return SimpleNamespace(
+        connector_type="azure_openai",
+        credentials=json.dumps(creds),
+        model_hint=None,
+        base_url_plain=None,
+    )
+
+
+def _make_openrouter_connector(model_hint="openai/gpt-4o-mini"):
+    return SimpleNamespace(
+        connector_type="openrouter_apikey",
+        credentials=json.dumps({"api_key": "sk-or-v1-aaaaaaaaaaaaaaaaaaaaaaaaaaaa"}),
+        model_hint=model_hint,
+        base_url_plain=None,
+    )
+
+
+def _make_anthropic_connector():
+    return SimpleNamespace(
+        connector_type="anthropic_apikey",
+        credentials=json.dumps({"api_key": "sk-ant-fake-key-aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa"}),
+        model_hint="claude-haiku-4-5-20251001",
+        base_url_plain=None,
+    )
+
+
+def _make_xai_connector(model_hint="grok-3-mini"):
+    return SimpleNamespace(
+        connector_type="xai_apikey",
+        credentials=json.dumps({"api_key": "xai-fake-key-1234567890123456789012"}),
+        model_hint=model_hint,
+        base_url_plain=None,
+    )
+
+
+# Non-secret placeholder — avoids committing an "AIza…"-shaped literal that trips
+# secret scanners. The adapter doesn't validate key shape (that's done upstream),
+# so any string works for transport-level assertions.
+_GEMINI_TEST_KEY = "gemini-test-key-not-a-real-secret"
+
+
+def _make_gemini_connector(model_hint="gemini-2.5-flash"):
+    return SimpleNamespace(
+        connector_type="gemini_apikey",
+        credentials=json.dumps({"api_key": _GEMINI_TEST_KEY}),
+        model_hint=model_hint,
+        base_url_plain=None,
+    )
+
+
+def _gemini_success_body(text="hi"):
+    return {
+        "candidates": [
+            {"content": {"role": "model", "parts": [{"text": text}]}, "finishReason": "STOP"}
+        ],
+        "usageMetadata": {"promptTokenCount": 3, "candidatesTokenCount": 1},
+        "modelVersion": "gemini-2.5-flash",
+    }
+
+
+def _openai_success_body(text="hi"):
+    return {
+        "model": "gpt-5-mini",
+        "choices": [{"finish_reason": "stop", "message": {"role": "assistant", "content": text}}],
+        "usage": {"prompt_tokens": 3, "completion_tokens": 1},
+    }
+
+
+def _ok_response(json_body):
+    return httpx.Response(
+        200,
+        request=httpx.Request("POST", "https://example.com/v1/chat/completions"),
+        json=json_body,
+    )
+
+
+class _AsyncClient:
+    """Minimal httpx.AsyncClient stub for unit tests."""
+
+    def __init__(self, response: httpx.Response | Exception):
+        self._response = response
+        self.calls: list = []
+
+    async def __aenter__(self):
+        return self
+
+    async def __aexit__(self, *args):
+        return None
+
+    async def post(self, url, json=None, headers=None):
+        self.calls.append({"url": url, "json": json, "headers": headers})
+        if isinstance(self._response, Exception):
+            raise self._response
+        return self._response
+
+
+# ---------------------------------------------------------------------------
+# OpenAI API-key adapter
+# ---------------------------------------------------------------------------
+class TestOpenAIApiKeyAdapter:
+    @pytest.mark.asyncio
+    async def test_happy_path(self):
+        connector = _make_openai_connector()
+        adapter = OpenAIApiKeyAdapter(connector)
+        request = ChatRequest(messages=[Message(role="user", content="hi")])
+
+        client = _AsyncClient(_ok_response(_openai_success_body("pong")))
+        with patch(_HTTPX_PATH, return_value=client):
+            resp = await adapter.chat(request)
+
+        assert resp.text == "pong"
+        assert client.calls[0]["headers"]["Authorization"].startswith("Bearer ")
+        assert client.calls[0]["url"].endswith("/chat/completions")
+
+    @pytest.mark.asyncio
+    async def test_uses_max_completion_tokens_not_max_tokens(self):
+        # OpenAI Platform's newer (GPT-5 / o-series) models reject the legacy
+        # `max_tokens` field with HTTP 400 and require `max_completion_tokens`.
+        connector = _make_openai_connector()
+        adapter = OpenAIApiKeyAdapter(connector)
+        request = ChatRequest(messages=[Message(role="user", content="hi")], max_tokens=100)
+
+        client = _AsyncClient(_ok_response(_openai_success_body("pong")))
+        with patch(_HTTPX_PATH, return_value=client):
+            await adapter.chat(request)
+
+        body = client.calls[0]["json"]
+        assert body["max_completion_tokens"] == 100
+        assert "max_tokens" not in body
+
+    @pytest.mark.asyncio
+    async def test_401_maps_to_auth_invalid(self):
+        connector = _make_openai_connector()
+        adapter = OpenAIApiKeyAdapter(connector)
+        resp = httpx.Response(
+            401,
+            request=httpx.Request("POST", "https://example.com"),
+            json={"error": "bad key"},
+        )
+        client = _AsyncClient(resp)
+        with patch(_HTTPX_PATH, return_value=client):
+            with pytest.raises(AuthInvalid):
+                await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+
+    @pytest.mark.asyncio
+    async def test_429_maps_to_rate_limited_with_retry_after(self):
+        connector = _make_openai_connector()
+        adapter = OpenAIApiKeyAdapter(connector)
+        resp = httpx.Response(
+            429,
+            request=httpx.Request("POST", "https://example.com"),
+            headers={"Retry-After": "42"},
+            json={"error": "ratelimit"},
+        )
+        client = _AsyncClient(resp)
+        with patch(_HTTPX_PATH, return_value=client):
+            with pytest.raises(RateLimited) as exc_info:
+                await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+        assert exc_info.value.retry_after_seconds == 42
+
+    @pytest.mark.asyncio
+    async def test_500_maps_to_provider_unavailable(self):
+        connector = _make_openai_connector()
+        adapter = OpenAIApiKeyAdapter(connector)
+        resp = httpx.Response(
+            502,
+            request=httpx.Request("POST", "https://example.com"),
+            json={"error": "boom"},
+        )
+        client = _AsyncClient(resp)
+        with patch(_HTTPX_PATH, return_value=client):
+            with pytest.raises(ProviderUnavailable):
+                await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+
+    @pytest.mark.asyncio
+    async def test_402_maps_to_quota_exceeded(self):
+        connector = _make_openai_connector()
+        adapter = OpenAIApiKeyAdapter(connector)
+        resp = httpx.Response(
+            402,
+            request=httpx.Request("POST", "https://example.com"),
+            json={"error": "billing"},
+        )
+        client = _AsyncClient(resp)
+        with patch(_HTTPX_PATH, return_value=client):
+            with pytest.raises(QuotaExceeded):
+                await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+
+    @pytest.mark.asyncio
+    async def test_timeout_maps_to_provider_unavailable(self):
+        connector = _make_openai_connector()
+        adapter = OpenAIApiKeyAdapter(connector)
+        client = _AsyncClient(httpx.TimeoutException("timeout"))
+        with patch(_HTTPX_PATH, return_value=client):
+            with pytest.raises(ProviderUnavailable):
+                await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+
+    @pytest.mark.asyncio
+    async def test_malformed_credentials_raise_auth_invalid(self):
+        connector = SimpleNamespace(
+            connector_type="openai_apikey",
+            credentials="not json at all",
+            model_hint="gpt-5-mini",
+            base_url_plain=None,
+        )
+        adapter = OpenAIApiKeyAdapter(connector)
+        with pytest.raises(AuthInvalid):
+            await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+
+    @pytest.mark.asyncio
+    async def test_missing_api_key_raises_auth_invalid(self):
+        connector = SimpleNamespace(
+            connector_type="openai_apikey",
+            credentials=json.dumps({}),
+            model_hint="gpt-5-mini",
+            base_url_plain=None,
+        )
+        adapter = OpenAIApiKeyAdapter(connector)
+        with pytest.raises(AuthInvalid):
+            await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+
+
+# ---------------------------------------------------------------------------
+# OpenAI-compatible adapter
+# ---------------------------------------------------------------------------
+class TestOpenAICompatibleAdapter:
+    @pytest.mark.asyncio
+    async def test_no_bearer_no_auth_header(self):
+        connector = _make_compatible_connector()
+        adapter = OpenAICompatibleAdapter(connector)
+        client = _AsyncClient(_ok_response(_openai_success_body("hello")))
+        with patch(_HTTPX_PATH, return_value=client):
+            resp = await adapter.chat(ChatRequest(messages=[Message(role="user", content="hi")]))
+        assert resp.text == "hello"
+        assert "Authorization" not in client.calls[0]["headers"]
+
+    @pytest.mark.asyncio
+    async def test_with_bearer_sets_authorization(self):
+        connector = _make_compatible_connector(bearer="abc123")
+        adapter = OpenAICompatibleAdapter(connector)
+        client = _AsyncClient(_ok_response(_openai_success_body("hello")))
+        with patch(_HTTPX_PATH, return_value=client):
+            await adapter.chat(ChatRequest(messages=[Message(role="user", content="hi")]))
+        assert client.calls[0]["headers"]["Authorization"] == "Bearer abc123"
+
+    @pytest.mark.asyncio
+    async def test_uses_legacy_max_tokens(self):
+        # Third-party OpenAI-compatible servers (Ollama / vLLM / LMStudio) speak
+        # the legacy `max_tokens` field — they must NOT receive max_completion_tokens.
+        connector = _make_compatible_connector()
+        adapter = OpenAICompatibleAdapter(connector)
+        request = ChatRequest(messages=[Message(role="user", content="hi")], max_tokens=100)
+
+        client = _AsyncClient(_ok_response(_openai_success_body("ok")))
+        with patch(_HTTPX_PATH, return_value=client):
+            await adapter.chat(request)
+
+        body = client.calls[0]["json"]
+        assert body["max_tokens"] == 100
+        assert "max_completion_tokens" not in body
+
+    def test_fails_closed_when_blob_missing_base_url(self):
+        # base_url_plain is a display-only mirror; it must NEVER be used to route
+        # traffic. If the encrypted blob lacks base_url, fail closed.
+        connector = SimpleNamespace(
+            connector_type="openai_compatible",
+            credentials=json.dumps({"bearer": "abc"}),  # no base_url in the blob
+            model_hint="llama3",
+            base_url_plain="http://127.0.0.1:11434/v1",  # mirror present but ignored
+        )
+        adapter = OpenAICompatibleAdapter(connector)
+        with pytest.raises(AuthInvalid):
+            adapter._extract_credentials()
+
+
+# ---------------------------------------------------------------------------
+# OpenRouter API-key adapter
+# ---------------------------------------------------------------------------
+class TestOpenRouterApiKeyAdapter:
+    @pytest.mark.asyncio
+    async def test_happy_path_uses_fixed_base_url_and_bearer(self):
+        connector = _make_openrouter_connector()
+        adapter = OpenRouterApiKeyAdapter(connector)
+        client = _AsyncClient(_ok_response(_openai_success_body("pong")))
+        with patch(_HTTPX_PATH, return_value=client):
+            resp = await adapter.chat(ChatRequest(messages=[Message(role="user", content="hi")]))
+
+        assert resp.text == "pong"
+        # The api_key is surfaced as a Bearer token...
+        assert client.calls[0]["headers"]["Authorization"].startswith("Bearer ")
+        # ...and the request always targets the fixed OpenRouter endpoint.
+        assert client.calls[0]["url"] == f"{OPENROUTER_BASE_URL}/chat/completions"
+
+    @pytest.mark.asyncio
+    async def test_model_hint_is_sent_as_model(self):
+        connector = _make_openrouter_connector(model_hint="anthropic/claude-3.5-sonnet")
+        adapter = OpenRouterApiKeyAdapter(connector)
+        client = _AsyncClient(_ok_response(_openai_success_body("ok")))
+        with patch(_HTTPX_PATH, return_value=client):
+            await adapter.chat(ChatRequest(messages=[Message(role="user", content="hi")]))
+        assert client.calls[0]["json"]["model"] == "anthropic/claude-3.5-sonnet"
+
+    @pytest.mark.asyncio
+    async def test_falls_back_to_default_model_when_no_hint(self):
+        connector = _make_openrouter_connector(model_hint=None)
+        adapter = OpenRouterApiKeyAdapter(connector)
+        client = _AsyncClient(_ok_response(_openai_success_body("ok")))
+        with patch(_HTTPX_PATH, return_value=client):
+            await adapter.chat(ChatRequest(messages=[Message(role="user", content="hi")]))
+        assert client.calls[0]["json"]["model"] == "openai/gpt-4o-mini"
+
+    @pytest.mark.asyncio
+    async def test_401_maps_to_auth_invalid(self):
+        connector = _make_openrouter_connector()
+        adapter = OpenRouterApiKeyAdapter(connector)
+        resp = httpx.Response(
+            401, request=httpx.Request("POST", "https://example.com"), json={"error": "bad"}
+        )
+        client = _AsyncClient(resp)
+        with patch(_HTTPX_PATH, return_value=client):
+            with pytest.raises(AuthInvalid):
+                await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+
+    @pytest.mark.asyncio
+    async def test_429_maps_to_rate_limited(self):
+        connector = _make_openrouter_connector()
+        adapter = OpenRouterApiKeyAdapter(connector)
+        resp = httpx.Response(
+            429,
+            request=httpx.Request("POST", "https://example.com"),
+            headers={"Retry-After": "12"},
+            json={"error": "limit"},
+        )
+        client = _AsyncClient(resp)
+        with patch(_HTTPX_PATH, return_value=client):
+            with pytest.raises(RateLimited) as info:
+                await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+        assert info.value.retry_after_seconds == 12
+
+    @pytest.mark.asyncio
+    async def test_5xx_maps_to_provider_unavailable(self):
+        connector = _make_openrouter_connector()
+        adapter = OpenRouterApiKeyAdapter(connector)
+        resp = httpx.Response(
+            503, request=httpx.Request("POST", "https://example.com"), json={"error": "down"}
+        )
+        client = _AsyncClient(resp)
+        with patch(_HTTPX_PATH, return_value=client):
+            with pytest.raises(ProviderUnavailable):
+                await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+
+    @pytest.mark.asyncio
+    async def test_402_maps_to_quota_exceeded(self):
+        connector = _make_openrouter_connector()
+        adapter = OpenRouterApiKeyAdapter(connector)
+        resp = httpx.Response(
+            402, request=httpx.Request("POST", "https://example.com"), json={"error": "billing"}
+        )
+        client = _AsyncClient(resp)
+        with patch(_HTTPX_PATH, return_value=client):
+            with pytest.raises(QuotaExceeded):
+                await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+
+    @pytest.mark.asyncio
+    async def test_timeout_maps_to_provider_unavailable(self):
+        connector = _make_openrouter_connector()
+        adapter = OpenRouterApiKeyAdapter(connector)
+        client = _AsyncClient(httpx.TimeoutException("timeout"))
+        with patch(_HTTPX_PATH, return_value=client):
+            with pytest.raises(ProviderUnavailable):
+                await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+
+    @pytest.mark.asyncio
+    async def test_malformed_body_raises_tool_translation_error(self):
+        connector = _make_openrouter_connector()
+        adapter = OpenRouterApiKeyAdapter(connector)
+        resp = httpx.Response(
+            200,
+            request=httpx.Request("POST", "https://example.com"),
+            content=b"not json",
+        )
+        client = _AsyncClient(resp)
+        with patch(_HTTPX_PATH, return_value=client):
+            with pytest.raises(ToolTranslationError):
+                await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+
+    @pytest.mark.asyncio
+    async def test_malformed_credentials_raise_auth_invalid(self):
+        connector = SimpleNamespace(
+            connector_type="openrouter_apikey",
+            credentials="not json",
+            model_hint="openai/gpt-4o-mini",
+            base_url_plain=None,
+        )
+        adapter = OpenRouterApiKeyAdapter(connector)
+        with pytest.raises(AuthInvalid):
+            await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+
+    @pytest.mark.asyncio
+    async def test_missing_api_key_raises_auth_invalid(self):
+        connector = SimpleNamespace(
+            connector_type="openrouter_apikey",
+            credentials=json.dumps({}),
+            model_hint="openai/gpt-4o-mini",
+            base_url_plain=None,
+        )
+        adapter = OpenRouterApiKeyAdapter(connector)
+        with pytest.raises(AuthInvalid):
+            await adapter.health_check()
+
+    @pytest.mark.asyncio
+    async def test_health_check_hits_fixed_base_url(self):
+        connector = _make_openrouter_connector()
+        adapter = OpenRouterApiKeyAdapter(connector)
+        client = _AsyncClient(_ok_response(_openai_success_body("ok")))
+        with patch(_HTTPX_PATH, return_value=client):
+            await adapter.health_check()
+        assert client.calls[0]["url"] == f"{OPENROUTER_BASE_URL}/chat/completions"
+
+
+# ---------------------------------------------------------------------------
+# Anthropic API-key adapter
+# ---------------------------------------------------------------------------
+class TestAnthropicApiKeyAdapter:
+    @pytest.mark.asyncio
+    async def test_happy_path(self):
+        connector = _make_anthropic_connector()
+        adapter = AnthropicApiKeyAdapter(connector)
+
+        fake_message = SimpleNamespace(
+            model="claude-haiku-4-5-20251001",
+            stop_reason="end_turn",
+            content=[SimpleNamespace(type="text", text="hi")],
+            usage=SimpleNamespace(input_tokens=3, output_tokens=1),
+        )
+
+        with patch.object(
+            adapter,
+            "_client",
+            return_value=_FakeAsyncClient(
+                SimpleNamespace(
+                    messages=SimpleNamespace(create=AsyncMock(return_value=fake_message))
+                )
+            ),
+        ):
+            resp = await adapter.chat(ChatRequest(messages=[Message(role="user", content="hi")]))
+
+        assert resp.text == "hi"
+        assert resp.usage.prompt == 3
+        assert resp.usage.completion == 1
+
+    @pytest.mark.asyncio
+    async def test_status_error_401_maps_to_auth_invalid(self):
+        from anthropic import APIStatusError
+
+        connector = _make_anthropic_connector()
+        adapter = AnthropicApiKeyAdapter(connector)
+
+        err_response = httpx.Response(
+            401,
+            request=httpx.Request("POST", "https://api.anthropic.com/v1/messages"),
+            json={"error": "bad"},
+        )
+        exc = APIStatusError("auth failed", response=err_response, body=None)
+
+        with patch.object(
+            adapter,
+            "_client",
+            return_value=_FakeAsyncClient(
+                SimpleNamespace(messages=SimpleNamespace(create=AsyncMock(side_effect=exc)))
+            ),
+        ):
+            with pytest.raises(AuthInvalid):
+                await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+
+    @pytest.mark.asyncio
+    async def test_status_error_429_maps_to_rate_limited(self):
+        from anthropic import APIStatusError
+
+        connector = _make_anthropic_connector()
+        adapter = AnthropicApiKeyAdapter(connector)
+
+        err_response = httpx.Response(
+            429,
+            request=httpx.Request("POST", "https://api.anthropic.com/v1/messages"),
+            headers={"retry-after": "30"},
+            json={"error": "limit"},
+        )
+        exc = APIStatusError("rate limited", response=err_response, body=None)
+
+        with patch.object(
+            adapter,
+            "_client",
+            return_value=_FakeAsyncClient(
+                SimpleNamespace(messages=SimpleNamespace(create=AsyncMock(side_effect=exc)))
+            ),
+        ):
+            with pytest.raises(RateLimited) as info:
+                await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+        assert info.value.retry_after_seconds == 30
+
+    @pytest.mark.asyncio
+    async def test_tool_call_message_requires_tool_call_id(self):
+        connector = _make_anthropic_connector()
+        adapter = AnthropicApiKeyAdapter(connector)
+        # Build a tool message without tool_call_id — should raise
+        with pytest.raises(ToolTranslationError):
+            await adapter.chat(
+                ChatRequest(messages=[Message(role="tool", content="result", tool_call_id=None)])
+            )
+
+
+# ---------------------------------------------------------------------------
+# Gemini API-key adapter (native generativelanguage API)
+# ---------------------------------------------------------------------------
+class TestGeminiApiKeyAdapter:
+    @pytest.mark.asyncio
+    async def test_happy_path(self):
+        connector = _make_gemini_connector()
+        adapter = GeminiApiKeyAdapter(connector)
+        request = ChatRequest(messages=[Message(role="user", content="hi")])
+
+        client = _AsyncClient(_ok_response(_gemini_success_body("pong")))
+        with patch(_GEMINI_HTTPX_PATH, return_value=client):
+            resp = await adapter.chat(request)
+
+        assert resp.text == "pong"
+        assert resp.usage.prompt == 3
+        assert resp.usage.completion == 1
+        # API key goes in the x-goog-api-key header, never the URL/query string.
+        assert client.calls[0]["headers"]["x-goog-api-key"] == _GEMINI_TEST_KEY
+        assert _GEMINI_TEST_KEY not in client.calls[0]["url"]
+        assert client.calls[0]["url"].endswith(":generateContent")
+        assert "gemini-2.5-flash" in client.calls[0]["url"]
+
+    @pytest.mark.asyncio
+    async def test_system_prompt_maps_to_system_instruction(self):
+        connector = _make_gemini_connector()
+        adapter = GeminiApiKeyAdapter(connector)
+        request = ChatRequest(
+            messages=[Message(role="user", content="hi")],
+            system="You are a DJ assistant.",
+        )
+        client = _AsyncClient(_ok_response(_gemini_success_body()))
+        with patch(_GEMINI_HTTPX_PATH, return_value=client):
+            await adapter.chat(request)
+        body = client.calls[0]["json"]
+        assert body["systemInstruction"]["parts"][0]["text"] == "You are a DJ assistant."
+        # Assistant turns map to the Gemini "model" role.
+        assert body["contents"][0]["role"] == "user"
+
+    @pytest.mark.asyncio
+    async def test_assistant_role_maps_to_model(self):
+        connector = _make_gemini_connector()
+        adapter = GeminiApiKeyAdapter(connector)
+        request = ChatRequest(
+            messages=[
+                Message(role="user", content="hi"),
+                Message(role="assistant", content="hello"),
+                Message(role="user", content="rank these"),
+            ]
+        )
+        client = _AsyncClient(_ok_response(_gemini_success_body()))
+        with patch(_GEMINI_HTTPX_PATH, return_value=client):
+            await adapter.chat(request)
+        roles = [c["role"] for c in client.calls[0]["json"]["contents"]]
+        assert roles == ["user", "model", "user"]
+
+    @pytest.mark.asyncio
+    async def test_tool_translation_and_parsing(self):
+        connector = _make_gemini_connector()
+        adapter = GeminiApiKeyAdapter(connector)
+        tool = ToolSpec(
+            name="search_queries",
+            description="Generate search queries",
+            input_schema={"type": "object", "properties": {"q": {"type": "string"}}},
+        )
+        request = ChatRequest(
+            messages=[Message(role="user", content="go")],
+            tools=[tool],
+            force_tool="search_queries",
+        )
+        body = {
+            "candidates": [
+                {
+                    "content": {
+                        "parts": [
+                            {"functionCall": {"name": "search_queries", "args": {"q": "house"}}}
+                        ]
+                    },
+                    "finishReason": "STOP",
+                }
+            ],
+            "usageMetadata": {"promptTokenCount": 8, "candidatesTokenCount": 4},
+        }
+        client = _AsyncClient(_ok_response(body))
+        with patch(_GEMINI_HTTPX_PATH, return_value=client):
+            resp = await adapter.chat(request)
+
+        # Request carried Gemini function_declarations + forced toolConfig.
+        sent = client.calls[0]["json"]
+        assert sent["tools"][0]["function_declarations"][0]["name"] == "search_queries"
+        assert sent["toolConfig"]["function_calling_config"]["mode"] == "ANY"
+        # Response parsed back into a canonical tool call.
+        assert resp.stop_reason == "tool_use"
+        assert resp.tool_calls[0].name == "search_queries"
+        assert resp.tool_calls[0].input == {"q": "house"}
+
+    @pytest.mark.asyncio
+    async def test_401_maps_to_auth_invalid(self):
+        connector = _make_gemini_connector()
+        adapter = GeminiApiKeyAdapter(connector)
+        resp = httpx.Response(
+            401,
+            request=httpx.Request("POST", "https://example.com"),
+            json={"error": "bad key"},
+        )
+        client = _AsyncClient(resp)
+        with patch(_GEMINI_HTTPX_PATH, return_value=client):
+            with pytest.raises(AuthInvalid):
+                await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+
+    @pytest.mark.asyncio
+    async def test_403_maps_to_auth_invalid(self):
+        connector = _make_gemini_connector()
+        adapter = GeminiApiKeyAdapter(connector)
+        resp = httpx.Response(
+            403,
+            request=httpx.Request("POST", "https://example.com"),
+            json={"error": "forbidden"},
+        )
+        client = _AsyncClient(resp)
+        with patch(_GEMINI_HTTPX_PATH, return_value=client):
+            with pytest.raises(AuthInvalid):
+                await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+
+    @pytest.mark.asyncio
+    async def test_429_maps_to_rate_limited_with_retry_after(self):
+        connector = _make_gemini_connector()
+        adapter = GeminiApiKeyAdapter(connector)
+        resp = httpx.Response(
+            429,
+            request=httpx.Request("POST", "https://example.com"),
+            headers={"Retry-After": "17"},
+            json={"error": "ratelimit"},
+        )
+        client = _AsyncClient(resp)
+        with patch(_GEMINI_HTTPX_PATH, return_value=client):
+            with pytest.raises(RateLimited) as exc_info:
+                await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+        assert exc_info.value.retry_after_seconds == 17
+
+    @pytest.mark.asyncio
+    async def test_5xx_maps_to_provider_unavailable(self):
+        connector = _make_gemini_connector()
+        adapter = GeminiApiKeyAdapter(connector)
+        resp = httpx.Response(
+            503,
+            request=httpx.Request("POST", "https://example.com"),
+            json={"error": "overloaded"},
+        )
+        client = _AsyncClient(resp)
+        with patch(_GEMINI_HTTPX_PATH, return_value=client):
+            with pytest.raises(ProviderUnavailable):
+                await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+
+    @pytest.mark.asyncio
+    async def test_timeout_maps_to_provider_unavailable(self):
+        connector = _make_gemini_connector()
+        adapter = GeminiApiKeyAdapter(connector)
+        client = _AsyncClient(httpx.TimeoutException("timeout"))
+        with patch(_GEMINI_HTTPX_PATH, return_value=client):
+            with pytest.raises(ProviderUnavailable):
+                await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+
+    @pytest.mark.asyncio
+    async def test_network_error_maps_to_provider_unavailable(self):
+        connector = _make_gemini_connector()
+        adapter = GeminiApiKeyAdapter(connector)
+        client = _AsyncClient(httpx.ConnectError("boom"))
+        with patch(_GEMINI_HTTPX_PATH, return_value=client):
+            with pytest.raises(ProviderUnavailable):
+                await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+
+    @pytest.mark.asyncio
+    async def test_malformed_json_body_raises_translation_error(self):
+        connector = _make_gemini_connector()
+        adapter = GeminiApiKeyAdapter(connector)
+        bad = httpx.Response(
+            200,
+            request=httpx.Request("POST", "https://example.com"),
+            content=b"not json at all",
+        )
+        client = _AsyncClient(bad)
+        with patch(_GEMINI_HTTPX_PATH, return_value=client):
+            with pytest.raises(ToolTranslationError):
+                await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+
+    @pytest.mark.asyncio
+    async def test_malformed_response_shape_raises_translation_error(self):
+        connector = _make_gemini_connector()
+        adapter = GeminiApiKeyAdapter(connector)
+        client = _AsyncClient(_ok_response({"unexpected": "shape"}))
+        with patch(_GEMINI_HTTPX_PATH, return_value=client):
+            with pytest.raises(ToolTranslationError):
+                await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+
+    @pytest.mark.asyncio
+    async def test_malformed_credentials_raise_auth_invalid(self):
+        connector = SimpleNamespace(
+            connector_type="gemini_apikey",
+            credentials="not json at all",
+            model_hint="gemini-2.5-flash",
+            base_url_plain=None,
+        )
+        adapter = GeminiApiKeyAdapter(connector)
+        with pytest.raises(AuthInvalid):
+            await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+
+    @pytest.mark.asyncio
+    async def test_missing_api_key_raises_auth_invalid(self):
+        connector = SimpleNamespace(
+            connector_type="gemini_apikey",
+            credentials=json.dumps({}),
+            model_hint="gemini-2.5-flash",
+            base_url_plain=None,
+        )
+        adapter = GeminiApiKeyAdapter(connector)
+        with pytest.raises(AuthInvalid):
+            await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+
+    @pytest.mark.asyncio
+    async def test_health_check_pings(self):
+        connector = _make_gemini_connector()
+        adapter = GeminiApiKeyAdapter(connector)
+        client = _AsyncClient(_ok_response(_gemini_success_body()))
+        with patch(_GEMINI_HTTPX_PATH, return_value=client):
+            await adapter.health_check()
+        assert len(client.calls) == 1
+
+    @pytest.mark.asyncio
+    async def test_tool_result_message_requires_tool_call_id(self):
+        connector = _make_gemini_connector()
+        adapter = GeminiApiKeyAdapter(connector)
+        with pytest.raises(ToolTranslationError):
+            await adapter.chat(
+                ChatRequest(messages=[Message(role="tool", content="result", tool_call_id=None)])
+            )
+
+    @pytest.mark.asyncio
+    async def test_tool_result_message_maps_to_function_response(self):
+        connector = _make_gemini_connector()
+        adapter = GeminiApiKeyAdapter(connector)
+        request = ChatRequest(
+            messages=[
+                Message(role="tool", content="42", tool_call_id="search_queries"),
+            ]
+        )
+        client = _AsyncClient(_ok_response(_gemini_success_body()))
+        with patch(_GEMINI_HTTPX_PATH, return_value=client):
+            await adapter.chat(request)
+        contents = client.calls[0]["json"]["contents"]
+        fr = contents[0]["parts"][0]["functionResponse"]
+        assert fr["name"] == "search_queries"
+        assert fr["response"] == {"content": "42"}
+
+    @pytest.mark.asyncio
+    async def test_system_role_message_is_dropped_from_contents(self):
+        connector = _make_gemini_connector()
+        adapter = GeminiApiKeyAdapter(connector)
+        request = ChatRequest(
+            messages=[
+                Message(role="system", content="ignored legacy system msg"),
+                Message(role="user", content="hi"),
+            ]
+        )
+        client = _AsyncClient(_ok_response(_gemini_success_body()))
+        with patch(_GEMINI_HTTPX_PATH, return_value=client):
+            await adapter.chat(request)
+        contents = client.calls[0]["json"]["contents"]
+        # The system message is not surfaced as a content turn.
+        assert len(contents) == 1
+        assert contents[0]["role"] == "user"
+
+    @pytest.mark.asyncio
+    async def test_list_content_blocks_flatten_to_text(self):
+        """Regression: list-based content (ContentBlock objects AND raw dicts)
+        must flatten into the part text, not silently drop to empty strings."""
+        connector = _make_gemini_connector()
+        adapter = GeminiApiKeyAdapter(connector)
+        obj_msg = Message(
+            role="user",
+            content=[ContentBlock(text="hello "), ContentBlock(text="world")],
+        )
+        # A dict-shaped block reaching the adapter unvalidated (model_construct
+        # skips Pydantic coercion) must still contribute its text.
+        dict_msg = Message.model_construct(role="assistant", content=[{"text": "ack"}])
+        request = ChatRequest(messages=[obj_msg, dict_msg])
+        client = _AsyncClient(_ok_response(_gemini_success_body()))
+        with patch(_GEMINI_HTTPX_PATH, return_value=client):
+            await adapter.chat(request)
+        contents = client.calls[0]["json"]["contents"]
+        assert contents[0]["parts"][0]["text"] == "hello world"
+        assert contents[1]["parts"][0]["text"] == "ack"
+
+    @pytest.mark.asyncio
+    async def test_402_maps_to_quota_exceeded(self):
+        connector = _make_gemini_connector()
+        adapter = GeminiApiKeyAdapter(connector)
+        resp = httpx.Response(
+            402,
+            request=httpx.Request("POST", "https://example.com"),
+            json={"error": "billing"},
+        )
+        client = _AsyncClient(resp)
+        with patch(_GEMINI_HTTPX_PATH, return_value=client):
+            with pytest.raises(QuotaExceeded):
+                await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+
+    @pytest.mark.asyncio
+    async def test_400_maps_to_translation_error(self):
+        connector = _make_gemini_connector()
+        adapter = GeminiApiKeyAdapter(connector)
+        resp = httpx.Response(
+            400,
+            request=httpx.Request("POST", "https://example.com"),
+            json={"error": "bad request"},
+        )
+        client = _AsyncClient(resp)
+        with patch(_GEMINI_HTTPX_PATH, return_value=client):
+            with pytest.raises(ToolTranslationError):
+                await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+
+    @pytest.mark.asyncio
+    async def test_429_without_retry_after_is_none(self):
+        connector = _make_gemini_connector()
+        adapter = GeminiApiKeyAdapter(connector)
+        resp = httpx.Response(
+            429,
+            request=httpx.Request("POST", "https://example.com"),
+            json={"error": "ratelimit"},
+        )
+        client = _AsyncClient(resp)
+        with patch(_GEMINI_HTTPX_PATH, return_value=client):
+            with pytest.raises(RateLimited) as exc_info:
+                await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+        assert exc_info.value.retry_after_seconds is None
+
+
+# ---------------------------------------------------------------------------
+# Azure OpenAI adapter
+# ---------------------------------------------------------------------------
+class TestAzureOpenAIAdapter:
+    @pytest.mark.asyncio
+    async def test_happy_path_url_and_api_key_header(self):
+        connector = _make_azure_connector(
+            resource="acme", deployment="gpt4o", api_version="2024-06-01"
+        )
+        adapter = AzureOpenAIAdapter(connector)
+        client = _AsyncClient(_ok_response(_openai_success_body("pong")))
+        with patch(_AZURE_HTTPX_PATH, return_value=client):
+            resp = await adapter.chat(ChatRequest(messages=[Message(role="user", content="hi")]))
+
+        assert resp.text == "pong"
+        call = client.calls[0]
+        # Per-deployment URL with api-version query string.
+        assert call["url"] == (
+            "https://acme.openai.azure.com/openai/deployments/gpt4o"
+            "/chat/completions?api-version=2024-06-01"
+        )
+        # Azure uses the `api-key` header, NOT `Authorization: Bearer`.
+        assert call["headers"]["api-key"] == "azure-secret-key"
+        assert "Authorization" not in call["headers"]
+
+    @pytest.mark.asyncio
+    async def test_health_check_succeeds(self):
+        connector = _make_azure_connector()
+        adapter = AzureOpenAIAdapter(connector)
+        client = _AsyncClient(_ok_response(_openai_success_body("ok")))
+        with patch(_AZURE_HTTPX_PATH, return_value=client):
+            await adapter.health_check()
+        assert client.calls[0]["headers"]["api-key"] == "azure-secret-key"
+
+    @pytest.mark.asyncio
+    async def test_uses_max_completion_tokens_not_max_tokens(self):
+        # Azure serves the same OpenAI models, which reject legacy `max_tokens`.
+        connector = _make_azure_connector()
+        adapter = AzureOpenAIAdapter(connector)
+        request = ChatRequest(messages=[Message(role="user", content="hi")], max_tokens=100)
+        client = _AsyncClient(_ok_response(_openai_success_body("ok")))
+        with patch(_AZURE_HTTPX_PATH, return_value=client):
+            await adapter.chat(request)
+        body = client.calls[0]["json"]
+        assert body["max_completion_tokens"] == 100
+        assert "max_tokens" not in body
+
+    @pytest.mark.asyncio
+    async def test_401_maps_to_auth_invalid(self):
+        adapter = AzureOpenAIAdapter(_make_azure_connector())
+        resp = httpx.Response(
+            401, request=httpx.Request("POST", "https://acme.openai.azure.com"), json={}
+        )
+        with patch(_AZURE_HTTPX_PATH, return_value=_AsyncClient(resp)):
+            with pytest.raises(AuthInvalid):
+                await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+
+    @pytest.mark.asyncio
+    async def test_429_maps_to_rate_limited_with_retry_after(self):
+        adapter = AzureOpenAIAdapter(_make_azure_connector())
+        resp = httpx.Response(
+            429,
+            request=httpx.Request("POST", "https://acme.openai.azure.com"),
+            headers={"Retry-After": "17"},
+            json={},
+        )
+        with patch(_AZURE_HTTPX_PATH, return_value=_AsyncClient(resp)):
+            with pytest.raises(RateLimited) as info:
+                await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+        assert info.value.retry_after_seconds == 17
+
+    @pytest.mark.asyncio
+    async def test_5xx_maps_to_provider_unavailable(self):
+        adapter = AzureOpenAIAdapter(_make_azure_connector())
+        resp = httpx.Response(
+            503, request=httpx.Request("POST", "https://acme.openai.azure.com"), json={}
+        )
+        with patch(_AZURE_HTTPX_PATH, return_value=_AsyncClient(resp)):
+            with pytest.raises(ProviderUnavailable):
+                await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+
+    @pytest.mark.asyncio
+    async def test_402_maps_to_quota_exceeded(self):
+        adapter = AzureOpenAIAdapter(_make_azure_connector())
+        resp = httpx.Response(
+            402, request=httpx.Request("POST", "https://acme.openai.azure.com"), json={}
+        )
+        with patch(_AZURE_HTTPX_PATH, return_value=_AsyncClient(resp)):
+            with pytest.raises(QuotaExceeded):
+                await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+
+    @pytest.mark.asyncio
+    async def test_timeout_maps_to_provider_unavailable(self):
+        adapter = AzureOpenAIAdapter(_make_azure_connector())
+        client = _AsyncClient(httpx.TimeoutException("timeout"))
+        with patch(_AZURE_HTTPX_PATH, return_value=client):
+            with pytest.raises(ProviderUnavailable):
+                await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+
+    @pytest.mark.asyncio
+    async def test_malformed_json_body_raises_tool_translation_error(self):
+        adapter = AzureOpenAIAdapter(_make_azure_connector())
+        resp = httpx.Response(
+            200,
+            request=httpx.Request("POST", "https://acme.openai.azure.com"),
+            content=b"not json",
+            headers={"Content-Type": "application/json"},
+        )
+        with patch(_AZURE_HTTPX_PATH, return_value=_AsyncClient(resp)):
+            with pytest.raises(ToolTranslationError):
+                await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+
+    @pytest.mark.asyncio
+    async def test_missing_config_raises_auth_invalid(self):
+        connector = SimpleNamespace(
+            connector_type="azure_openai",
+            credentials=json.dumps({"api_key": "k"}),  # missing azure_* fields
+            model_hint=None,
+            base_url_plain=None,
+        )
+        adapter = AzureOpenAIAdapter(connector)
+        with pytest.raises(AuthInvalid):
+            await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+
+    @pytest.mark.asyncio
+    async def test_malformed_credentials_raise_auth_invalid(self):
+        connector = SimpleNamespace(
+            connector_type="azure_openai",
+            credentials="not json",
+            model_hint=None,
+            base_url_plain=None,
+        )
+        adapter = AzureOpenAIAdapter(connector)
+        with pytest.raises(AuthInvalid):
+            await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+
+    def test_build_endpoint_encodes_and_validates(self):
+        # Valid components compose the expected URL with the query encoded.
+        url = _build_azure_endpoint("acme", "gpt-4o", "2024-06-01")
+        assert url == (
+            "https://acme.openai.azure.com/openai/deployments/gpt-4o"
+            "/chat/completions?api-version=2024-06-01"
+        )
+
+    @pytest.mark.parametrize(
+        ("resource", "deployment", "version"),
+        [
+            ("acme.evil.com/x", "gpt-4o", "2024-06-01"),  # authority rewrite
+            ("acme", "../../admin", "2024-06-01"),  # path traversal
+            ("acme", "gpt-4o", "2024-06-01&inject=1"),  # query injection
+            ("acme/", "gpt-4o", "2024-06-01"),  # trailing slash in host
+            ("acme", "gpt 4o", "2024-06-01"),  # whitespace in deployment
+        ],
+    )
+    def test_build_endpoint_rejects_url_injection(self, resource, deployment, version):
+        with pytest.raises(AuthInvalid):
+            _build_azure_endpoint(resource, deployment, version)
+
+
+# ---------------------------------------------------------------------------
+# xAI Grok API-key adapter
+# ---------------------------------------------------------------------------
+def _openai_tool_call_body(name="pick", args='{"q": "house"}'):
+    return {
+        "model": "grok-3-mini",
+        "choices": [
+            {
+                "finish_reason": "tool_calls",
+                "message": {
+                    "role": "assistant",
+                    "content": None,
+                    "tool_calls": [
+                        {
+                            "id": "call_1",
+                            "type": "function",
+                            "function": {"name": name, "arguments": args},
+                        }
+                    ],
+                },
+            }
+        ],
+        "usage": {"prompt_tokens": 5, "completion_tokens": 2},
+    }
+
+
+class TestXaiApiKeyAdapter:
+    @pytest.mark.asyncio
+    async def test_happy_path_uses_fixed_base_url_and_bearer(self):
+        connector = _make_xai_connector()
+        adapter = XaiApiKeyAdapter(connector)
+        request = ChatRequest(messages=[Message(role="user", content="hi")])
+
+        client = _AsyncClient(_ok_response(_openai_success_body("pong")))
+        with patch(_HTTPX_PATH, return_value=client):
+            resp = await adapter.chat(request)
+
+        assert resp.text == "pong"
+        # Base URL is pinned to xAI — never user-supplied.
+        assert client.calls[0]["url"] == f"{XAI_BASE_URL}/chat/completions"
+        # API key is sent as a bearer token.
+        assert client.calls[0]["headers"]["Authorization"] == (
+            "Bearer xai-fake-key-1234567890123456789012"
+        )
+
+    @pytest.mark.asyncio
+    async def test_tool_use_via_inherited_openai_path(self):
+        connector = _make_xai_connector()
+        adapter = XaiApiKeyAdapter(connector)
+        request = ChatRequest(
+            messages=[Message(role="user", content="suggest")],
+            tools=[
+                ToolSpec(
+                    name="pick",
+                    description="pick a track",
+                    input_schema={"type": "object", "properties": {"q": {"type": "string"}}},
+                )
+            ],
+            force_tool="pick",
+        )
+
+        client = _AsyncClient(_ok_response(_openai_tool_call_body()))
+        with patch(_HTTPX_PATH, return_value=client):
+            resp = await adapter.chat(request)
+
+        # Tool-use translated through the inherited OpenAI-compatible path.
+        assert resp.stop_reason == "tool_use"
+        assert len(resp.tool_calls) == 1
+        assert resp.tool_calls[0].name == "pick"
+        assert resp.tool_calls[0].input == {"q": "house"}
+        # The request body carried the OpenAI function-calling tool shape.
+        sent = client.calls[0]["json"]
+        assert sent["tools"][0]["function"]["name"] == "pick"
+        assert sent["tool_choice"]["function"]["name"] == "pick"
+
+    @pytest.mark.asyncio
+    async def test_401_maps_to_auth_invalid(self):
+        connector = _make_xai_connector()
+        adapter = XaiApiKeyAdapter(connector)
+        resp = httpx.Response(
+            401,
+            request=httpx.Request("POST", "https://api.x.ai/v1/chat/completions"),
+            json={"error": "bad key"},
+        )
+        client = _AsyncClient(resp)
+        with patch(_HTTPX_PATH, return_value=client):
+            with pytest.raises(AuthInvalid):
+                await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+
+    @pytest.mark.asyncio
+    async def test_429_maps_to_rate_limited_with_retry_after(self):
+        connector = _make_xai_connector()
+        adapter = XaiApiKeyAdapter(connector)
+        resp = httpx.Response(
+            429,
+            request=httpx.Request("POST", "https://api.x.ai/v1/chat/completions"),
+            headers={"Retry-After": "17"},
+            json={"error": "ratelimit"},
+        )
+        client = _AsyncClient(resp)
+        with patch(_HTTPX_PATH, return_value=client):
+            with pytest.raises(RateLimited) as exc_info:
+                await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+        assert exc_info.value.retry_after_seconds == 17
+
+    @pytest.mark.asyncio
+    async def test_5xx_maps_to_provider_unavailable_with_xai_context(self):
+        connector = _make_xai_connector()
+        adapter = XaiApiKeyAdapter(connector)
+        resp = httpx.Response(
+            503,
+            request=httpx.Request("POST", "https://api.x.ai/v1/chat/completions"),
+            json={"error": "boom"},
+        )
+        client = _AsyncClient(resp)
+        with patch(_HTTPX_PATH, return_value=client):
+            with pytest.raises(ProviderUnavailable) as exc_info:
+                await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+        assert "xAI" in str(exc_info.value)
+
+    @pytest.mark.asyncio
+    async def test_402_maps_to_quota_exceeded(self):
+        connector = _make_xai_connector()
+        adapter = XaiApiKeyAdapter(connector)
+        resp = httpx.Response(
+            402,
+            request=httpx.Request("POST", "https://api.x.ai/v1/chat/completions"),
+            json={"error": "billing"},
+        )
+        client = _AsyncClient(resp)
+        with patch(_HTTPX_PATH, return_value=client):
+            with pytest.raises(QuotaExceeded):
+                await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+
+    @pytest.mark.asyncio
+    async def test_timeout_maps_to_provider_unavailable(self):
+        connector = _make_xai_connector()
+        adapter = XaiApiKeyAdapter(connector)
+        client = _AsyncClient(httpx.TimeoutException("timeout"))
+        with patch(_HTTPX_PATH, return_value=client):
+            with pytest.raises(ProviderUnavailable):
+                await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+
+    @pytest.mark.asyncio
+    async def test_malformed_response_raises_tool_translation_error(self):
+        connector = _make_xai_connector()
+        adapter = XaiApiKeyAdapter(connector)
+        # 200 with a body that has no choices -> parse error.
+        resp = httpx.Response(
+            200,
+            request=httpx.Request("POST", "https://api.x.ai/v1/chat/completions"),
+            json={"unexpected": "shape"},
+        )
+        client = _AsyncClient(resp)
+        with patch(_HTTPX_PATH, return_value=client):
+            with pytest.raises(ToolTranslationError):
+                await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+
+    @pytest.mark.asyncio
+    async def test_malformed_credentials_raise_auth_invalid(self):
+        connector = SimpleNamespace(
+            connector_type="xai_apikey",
+            credentials="not json at all",
+            model_hint="grok-3-mini",
+            base_url_plain=None,
+        )
+        adapter = XaiApiKeyAdapter(connector)
+        with pytest.raises(AuthInvalid):
+            await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+
+    @pytest.mark.asyncio
+    async def test_missing_api_key_raises_auth_invalid(self):
+        connector = SimpleNamespace(
+            connector_type="xai_apikey",
+            credentials=json.dumps({}),
+            model_hint="grok-3-mini",
+            base_url_plain=None,
+        )
+        adapter = XaiApiKeyAdapter(connector)
+        with pytest.raises(AuthInvalid):
+            await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+
+    @pytest.mark.asyncio
+    async def test_health_check_pings_fixed_base_url(self):
+        connector = _make_xai_connector()
+        adapter = XaiApiKeyAdapter(connector)
+        client = _AsyncClient(_ok_response(_openai_success_body("ok")))
+        with patch(_HTTPX_PATH, return_value=client):
+            await adapter.health_check()
+        assert client.calls[0]["url"] == f"{XAI_BASE_URL}/chat/completions"
+
+    @pytest.mark.asyncio
+    async def test_default_model_used_when_no_model_hint(self):
+        connector = _make_xai_connector(model_hint=None)
+        adapter = XaiApiKeyAdapter(connector)
+        client = _AsyncClient(_ok_response(_openai_success_body("ok")))
+        with patch(_HTTPX_PATH, return_value=client):
+            await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+        assert client.calls[0]["json"]["model"] == "grok-3-mini"
diff --git a/server/tests/test_llm_admin_audit.py b/server/tests/test_llm_admin_audit.py
new file mode 100644
index 00000000..66dd6657
--- /dev/null
+++ b/server/tests/test_llm_admin_audit.py
@@ -0,0 +1,309 @@
+"""Tests for the admin LLM audit-trail browse + CSV export endpoints (#341).
+
+Exercises:
+- GET /api/admin/llm/audit — paginated, filterable JSON browse
+- GET /api/admin/llm/audit.csv — filtered CSV export
+- admin-only auth guard
+- joined actor username + target connector display name
+- never leaks credential material
+"""
+
+from __future__ import annotations
+
+import csv
+import io
+import json
+
+from fastapi.testclient import TestClient
+from sqlalchemy.orm import Session
+
+from app.core.time import utcnow
+from app.models.llm_connector import LlmAuditEvent, LlmConnector
+from app.models.user import User
+from app.services.auth import get_password_hash
+
+
+def _make_dj(db: Session, username: str) -> User:
+    user = User(
+        username=username,
+        password_hash=get_password_hash("password123456"),
+        role="dj",
+    )
+    db.add(user)
+    db.commit()
+    db.refresh(user)
+    return user
+
+
+def _make_connector(db: Session, *, user_id: int, display_name: str) -> LlmConnector:
+    row = LlmConnector(
+        user_id=user_id,
+        connector_type="openai_apikey",
+        display_name=display_name,
+        status="active",
+        credentials=json.dumps({"api_key": "sk-secret-should-never-leak"}),
+    )
+    db.add(row)
+    db.commit()
+    db.refresh(row)
+    return row
+
+
+def _make_audit(
+    db: Session,
+    *,
+    actor_user_id: int,
+    target_connector_id: int | None,
+    event_type: str,
+) -> LlmAuditEvent:
+    row = LlmAuditEvent(
+        actor_user_id=actor_user_id,
+        target_connector_id=target_connector_id,
+        event_type=event_type,
+        created_at=utcnow(),
+    )
+    db.add(row)
+    db.commit()
+    db.refresh(row)
+    return row
+
+
+class TestAuditBrowse:
+    def test_requires_admin(self, client: TestClient, auth_headers):
+        resp = client.get("/api/admin/llm/audit", headers=auth_headers)
+        assert resp.status_code == 403
+
+    def test_unauthenticated_rejected(self, client: TestClient):
+        resp = client.get("/api/admin/llm/audit")
+        assert resp.status_code == 401
+
+    def test_empty_list(self, client: TestClient, admin_headers):
+        resp = client.get("/api/admin/llm/audit", headers=admin_headers)
+        assert resp.status_code == 200
+        data = resp.json()
+        assert data["rows"] == []
+        assert data["total"] == 0
+
+    def test_lists_events_with_joined_labels(
+        self, client: TestClient, admin_headers, db, test_user
+    ):
+        conn = _make_connector(db, user_id=test_user.id, display_name="My OpenAI")
+        _make_audit(
+            db,
+            actor_user_id=test_user.id,
+            target_connector_id=conn.id,
+            event_type="connector_created",
+        )
+
+        resp = client.get("/api/admin/llm/audit", headers=admin_headers)
+        assert resp.status_code == 200
+        data = resp.json()
+        assert data["total"] == 1
+        row = data["rows"][0]
+        assert row["event_type"] == "connector_created"
+        assert row["actor_username"] == "testuser"
+        assert row["target_connector_display_name"] == "My OpenAI"
+        assert row["target_connector_id"] == conn.id
+
+    def test_never_leaks_credentials(self, client: TestClient, admin_headers, db, test_user):
+        conn = _make_connector(db, user_id=test_user.id, display_name="My OpenAI")
+        _make_audit(
+            db,
+            actor_user_id=test_user.id,
+            target_connector_id=conn.id,
+            event_type="connector_created",
+        )
+        resp = client.get("/api/admin/llm/audit", headers=admin_headers)
+        assert "sk-secret-should-never-leak" not in resp.text
+        assert "credentials" not in resp.text
+
+    def test_filter_by_event_type(self, client: TestClient, admin_headers, db, test_user):
+        conn = _make_connector(db, user_id=test_user.id, display_name="C")
+        _make_audit(
+            db,
+            actor_user_id=test_user.id,
+            target_connector_id=conn.id,
+            event_type="connector_created",
+        )
+        _make_audit(
+            db,
+            actor_user_id=test_user.id,
+            target_connector_id=conn.id,
+            event_type="connector_credentials_rotated",
+        )
+        resp = client.get(
+            "/api/admin/llm/audit?event_type=connector_credentials_rotated",
+            headers=admin_headers,
+        )
+        assert resp.status_code == 200
+        data = resp.json()
+        assert data["total"] == 1
+        assert data["rows"][0]["event_type"] == "connector_credentials_rotated"
+
+    def test_filter_by_actor(self, client: TestClient, admin_headers, db, test_user):
+        other = _make_dj(db, "otherdj")
+        conn = _make_connector(db, user_id=test_user.id, display_name="C")
+        _make_audit(
+            db,
+            actor_user_id=test_user.id,
+            target_connector_id=conn.id,
+            event_type="connector_created",
+        )
+        _make_audit(
+            db,
+            actor_user_id=other.id,
+            target_connector_id=conn.id,
+            event_type="connector_revoked_by_admin",
+        )
+        resp = client.get(f"/api/admin/llm/audit?actor_user_id={other.id}", headers=admin_headers)
+        assert resp.status_code == 200
+        data = resp.json()
+        assert data["total"] == 1
+        assert data["rows"][0]["actor_username"] == "otherdj"
+
+    def test_filter_by_target_connector(self, client: TestClient, admin_headers, db, test_user):
+        conn_a = _make_connector(db, user_id=test_user.id, display_name="A")
+        conn_b = _make_connector(db, user_id=test_user.id, display_name="B")
+        _make_audit(
+            db,
+            actor_user_id=test_user.id,
+            target_connector_id=conn_a.id,
+            event_type="connector_created",
+        )
+        _make_audit(
+            db,
+            actor_user_id=test_user.id,
+            target_connector_id=conn_b.id,
+            event_type="connector_created",
+        )
+        resp = client.get(
+            f"/api/admin/llm/audit?target_connector_id={conn_b.id}", headers=admin_headers
+        )
+        assert resp.status_code == 200
+        data = resp.json()
+        assert data["total"] == 1
+        assert data["rows"][0]["target_connector_id"] == conn_b.id
+
+    def test_pagination(self, client: TestClient, admin_headers, db, test_user):
+        conn = _make_connector(db, user_id=test_user.id, display_name="C")
+        for _ in range(5):
+            _make_audit(
+                db,
+                actor_user_id=test_user.id,
+                target_connector_id=conn.id,
+                event_type="connector_created",
+            )
+        resp = client.get("/api/admin/llm/audit?limit=2&offset=0", headers=admin_headers)
+        assert resp.status_code == 200
+        data = resp.json()
+        assert data["total"] == 5
+        assert len(data["rows"]) == 2
+
+        resp2 = client.get("/api/admin/llm/audit?limit=2&offset=4", headers=admin_headers)
+        assert len(resp2.json()["rows"]) == 1
+
+    def test_invalid_limit_rejected(self, client: TestClient, admin_headers):
+        resp = client.get("/api/admin/llm/audit?limit=0", headers=admin_headers)
+        assert resp.status_code == 422
+        resp = client.get("/api/admin/llm/audit?limit=9999", headers=admin_headers)
+        assert resp.status_code == 422
+
+    def test_null_target_connector_renders(self, client: TestClient, admin_headers, db, test_user):
+        # policy_changed events may have a null target connector
+        _make_audit(
+            db,
+            actor_user_id=test_user.id,
+            target_connector_id=None,
+            event_type="policy_changed",
+        )
+        resp = client.get("/api/admin/llm/audit", headers=admin_headers)
+        assert resp.status_code == 200
+        row = resp.json()["rows"][0]
+        assert row["target_connector_id"] is None
+        assert row["target_connector_display_name"] is None
+
+
+class TestAuditCsvExport:
+    def test_requires_admin(self, client: TestClient, auth_headers):
+        resp = client.get("/api/admin/llm/audit.csv", headers=auth_headers)
+        assert resp.status_code == 403
+
+    def test_unauthenticated_rejected(self, client: TestClient):
+        resp = client.get("/api/admin/llm/audit.csv")
+        assert resp.status_code == 401
+
+    def test_csv_content_type_and_rows(self, client: TestClient, admin_headers, db, test_user):
+        conn = _make_connector(db, user_id=test_user.id, display_name="My OpenAI")
+        _make_audit(
+            db,
+            actor_user_id=test_user.id,
+            target_connector_id=conn.id,
+            event_type="connector_created",
+        )
+        resp = client.get("/api/admin/llm/audit.csv", headers=admin_headers)
+        assert resp.status_code == 200
+        assert "text/csv" in resp.headers["content-type"]
+        assert "attachment" in resp.headers.get("content-disposition", "")
+
+        reader = list(csv.reader(io.StringIO(resp.text)))
+        header = reader[0]
+        assert header == ["timestamp", "actor", "event_type", "target_connector", "notes"]
+        assert any("connector_created" in r for r in reader[1:])
+        assert any("My OpenAI" in r for r in reader[1:])
+        assert any("testuser" in r for r in reader[1:])
+
+    def test_csv_honors_event_type_filter(self, client: TestClient, admin_headers, db, test_user):
+        conn = _make_connector(db, user_id=test_user.id, display_name="C")
+        _make_audit(
+            db,
+            actor_user_id=test_user.id,
+            target_connector_id=conn.id,
+            event_type="connector_created",
+        )
+        _make_audit(
+            db,
+            actor_user_id=test_user.id,
+            target_connector_id=conn.id,
+            event_type="connector_deleted",
+        )
+        resp = client.get(
+            "/api/admin/llm/audit.csv?event_type=connector_deleted", headers=admin_headers
+        )
+        assert resp.status_code == 200
+        body = resp.text
+        assert "connector_deleted" in body
+        assert "connector_created" not in body
+
+    def test_csv_never_leaks_credentials(self, client: TestClient, admin_headers, db, test_user):
+        conn = _make_connector(db, user_id=test_user.id, display_name="My OpenAI")
+        _make_audit(
+            db,
+            actor_user_id=test_user.id,
+            target_connector_id=conn.id,
+            event_type="connector_created",
+        )
+        resp = client.get("/api/admin/llm/audit.csv", headers=admin_headers)
+        assert "sk-secret-should-never-leak" not in resp.text
+
+    def test_csv_neutralizes_formula_injection(
+        self, client: TestClient, admin_headers, db, test_user
+    ):
+        # A connector display name that starts with "=" would execute as a
+        # spreadsheet formula if written verbatim into the CSV.
+        conn = _make_connector(db, user_id=test_user.id, display_name='=HYPERLINK("http://evil")')
+        _make_audit(
+            db,
+            actor_user_id=test_user.id,
+            target_connector_id=conn.id,
+            event_type="connector_created",
+        )
+        resp = client.get("/api/admin/llm/audit.csv", headers=admin_headers)
+        assert resp.status_code == 200
+
+        rows = list(csv.reader(io.StringIO(resp.text)))
+        target_cells = [cell for row in rows[1:] for cell in row if "HYPERLINK" in cell]
+        assert target_cells, "expected the injected display name to be present"
+        # Every cell carrying the payload must be defanged with a leading quote
+        # so spreadsheet apps treat it as literal text, not a formula.
+        for cell in target_cells:
+            assert cell.startswith("'="), cell
diff --git a/server/tests/test_llm_api.py b/server/tests/test_llm_api.py
new file mode 100644
index 00000000..4888e15b
--- /dev/null
+++ b/server/tests/test_llm_api.py
@@ -0,0 +1,1093 @@
+"""Tests for the per-DJ LLM connector API + admin oversight API.
+
+Exercises:
+- CRUD endpoints, ownership scoping (404 for other DJs' connectors)
+- policy gating (admin can disable connector types)
+- credential rotation audit
+- admin force-revoke + system default cleanup
+- usage rollup
+"""
+
+from __future__ import annotations
+
+import json
+from unittest.mock import AsyncMock, patch
+
+from fastapi.testclient import TestClient
+from sqlalchemy.orm import Session
+
+from app.models.llm_connector import LlmAuditEvent, LlmConnector
+from app.models.user import User
+from app.services.auth import get_password_hash
+
+
+# ---------- helpers ----------
+def _login(client: TestClient, username: str, password: str) -> dict[str, str]:
+    resp = client.post("/api/auth/login", data={"username": username, "password": password})
+    assert resp.status_code == 200, resp.json()
+    return {"Authorization": f"Bearer {resp.json()['access_token']}"}
+
+
+def _make_other_dj(db: Session) -> User:
+    user = User(
+        username="otherdj",
+        password_hash=get_password_hash("otherpassword123"),
+        role="dj",
+    )
+    db.add(user)
+    db.commit()
+    db.refresh(user)
+    return user
+
+
+# ---------- list / create / scope ----------
+class TestPerDJConnectorsCRUD:
+    def test_list_empty_for_new_user(self, client: TestClient, auth_headers):
+        resp = client.get("/api/llm/connectors", headers=auth_headers)
+        assert resp.status_code == 200
+        assert resp.json() == []
+
+    def test_create_openai_apikey_happy_path(self, client: TestClient, auth_headers, db):
+        body = {
+            "connector_type": "openai_apikey",
+            "display_name": "My OpenAI",
+            "api_key": "sk-proj-abc1234567890abcdef12",
+            "model_hint": "gpt-5-mini",
+        }
+        resp = client.post("/api/llm/connectors", json=body, headers=auth_headers)
+        assert resp.status_code == 201, resp.json()
+        data = resp.json()
+        assert data["connector_type"] == "openai_apikey"
+        assert data["display_name"] == "My OpenAI"
+        # Credentials never returned
+        assert "credentials" not in data
+        assert "api_key" not in data
+
+        # Audit event recorded
+        event = (
+            db.query(LlmAuditEvent).filter(LlmAuditEvent.target_connector_id == data["id"]).first()
+        )
+        assert event is not None
+        assert event.event_type == "connector_created"
+
+    def test_create_anthropic_apikey_happy_path(self, client: TestClient, auth_headers):
+        body = {
+            "connector_type": "anthropic_apikey",
+            "display_name": "My Claude",
+            "api_key": "sk-ant-1234567890abcdef1234567890abcdef1234567890",
+            "model_hint": "claude-haiku-4-5-20251001",
+        }
+        resp = client.post("/api/llm/connectors", json=body, headers=auth_headers)
+        assert resp.status_code == 201, resp.json()
+
+    def test_create_openrouter_apikey_happy_path(self, client: TestClient, auth_headers):
+        body = {
+            "connector_type": "openrouter_apikey",
+            "display_name": "My OpenRouter",
+            "api_key": "sk-or-v1-1234567890abcdef1234567890abcdef",
+            "model_hint": "openai/gpt-4o-mini",
+        }
+        resp = client.post("/api/llm/connectors", json=body, headers=auth_headers)
+        assert resp.status_code == 201, resp.json()
+        data = resp.json()
+        assert data["connector_type"] == "openrouter_apikey"
+        assert data["model_hint"] == "openai/gpt-4o-mini"
+        assert "credentials" not in data
+        assert "api_key" not in data
+
+    def test_create_openrouter_rejects_non_openrouter_key(self, client: TestClient, auth_headers):
+        body = {
+            "connector_type": "openrouter_apikey",
+            "display_name": "Wrong prefix",
+            "api_key": "sk-proj-abc1234567890abcdef12",
+        }
+        resp = client.post("/api/llm/connectors", json=body, headers=auth_headers)
+        assert resp.status_code == 400
+
+    def test_create_openrouter_blocked_by_apikey_policy(
+        self, client: TestClient, auth_headers, admin_headers
+    ):
+        # OpenRouter is gated by the generic api-key flag (no per-provider flag).
+        resp = client.patch(
+            "/api/admin/llm/policy",
+            json={"llm_apikey_connectors_enabled": False},
+            headers=admin_headers,
+        )
+        assert resp.status_code == 200, resp.json()
+        body = {
+            "connector_type": "openrouter_apikey",
+            "display_name": "Should Fail",
+            "api_key": "sk-or-v1-1234567890abcdef1234567890abcdef",
+        }
+        resp = client.post("/api/llm/connectors", json=body, headers=auth_headers)
+        assert resp.status_code == 403
+
+    def test_create_xai_apikey_happy_path(self, client: TestClient, auth_headers):
+        body = {
+            "connector_type": "xai_apikey",
+            "display_name": "My Grok",
+            "api_key": "xai-1234567890abcdef1234567890abcdef",
+            "model_hint": "grok-3-mini",
+        }
+        resp = client.post("/api/llm/connectors", json=body, headers=auth_headers)
+        assert resp.status_code == 201, resp.json()
+        data = resp.json()
+        assert data["connector_type"] == "xai_apikey"
+        assert "api_key" not in data
+
+    def test_create_xai_apikey_rejects_invalid_key_format(self, client: TestClient, auth_headers):
+        body = {
+            "connector_type": "xai_apikey",
+            "display_name": "Bad Grok",
+            # Missing the xai- prefix.
+            "api_key": "sk-1234567890abcdef1234567890",
+        }
+        resp = client.post("/api/llm/connectors", json=body, headers=auth_headers)
+        assert resp.status_code == 400
+
+    def test_create_xai_apikey_blocked_by_apikey_policy(
+        self, client: TestClient, auth_headers, admin_headers
+    ):
+        # The generic api-key policy flag also gates xAI connectors.
+        resp = client.patch(
+            "/api/admin/llm/policy",
+            json={"llm_apikey_connectors_enabled": False},
+            headers=admin_headers,
+        )
+        assert resp.status_code == 200, resp.json()
+        body = {
+            "connector_type": "xai_apikey",
+            "display_name": "Blocked Grok",
+            "api_key": "xai-1234567890abcdef1234567890abcdef",
+        }
+        resp = client.post("/api/llm/connectors", json=body, headers=auth_headers)
+        assert resp.status_code == 403
+
+    def test_create_gemini_apikey_happy_path(self, client: TestClient, auth_headers):
+        # Built at runtime (valid 39-char shape) so no "AIza…" literal is committed.
+        gemini_key = "AIza" + ("A" * 35)
+        body = {
+            "connector_type": "gemini_apikey",
+            "display_name": "My Gemini",
+            "api_key": gemini_key,
+            "model_hint": "gemini-2.5-flash",
+        }
+        resp = client.post("/api/llm/connectors", json=body, headers=auth_headers)
+        assert resp.status_code == 201, resp.json()
+        data = resp.json()
+        assert data["connector_type"] == "gemini_apikey"
+        assert "api_key" not in data
+
+    def test_create_gemini_rejects_non_google_key(self, client: TestClient, auth_headers):
+        body = {
+            "connector_type": "gemini_apikey",
+            "display_name": "Bad Gemini",
+            "api_key": "sk-not-a-google-key",
+        }
+        resp = client.post("/api/llm/connectors", json=body, headers=auth_headers)
+        assert resp.status_code == 400
+
+    def test_gemini_blocked_by_apikey_policy(self, client: TestClient, auth_headers, admin_headers):
+        # Gemini reuses the generic api-key policy flag — no per-provider toggle.
+        resp = client.patch(
+            "/api/admin/llm/policy",
+            json={"llm_apikey_connectors_enabled": False},
+            headers=admin_headers,
+        )
+        assert resp.status_code == 200
+        gemini_key = "AIza" + ("A" * 35)
+        body = {
+            "connector_type": "gemini_apikey",
+            "display_name": "Should Fail",
+            "api_key": gemini_key,
+        }
+        resp = client.post("/api/llm/connectors", json=body, headers=auth_headers)
+        assert resp.status_code == 403
+
+    def test_create_openai_compatible_happy_path(self, client: TestClient, auth_headers):
+        body = {
+            "connector_type": "openai_compatible",
+            "display_name": "Local Ollama",
+            "base_url": "http://127.0.0.1:11434/v1",
+            "model_hint": "llama3",
+        }
+        resp = client.post("/api/llm/connectors", json=body, headers=auth_headers)
+        assert resp.status_code == 201, resp.json()
+        data = resp.json()
+        assert data["base_url_plain"] == "http://127.0.0.1:11434/v1"
+
+    def test_create_bedrock_happy_path(self, client: TestClient, auth_headers, db, test_user):
+        body = {
+            "connector_type": "bedrock",
+            "display_name": "My Bedrock",
+            "aws_access_key_id": "AKIAEXAMPLEKEY12345",
+            "aws_secret_access_key": "wJalrXUtnFEMI/K7MDENG+bPxRfiCYEXAMPLEKEY",
+            "aws_region": "us-east-1",
+            "aws_model_id": "anthropic.claude-3-5-sonnet-20241022-v2:0",
+        }
+        resp = client.post("/api/llm/connectors", json=body, headers=auth_headers)
+        assert resp.status_code == 201, resp.json()
+        data = resp.json()
+        assert data["connector_type"] == "bedrock"
+        # base_url_plain stays null — no plaintext credential surface for bedrock.
+        assert data["base_url_plain"] is None
+        # Verify the encrypted blob round-trips with all four AWS fields.
+        row = db.query(LlmConnector).filter(LlmConnector.id == data["id"]).one()
+        blob = json.loads(row.credentials)
+        assert blob["aws_access_key_id"] == "AKIAEXAMPLEKEY12345"
+        assert blob["aws_secret_access_key"] == "wJalrXUtnFEMI/K7MDENG+bPxRfiCYEXAMPLEKEY"
+        assert blob["aws_region"] == "us-east-1"
+        assert blob["aws_model_id"] == "anthropic.claude-3-5-sonnet-20241022-v2:0"
+
+    def test_create_bedrock_requires_all_aws_fields(self, client: TestClient, auth_headers):
+        body = {
+            "connector_type": "bedrock",
+            "display_name": "Incomplete",
+            "aws_access_key_id": "AKIAEXAMPLEKEY12345",
+            "aws_secret_access_key": "secret",
+            # missing aws_region + aws_model_id
+        }
+        resp = client.post("/api/llm/connectors", json=body, headers=auth_headers)
+        # model_validator → ValueError → 422 (pydantic) before our handler
+        assert resp.status_code in (400, 422)
+
+    def test_create_bedrock_blocked_when_apikey_connectors_disabled(
+        self, client: TestClient, auth_headers, db
+    ):
+        from app.services.system_settings import get_system_settings
+
+        settings = get_system_settings(db)
+        settings.llm_apikey_connectors_enabled = False
+        db.commit()
+
+        body = {
+            "connector_type": "bedrock",
+            "display_name": "Blocked Bedrock",
+            "aws_access_key_id": "AKIAEXAMPLEKEY12345",
+            "aws_secret_access_key": "secret",
+            "aws_region": "us-east-1",
+            "aws_model_id": "meta.llama3-70b-instruct-v1:0",
+        }
+        resp = client.post("/api/llm/connectors", json=body, headers=auth_headers)
+        assert resp.status_code == 403
+
+    def test_rotate_bedrock_credentials(self, client: TestClient, auth_headers, db, test_user):
+        row = LlmConnector(
+            user_id=test_user.id,
+            connector_type="bedrock",
+            display_name="Rotatable",
+            status="active",
+            credentials=json.dumps(
+                {
+                    "aws_access_key_id": "AKIAOLDKEY1234567890",
+                    "aws_secret_access_key": "oldsecret",
+                    "aws_region": "us-east-1",
+                    "aws_model_id": "anthropic.claude-3-5-sonnet-20241022-v2:0",
+                }
+            ),
+        )
+        db.add(row)
+        db.commit()
+        db.refresh(row)
+
+        # Rotate only the secret — other fields must be preserved.
+        resp = client.put(
+            f"/api/llm/connectors/{row.id}/credentials",
+            json={"aws_secret_access_key": "newsecret"},
+            headers=auth_headers,
+        )
+        assert resp.status_code == 200, resp.json()
+        db.refresh(row)
+        blob = json.loads(row.credentials)
+        assert blob["aws_secret_access_key"] == "newsecret"
+        assert blob["aws_access_key_id"] == "AKIAOLDKEY1234567890"
+        assert blob["aws_region"] == "us-east-1"
+        assert blob["aws_model_id"] == "anthropic.claude-3-5-sonnet-20241022-v2:0"
+
+    def test_create_openai_compatible_rejects_public_http(self, client: TestClient, auth_headers):
+        body = {
+            "connector_type": "openai_compatible",
+            "display_name": "Bad URL",
+            "base_url": "http://example.com/v1",
+        }
+        resp = client.post("/api/llm/connectors", json=body, headers=auth_headers)
+        assert resp.status_code == 400
+
+    def test_create_azure_openai_happy_path(self, client: TestClient, auth_headers):
+        body = {
+            "connector_type": "azure_openai",
+            "display_name": "Venue Azure",
+            "api_key": "azure-secret-key-12345",
+            "azure_resource_name": "venue-co",
+            "azure_deployment_name": "gpt4o-prod",
+            "azure_api_version": "2024-06-01",
+        }
+        resp = client.post("/api/llm/connectors", json=body, headers=auth_headers)
+        assert resp.status_code == 201, resp.json()
+        data = resp.json()
+        assert data["connector_type"] == "azure_openai"
+        # Credentials (incl. azure config) are never echoed back.
+        assert "api_key" not in data
+        assert "azure_resource_name" not in data
+        assert data["base_url_plain"] is None
+
+    def test_create_azure_openai_requires_all_config_fields(self, client: TestClient, auth_headers):
+        body = {
+            "connector_type": "azure_openai",
+            "display_name": "Incomplete Azure",
+            "api_key": "azure-secret-key-12345",
+            "azure_resource_name": "venue-co",
+            # missing deployment + api_version
+        }
+        resp = client.post("/api/llm/connectors", json=body, headers=auth_headers)
+        assert resp.status_code in (400, 422)
+
+    def test_rotate_azure_openai_config_without_recreating(
+        self, client: TestClient, auth_headers, db, test_user
+    ):
+        create_body = {
+            "connector_type": "azure_openai",
+            "display_name": "Rotatable Azure",
+            "api_key": "azure-secret-key-12345",
+            "azure_resource_name": "old-resource",
+            "azure_deployment_name": "old-deployment",
+            "azure_api_version": "2024-02-01",
+        }
+        created = client.post("/api/llm/connectors", json=create_body, headers=auth_headers)
+        assert created.status_code == 201, created.json()
+        connector_id = created.json()["id"]
+
+        # Rotate ONLY the deployment + resource — api_key omitted, must be kept.
+        rotate = client.put(
+            f"/api/llm/connectors/{connector_id}/credentials",
+            json={
+                "azure_resource_name": "new-resource",
+                "azure_deployment_name": "new-deployment",
+            },
+            headers=auth_headers,
+        )
+        assert rotate.status_code == 200, rotate.json()
+
+        # Verify the persisted blob carried forward the api_key + version.
+        row = db.get(LlmConnector, connector_id)
+        db.refresh(row)
+        blob = json.loads(row.credentials)
+        assert blob["api_key"] == "azure-secret-key-12345"
+        assert blob["azure_resource_name"] == "new-resource"
+        assert blob["azure_deployment_name"] == "new-deployment"
+        assert blob["azure_api_version"] == "2024-02-01"
+
+    def test_create_azure_openai_rejects_whitespace_only_config(
+        self, client: TestClient, auth_headers
+    ):
+        body = {
+            "connector_type": "azure_openai",
+            "display_name": "Blank Azure",
+            "api_key": "azure-secret-key-12345",
+            "azure_resource_name": "venue-co",
+            "azure_deployment_name": "   ",  # whitespace-only must be rejected
+            "azure_api_version": "2024-06-01",
+        }
+        resp = client.post("/api/llm/connectors", json=body, headers=auth_headers)
+        assert resp.status_code in (400, 422), resp.json()
+
+    def test_rotate_azure_openai_rejects_explicit_empty_field(
+        self, client: TestClient, auth_headers, db, test_user
+    ):
+        create_body = {
+            "connector_type": "azure_openai",
+            "display_name": "Rotatable Azure",
+            "api_key": "azure-secret-key-12345",
+            "azure_resource_name": "old-resource",
+            "azure_deployment_name": "old-deployment",
+            "azure_api_version": "2024-02-01",
+        }
+        created = client.post("/api/llm/connectors", json=create_body, headers=auth_headers)
+        assert created.status_code == 201, created.json()
+        connector_id = created.json()["id"]
+
+        # An explicit "" for one field must be rejected by the storage layer
+        # (passed through to _build_azure_creds), not silently treated as
+        # "omitted". A second valid field satisfies the schema-level
+        # "at least one provided" check so the request reaches rotate_credentials.
+        rotate = client.put(
+            f"/api/llm/connectors/{connector_id}/credentials",
+            json={"azure_resource_name": "", "azure_deployment_name": "still-valid"},
+            headers=auth_headers,
+        )
+        assert rotate.status_code in (400, 422), rotate.json()
+
+        # The original blob is untouched.
+        row = db.get(LlmConnector, connector_id)
+        db.refresh(row)
+        blob = json.loads(row.credentials)
+        assert blob["azure_resource_name"] == "old-resource"
+        assert blob["azure_deployment_name"] == "old-deployment"
+
+    def test_create_rejects_invalid_key_format(self, client: TestClient, auth_headers):
+        body = {
+            "connector_type": "openai_apikey",
+            "display_name": "Bad Key",
+            "api_key": "not-a-valid-key",
+        }
+        resp = client.post("/api/llm/connectors", json=body, headers=auth_headers)
+        assert resp.status_code == 400
+
+    def test_create_rejects_unknown_type(self, client: TestClient, auth_headers):
+        body = {
+            "connector_type": "unknown_provider",
+            "display_name": "Future Provider",
+            "api_key": "sk-anything",
+        }
+        # Pydantic Literal rejects this with 422 before we reach our handler.
+        resp = client.post("/api/llm/connectors", json=body, headers=auth_headers)
+        assert resp.status_code in (400, 422)
+
+    def test_create_blocked_by_admin_policy(
+        self, client: TestClient, auth_headers, db, admin_headers
+    ):
+        # Disable apikey connectors via admin policy
+        resp = client.patch(
+            "/api/admin/llm/policy",
+            json={"llm_apikey_connectors_enabled": False},
+            headers=admin_headers,
+        )
+        assert resp.status_code == 200
+
+        body = {
+            "connector_type": "openai_apikey",
+            "display_name": "Should Fail",
+            "api_key": "sk-proj-abc1234567890abcdef12",
+        }
+        resp = client.post("/api/llm/connectors", json=body, headers=auth_headers)
+        assert resp.status_code == 403
+
+    def test_pending_user_cannot_use_connectors(self, client: TestClient, pending_headers):
+        resp = client.get("/api/llm/connectors", headers=pending_headers)
+        assert resp.status_code == 403
+
+    def test_unauthenticated_cannot_list(self, client: TestClient):
+        resp = client.get("/api/llm/connectors")
+        assert resp.status_code == 401
+
+    def test_list_only_shows_own_connectors(self, client: TestClient, auth_headers, db, test_user):
+        other = _make_other_dj(db)
+        other_row = LlmConnector(
+            user_id=other.id,
+            connector_type="openai_apikey",
+            display_name="Other's connector",
+            status="active",
+            credentials=json.dumps({"api_key": "sk-x"}),
+        )
+        db.add(other_row)
+        db.commit()
+        db.refresh(other_row)
+
+        resp = client.get("/api/llm/connectors", headers=auth_headers)
+        assert resp.status_code == 200
+        assert all(r["user_id"] == test_user.id for r in resp.json())
+
+    def test_404_when_accessing_other_dj_connector(self, client: TestClient, auth_headers, db):
+        other = _make_other_dj(db)
+        other_row = LlmConnector(
+            user_id=other.id,
+            connector_type="openai_apikey",
+            display_name="Other's connector",
+            status="active",
+            credentials=json.dumps({"api_key": "sk-x"}),
+        )
+        db.add(other_row)
+        db.commit()
+        db.refresh(other_row)
+
+        resp = client.delete(f"/api/llm/connectors/{other_row.id}", headers=auth_headers)
+        assert resp.status_code == 404
+
+    def test_delete_own_connector(self, client: TestClient, auth_headers, db, test_user):
+        row = LlmConnector(
+            user_id=test_user.id,
+            connector_type="openai_apikey",
+            display_name="Mine",
+            status="active",
+            credentials=json.dumps({"api_key": "sk-x"}),
+        )
+        db.add(row)
+        db.commit()
+        db.refresh(row)
+
+        resp = client.delete(f"/api/llm/connectors/{row.id}", headers=auth_headers)
+        assert resp.status_code == 204
+        # Audit event recorded
+        assert (
+            db.query(LlmAuditEvent).filter(LlmAuditEvent.event_type == "connector_deleted").count()
+            == 1
+        )
+
+    def test_delete_own_connector_clears_system_default(
+        self, client: TestClient, auth_headers, db, test_user
+    ):
+        from app.services.system_settings import get_system_settings
+
+        row = LlmConnector(
+            user_id=test_user.id,
+            connector_type="openai_apikey",
+            display_name="DefaultMine",
+            status="active",
+            credentials=json.dumps({"api_key": "sk-x"}),
+        )
+        db.add(row)
+        db.commit()
+        db.refresh(row)
+
+        settings = get_system_settings(db)
+        settings.llm_default_connector_id = row.id
+        db.commit()
+
+        resp = client.delete(f"/api/llm/connectors/{row.id}", headers=auth_headers)
+        assert resp.status_code == 204
+
+        db.expire_all()
+        settings = get_system_settings(db)
+        assert settings.llm_default_connector_id is None
+
+    def test_rotate_credentials_audited(self, client: TestClient, auth_headers, db, test_user):
+        row = LlmConnector(
+            user_id=test_user.id,
+            connector_type="openai_apikey",
+            display_name="Mine",
+            status="active",
+            credentials=json.dumps({"api_key": "sk-old1234567890abcdef12"}),
+        )
+        db.add(row)
+        db.commit()
+        db.refresh(row)
+
+        resp = client.put(
+            f"/api/llm/connectors/{row.id}/credentials",
+            json={"api_key": "sk-new1234567890abcdef12"},
+            headers=auth_headers,
+        )
+        assert resp.status_code == 200, resp.json()
+        # Audit event for rotation written
+        assert (
+            db.query(LlmAuditEvent)
+            .filter(LlmAuditEvent.event_type == "connector_credentials_rotated")
+            .count()
+            == 1
+        )
+
+
+# ---------- /connectors/{id}/test (health check) ----------
+class TestHealthCheck:
+    def test_test_endpoint_returns_ok(self, client: TestClient, auth_headers, db, test_user):
+        row = LlmConnector(
+            user_id=test_user.id,
+            connector_type="openai_apikey",
+            display_name="Mine",
+            status="active",
+            credentials=json.dumps({"api_key": "sk-key123"}),
+        )
+        db.add(row)
+        db.commit()
+        db.refresh(row)
+
+        with patch(
+            "app.services.llm.adapters.openai_apikey.OpenAIApiKeyAdapter.health_check",
+            new=AsyncMock(return_value=None),
+        ):
+            resp = client.post(f"/api/llm/connectors/{row.id}/test", headers=auth_headers)
+        assert resp.status_code == 200
+        assert resp.json()["ok"] is True
+
+    def test_test_returns_sanitized_error_on_auth_invalid(
+        self, client: TestClient, auth_headers, db, test_user
+    ):
+        from app.services.llm.exceptions import AuthInvalid
+
+        row = LlmConnector(
+            user_id=test_user.id,
+            connector_type="openai_apikey",
+            display_name="Mine",
+            status="active",
+            credentials=json.dumps({"api_key": "sk-key123"}),
+        )
+        db.add(row)
+        db.commit()
+        db.refresh(row)
+
+        with patch(
+            "app.services.llm.adapters.openai_apikey.OpenAIApiKeyAdapter.health_check",
+            new=AsyncMock(side_effect=AuthInvalid("upstream secret should not leak")),
+        ):
+            resp = client.post(f"/api/llm/connectors/{row.id}/test", headers=auth_headers)
+        assert resp.status_code == 200
+        data = resp.json()
+        assert data["ok"] is False
+        assert data["error_code"] == "auth_invalid"
+        # Sanitised — no raw exception message
+        assert "upstream secret should not leak" not in (data["message"] or "")
+
+        db.refresh(row)
+        assert row.status == "auth_invalid"
+
+
+# ---------- OpenRouter model catalogue endpoint ----------
+class TestOpenRouterModels:
+    def test_returns_cached_model_list(self, client: TestClient, auth_headers):
+        from app.schemas.ai_settings import AIModelInfo
+
+        models = [
+            AIModelInfo(id="openai/gpt-4o-mini", name="GPT-4o mini"),
+            AIModelInfo(id="anthropic/claude-3.5-sonnet", name="Claude 3.5 Sonnet"),
+        ]
+        with patch(
+            "app.api.llm.get_openrouter_models",
+            new=AsyncMock(return_value=models),
+        ):
+            resp = client.get("/api/llm/openrouter/models", headers=auth_headers)
+        assert resp.status_code == 200
+        ids = [m["id"] for m in resp.json()["models"]]
+        assert ids == ["openai/gpt-4o-mini", "anthropic/claude-3.5-sonnet"]
+
+    def test_returns_empty_when_catalogue_unavailable(self, client: TestClient, auth_headers):
+        with patch("app.api.llm.get_openrouter_models", new=AsyncMock(return_value=[])):
+            resp = client.get("/api/llm/openrouter/models", headers=auth_headers)
+        assert resp.status_code == 200
+        assert resp.json()["models"] == []
+
+    def test_requires_authentication(self, client: TestClient):
+        resp = client.get("/api/llm/openrouter/models")
+        assert resp.status_code == 401
+
+
+# ---------- Admin policy / oversight ----------
+class TestAdminLlm:
+    def test_get_policy(self, client: TestClient, admin_headers):
+        resp = client.get("/api/admin/llm/policy", headers=admin_headers)
+        assert resp.status_code == 200
+        data = resp.json()
+        assert "llm_apikey_connectors_enabled" in data
+        assert "llm_compatible_connector_enabled" in data
+
+    def test_patch_policy_toggles(self, client: TestClient, admin_headers):
+        resp = client.patch(
+            "/api/admin/llm/policy",
+            json={
+                "llm_apikey_connectors_enabled": False,
+                "llm_compatible_connector_enabled": False,
+            },
+            headers=admin_headers,
+        )
+        assert resp.status_code == 200
+        data = resp.json()
+        assert data["llm_apikey_connectors_enabled"] is False
+        assert data["llm_compatible_connector_enabled"] is False
+
+    def test_non_admin_cannot_get_policy(self, client: TestClient, auth_headers):
+        resp = client.get("/api/admin/llm/policy", headers=auth_headers)
+        assert resp.status_code == 403
+
+    def test_patch_policy_rejects_clear_default_with_id(self, client: TestClient, admin_headers):
+        # clear_default and a non-null default id are contradictory.
+        resp = client.patch(
+            "/api/admin/llm/policy",
+            json={"clear_default": True, "llm_default_connector_id": 1},
+            headers=admin_headers,
+        )
+        assert resp.status_code == 422
+
+    def test_policy_exposes_retention_default(self, client: TestClient, admin_headers):
+        # Issue #342: retention is surfaced via the policy endpoint and defaults to 30.
+        resp = client.get("/api/admin/llm/policy", headers=admin_headers)
+        assert resp.status_code == 200
+        assert resp.json()["llm_call_log_retention_days"] == 30
+
+    def test_patch_retention_persists(self, client: TestClient, admin_headers, db):
+        resp = client.patch(
+            "/api/admin/llm/policy",
+            json={"llm_call_log_retention_days": 90},
+            headers=admin_headers,
+        )
+        assert resp.status_code == 200
+        assert resp.json()["llm_call_log_retention_days"] == 90
+
+        # Persisted to the DB-backed singleton, visible on a fresh GET.
+        resp = client.get("/api/admin/llm/policy", headers=admin_headers)
+        assert resp.json()["llm_call_log_retention_days"] == 90
+
+        from app.services.system_settings import get_system_settings
+
+        assert get_system_settings(db).llm_call_log_retention_days == 90
+
+    def test_patch_retention_below_min_rejected(self, client: TestClient, admin_headers):
+        # Sanity bound: minimum 7 days. Rejected at the API level (422).
+        resp = client.patch(
+            "/api/admin/llm/policy",
+            json={"llm_call_log_retention_days": 6},
+            headers=admin_headers,
+        )
+        assert resp.status_code == 422
+
+    def test_patch_retention_above_max_rejected(self, client: TestClient, admin_headers):
+        # Sanity bound: maximum 365 days. Rejected at the API level (422).
+        resp = client.patch(
+            "/api/admin/llm/policy",
+            json={"llm_call_log_retention_days": 366},
+            headers=admin_headers,
+        )
+        assert resp.status_code == 422
+
+    def test_patch_retention_accepts_boundaries(self, client: TestClient, admin_headers):
+        for value in (7, 365):
+            resp = client.patch(
+                "/api/admin/llm/policy",
+                json={"llm_call_log_retention_days": value},
+                headers=admin_headers,
+            )
+            assert resp.status_code == 200
+            assert resp.json()["llm_call_log_retention_days"] == value
+
+    def test_list_connectors_admin_shows_all(
+        self, client: TestClient, admin_headers, db, test_user
+    ):
+        row = LlmConnector(
+            user_id=test_user.id,
+            connector_type="openai_apikey",
+            display_name="Mine",
+            status="active",
+            credentials=json.dumps({"api_key": "sk-x"}),
+        )
+        db.add(row)
+        db.commit()
+        db.refresh(row)
+        resp = client.get("/api/admin/llm/connectors", headers=admin_headers)
+        assert resp.status_code == 200
+        users = [r["dj_username"] for r in resp.json()]
+        assert "testuser" in users
+
+    def test_force_revoke_clears_default(self, client: TestClient, admin_headers, db, test_user):
+        row = LlmConnector(
+            user_id=test_user.id,
+            connector_type="openai_apikey",
+            display_name="Mine",
+            status="active",
+            credentials=json.dumps({"api_key": "sk-x"}),
+        )
+        db.add(row)
+        db.commit()
+        db.refresh(row)
+
+        # Set as default
+        resp = client.patch(
+            "/api/admin/llm/policy",
+            json={"llm_default_connector_id": row.id},
+            headers=admin_headers,
+        )
+        assert resp.status_code == 200
+
+        # Revoke
+        resp = client.post(f"/api/admin/llm/connectors/{row.id}/revoke", headers=admin_headers)
+        assert resp.status_code == 200
+        assert resp.json()["status"] == "disabled"
+
+        # Default cleared
+        resp = client.get("/api/admin/llm/policy", headers=admin_headers)
+        assert resp.json()["llm_default_connector_id"] is None
+
+        # Audit recorded
+        assert (
+            db.query(LlmAuditEvent)
+            .filter(LlmAuditEvent.event_type == "connector_revoked_by_admin")
+            .count()
+            == 1
+        )
+
+    def test_usage_endpoint(self, client: TestClient, admin_headers, db, test_user):
+        # Seed a connector and a call log row
+        row = LlmConnector(
+            user_id=test_user.id,
+            connector_type="openai_apikey",
+            display_name="Mine",
+            status="active",
+            credentials=json.dumps({"api_key": "sk-x"}),
+        )
+        db.add(row)
+        db.commit()
+        db.refresh(row)
+        from app.services.llm.connector_storage import log_call
+
+        log_call(
+            db,
+            connector_id=row.id,
+            purpose="recommendation",
+            status="ok",
+            latency_ms=100,
+            tokens_in=10,
+            tokens_out=5,
+        )
+        db.commit()
+
+        resp = client.get("/api/admin/llm/usage?days=30", headers=admin_headers)
+        assert resp.status_code == 200
+        data = resp.json()
+        assert data["days"] == 30
+        assert any(r["connector_id"] == row.id for r in data["rows"])
+
+    # ---------- Monthly token cap (issue #339) ----------
+
+    def test_connectors_listing_includes_cap_and_usage(
+        self, client: TestClient, admin_headers, db, test_user
+    ):
+        row = LlmConnector(
+            user_id=test_user.id,
+            connector_type="openai_apikey",
+            display_name="Capped",
+            status="active",
+            credentials=json.dumps({"api_key": "sk-x"}),
+            monthly_token_cap=1000,
+        )
+        db.add(row)
+        db.commit()
+        db.refresh(row)
+        from app.services.llm.connector_storage import log_call
+
+        log_call(
+            db,
+            connector_id=row.id,
+            purpose="recommendation",
+            status="ok",
+            latency_ms=10,
+            tokens_in=120,
+            tokens_out=80,
+        )
+        db.commit()
+
+        resp = client.get("/api/admin/llm/connectors", headers=admin_headers)
+        assert resp.status_code == 200
+        listed = next(r for r in resp.json() if r["id"] == row.id)
+        assert listed["monthly_token_cap"] == 1000
+        assert listed["current_month_tokens"] == 200
+
+    def test_set_connector_cap(self, client: TestClient, admin_headers, db, test_user):
+        row = LlmConnector(
+            user_id=test_user.id,
+            connector_type="openai_apikey",
+            display_name="C",
+            status="active",
+            credentials=json.dumps({"api_key": "sk-x"}),
+        )
+        db.add(row)
+        db.commit()
+        db.refresh(row)
+
+        resp = client.patch(
+            f"/api/admin/llm/connectors/{row.id}/cap",
+            headers=admin_headers,
+            json={"monthly_token_cap": 50000},
+        )
+        assert resp.status_code == 200
+        assert resp.json()["monthly_token_cap"] == 50000
+
+        # Clearing it (null) returns it to unlimited.
+        resp = client.patch(
+            f"/api/admin/llm/connectors/{row.id}/cap",
+            headers=admin_headers,
+            json={"monthly_token_cap": None},
+        )
+        assert resp.status_code == 200
+        assert resp.json()["monthly_token_cap"] is None
+
+        # Audit row written (reuses policy_changed event type).
+        assert (
+            db.query(LlmAuditEvent)
+            .filter(
+                LlmAuditEvent.event_type == "policy_changed",
+                LlmAuditEvent.target_connector_id == row.id,
+            )
+            .count()
+            == 2
+        )
+
+    def test_set_cap_zero_allowed(self, client: TestClient, admin_headers, db, test_user):
+        # 0 is a valid cap meaning "no further calls this month".
+        row = LlmConnector(
+            user_id=test_user.id,
+            connector_type="openai_apikey",
+            display_name="Zero",
+            status="active",
+            credentials=json.dumps({"api_key": "sk-x"}),
+        )
+        db.add(row)
+        db.commit()
+        db.refresh(row)
+
+        resp = client.patch(
+            f"/api/admin/llm/connectors/{row.id}/cap",
+            headers=admin_headers,
+            json={"monthly_token_cap": 0},
+        )
+        assert resp.status_code == 200
+        assert resp.json()["monthly_token_cap"] == 0
+
+    def test_set_cap_rejects_negative(self, client: TestClient, admin_headers, db, test_user):
+        row = LlmConnector(
+            user_id=test_user.id,
+            connector_type="openai_apikey",
+            display_name="Neg",
+            status="active",
+            credentials=json.dumps({"api_key": "sk-x"}),
+        )
+        db.add(row)
+        db.commit()
+        db.refresh(row)
+
+        resp = client.patch(
+            f"/api/admin/llm/connectors/{row.id}/cap",
+            headers=admin_headers,
+            json={"monthly_token_cap": -5},
+        )
+        assert resp.status_code == 422  # Pydantic ge=0 rejection
+
+    def test_set_cap_rejects_empty_body(self, client: TestClient, admin_headers, db, test_user):
+        # monthly_token_cap is required: an empty {} body must be rejected (422),
+        # not silently treated as null — otherwise an accidental no-field PATCH
+        # would wipe a configured cap (CodeRabbit #377).
+        row = LlmConnector(
+            user_id=test_user.id,
+            connector_type="openai_apikey",
+            display_name="EmptyBody",
+            status="active",
+            credentials=json.dumps({"api_key": "sk-x"}),
+            monthly_token_cap=1000,
+        )
+        db.add(row)
+        db.commit()
+        db.refresh(row)
+
+        resp = client.patch(
+            f"/api/admin/llm/connectors/{row.id}/cap",
+            headers=admin_headers,
+            json={},
+        )
+        assert resp.status_code == 422
+        # The cap must be untouched by the rejected request.
+        db.refresh(row)
+        assert row.monthly_token_cap == 1000
+
+    def test_set_cap_404_for_missing_connector(self, client: TestClient, admin_headers):
+        resp = client.patch(
+            "/api/admin/llm/connectors/999999/cap",
+            headers=admin_headers,
+            json={"monthly_token_cap": 100},
+        )
+        assert resp.status_code == 404
+
+    def test_set_cap_requires_admin(self, client: TestClient, auth_headers, db, test_user):
+        # A non-admin (plain DJ) must be rejected even for their own connector.
+        row = LlmConnector(
+            user_id=test_user.id,
+            connector_type="openai_apikey",
+            display_name="C3",
+            status="active",
+            credentials=json.dumps({"api_key": "sk-x"}),
+        )
+        db.add(row)
+        db.commit()
+        db.refresh(row)
+
+        resp = client.patch(
+            f"/api/admin/llm/connectors/{row.id}/cap",
+            headers=auth_headers,
+            json={"monthly_token_cap": 100},
+        )
+        assert resp.status_code == 403
+
+
+# ---------- DJ-readable policy endpoint (issue #355) ----------
+class TestDjPolicyEndpoint:
+    """GET /api/llm/policy — DJ-scoped, non-sensitive policy surface.
+
+    A normal DJ must be able to read which connector types the admin has
+    enabled so the settings/ai page can fail closed instead of offering
+    providers that the server will reject at create time.
+    """
+
+    def test_dj_can_read_policy_defaults_all_allowed(self, client: TestClient, auth_headers):
+        resp = client.get("/api/llm/policy", headers=auth_headers)
+        assert resp.status_code == 200
+        data = resp.json()
+        # Defaults: both flags enabled.
+        assert data["llm_apikey_connectors_enabled"] is True
+        assert data["llm_compatible_connector_enabled"] is True
+        # The allowed-types set must cover every valid connector type by default.
+        assert set(data["allowed_connector_types"]) == {
+            "openai_apikey",
+            "anthropic_apikey",
+            "openai_compatible",
+            "gemini_apikey",
+            "azure_openai",
+            "bedrock",
+            "openrouter_apikey",
+            "xai_apikey",
+        }
+        # Must NOT leak the sensitive admin-only default-connector pointer.
+        assert "llm_default_connector_id" not in data
+
+    def test_policy_reflects_apikey_disabled(self, client: TestClient, auth_headers, admin_headers):
+        resp = client.patch(
+            "/api/admin/llm/policy",
+            json={"llm_apikey_connectors_enabled": False},
+            headers=admin_headers,
+        )
+        assert resp.status_code == 200
+
+        resp = client.get("/api/llm/policy", headers=auth_headers)
+        assert resp.status_code == 200
+        data = resp.json()
+        assert data["llm_apikey_connectors_enabled"] is False
+        assert data["llm_compatible_connector_enabled"] is True
+        # Only the openai_compatible type remains allowed.
+        assert data["allowed_connector_types"] == ["openai_compatible"]
+
+    def test_policy_reflects_compatible_disabled(
+        self, client: TestClient, auth_headers, admin_headers
+    ):
+        resp = client.patch(
+            "/api/admin/llm/policy",
+            json={"llm_compatible_connector_enabled": False},
+            headers=admin_headers,
+        )
+        assert resp.status_code == 200
+
+        resp = client.get("/api/llm/policy", headers=auth_headers)
+        assert resp.status_code == 200
+        data = resp.json()
+        assert data["llm_compatible_connector_enabled"] is False
+        assert "openai_compatible" not in data["allowed_connector_types"]
+        # API-key types still present.
+        assert "openai_apikey" in data["allowed_connector_types"]
+
+    def test_policy_all_disabled_yields_empty_allowed(
+        self, client: TestClient, auth_headers, admin_headers
+    ):
+        resp = client.patch(
+            "/api/admin/llm/policy",
+            json={
+                "llm_apikey_connectors_enabled": False,
+                "llm_compatible_connector_enabled": False,
+            },
+            headers=admin_headers,
+        )
+        assert resp.status_code == 200
+
+        resp = client.get("/api/llm/policy", headers=auth_headers)
+        assert resp.status_code == 200
+        assert resp.json()["allowed_connector_types"] == []
+
+    def test_pending_user_cannot_read_policy(self, client: TestClient, pending_headers):
+        resp = client.get("/api/llm/policy", headers=pending_headers)
+        assert resp.status_code == 403
+
+    def test_unauthenticated_cannot_read_policy(self, client: TestClient):
+        resp = client.get("/api/llm/policy")
+        assert resp.status_code == 401
diff --git a/server/tests/test_llm_bedrock_adapter.py b/server/tests/test_llm_bedrock_adapter.py
new file mode 100644
index 00000000..a6b6143b
--- /dev/null
+++ b/server/tests/test_llm_bedrock_adapter.py
@@ -0,0 +1,330 @@
+"""Tests for the AWS Bedrock adapter (SigV4 over httpx, no boto3).
+
+The HTTP boundary is mocked — we never reach real AWS. Both Bedrock Claude
+(``anthropic.*``) and Bedrock Llama (``meta.*``) model families are exercised
+because their request bodies and tool semantics differ.
+"""
+
+from __future__ import annotations
+
+import json
+from types import SimpleNamespace
+from unittest.mock import patch
+
+import httpx
+import pytest
+
+from app.services.llm.adapters.bedrock import BedrockAdapter, model_family
+from app.services.llm.base import ChatRequest, Message, ToolSpec
+from app.services.llm.exceptions import (
+    AuthInvalid,
+    ProviderUnavailable,
+    QuotaExceeded,
+    RateLimited,
+    ToolTranslationError,
+)
+
+_HTTPX_PATH = "app.services.llm.adapters.bedrock.httpx.AsyncClient"
+
+
+# ---------------------------------------------------------------------------
+# Helpers
+# ---------------------------------------------------------------------------
+def _bedrock_connector(model_id="anthropic.claude-3-5-sonnet-20241022-v2:0"):
+    return SimpleNamespace(
+        connector_type="bedrock",
+        credentials=json.dumps(
+            {
+                "aws_access_key_id": "AKIDEXAMPLE",
+                "aws_secret_access_key": "wJalrXUtnFEMI/K7MDENG+bPxRfiCYEXAMPLEKEY",
+                "aws_region": "us-east-1",
+                "aws_model_id": model_id,
+            }
+        ),
+        model_hint=None,
+        base_url_plain=None,
+    )
+
+
+def _anthropic_body(text="hi"):
+    return {
+        "model": "claude",
+        "stop_reason": "end_turn",
+        "content": [{"type": "text", "text": text}],
+        "usage": {"input_tokens": 3, "output_tokens": 1},
+    }
+
+
+def _anthropic_tool_body(name, tool_input):
+    return {
+        "model": "claude",
+        "stop_reason": "tool_use",
+        "content": [{"type": "tool_use", "id": "tu_1", "name": name, "input": tool_input}],
+        "usage": {"input_tokens": 5, "output_tokens": 2},
+    }
+
+
+def _llama_body(generation, stop_reason="stop"):
+    return {
+        "generation": generation,
+        "stop_reason": stop_reason,
+        "prompt_token_count": 7,
+        "generation_token_count": 4,
+    }
+
+
+def _ok(json_body):
+    return httpx.Response(
+        200,
+        request=httpx.Request("POST", "https://bedrock-runtime.us-east-1.amazonaws.com/x"),
+        json=json_body,
+    )
+
+
+def _err(status, headers=None):
+    return httpx.Response(
+        status,
+        request=httpx.Request("POST", "https://bedrock-runtime.us-east-1.amazonaws.com/x"),
+        headers=headers or {},
+        json={"message": "x"},
+    )
+
+
+class _AsyncClient:
+    def __init__(self, response):
+        self._response = response
+        self.calls: list = []
+
+    async def __aenter__(self):
+        return self
+
+    async def __aexit__(self, *args):
+        return None
+
+    async def post(self, url, content=None, headers=None):
+        self.calls.append({"url": url, "content": content, "headers": headers})
+        if isinstance(self._response, Exception):
+            raise self._response
+        return self._response
+
+
+# ---------------------------------------------------------------------------
+# model family detection
+# ---------------------------------------------------------------------------
+class TestModelFamily:
+    def test_anthropic_family(self):
+        assert model_family("anthropic.claude-3-5-sonnet-20241022-v2:0") == "anthropic"
+
+    def test_anthropic_inference_profile_prefix(self):
+        assert model_family("us.anthropic.claude-3-5-haiku-20241022-v1:0") == "anthropic"
+
+    def test_llama_family_meta_prefix(self):
+        assert model_family("meta.llama3-70b-instruct-v1:0") == "llama"
+
+    def test_llama_family_name_match(self):
+        assert model_family("us.meta.llama3-1-8b-instruct-v1:0") == "llama"
+
+    def test_unknown_family_raises(self):
+        with pytest.raises(ToolTranslationError):
+            model_family("amazon.titan-text-express-v1")
+
+
+# ---------------------------------------------------------------------------
+# Bedrock Claude (anthropic.*)
+# ---------------------------------------------------------------------------
+class TestBedrockClaude:
+    @pytest.mark.asyncio
+    async def test_happy_path_signs_and_parses(self):
+        adapter = BedrockAdapter(_bedrock_connector())
+        client = _AsyncClient(_ok(_anthropic_body("pong")))
+        with patch(_HTTPX_PATH, return_value=client):
+            resp = await adapter.chat(ChatRequest(messages=[Message(role="user", content="hi")]))
+
+        assert resp.text == "pong"
+        assert resp.usage.prompt == 3
+        assert resp.usage.completion == 1
+        assert resp.model == "anthropic.claude-3-5-sonnet-20241022-v2:0"
+        # SigV4 auth — not a bearer token.
+        auth = client.calls[0]["headers"]["Authorization"]
+        assert auth.startswith("AWS4-HMAC-SHA256 ")
+        assert "X-Amz-Date" in client.calls[0]["headers"]
+        assert client.calls[0]["url"].endswith(
+            "/model/anthropic.claude-3-5-sonnet-20241022-v2:0/invoke"
+        )
+
+    @pytest.mark.asyncio
+    async def test_request_body_uses_anthropic_schema(self):
+        adapter = BedrockAdapter(_bedrock_connector())
+        client = _AsyncClient(_ok(_anthropic_body()))
+        with patch(_HTTPX_PATH, return_value=client):
+            await adapter.chat(
+                ChatRequest(messages=[Message(role="user", content="hi")], system="be terse")
+            )
+        body = json.loads(client.calls[0]["content"])
+        assert body["anthropic_version"] == "bedrock-2023-05-31"
+        assert body["system"] == "be terse"
+        assert body["messages"] == [{"role": "user", "content": "hi"}]
+
+    @pytest.mark.asyncio
+    async def test_tool_use_reuses_anthropic_translation(self):
+        adapter = BedrockAdapter(_bedrock_connector())
+        tool = ToolSpec(name="pick", description="pick a song", input_schema={"type": "object"})
+        client = _AsyncClient(_ok(_anthropic_tool_body("pick", {"q": "house"})))
+        with patch(_HTTPX_PATH, return_value=client):
+            resp = await adapter.chat(
+                ChatRequest(
+                    messages=[Message(role="user", content="hi")],
+                    tools=[tool],
+                    force_tool="pick",
+                )
+            )
+        assert resp.stop_reason == "tool_use"
+        assert resp.tool_calls[0].name == "pick"
+        assert resp.tool_calls[0].input == {"q": "house"}
+        body = json.loads(client.calls[0]["content"])
+        assert body["tools"][0]["name"] == "pick"
+        assert body["tool_choice"] == {"type": "tool", "name": "pick"}
+
+
+# ---------------------------------------------------------------------------
+# Bedrock Llama (meta.*)
+# ---------------------------------------------------------------------------
+class TestBedrockLlama:
+    @pytest.mark.asyncio
+    async def test_happy_path_prompt_body(self):
+        adapter = BedrockAdapter(_bedrock_connector("meta.llama3-70b-instruct-v1:0"))
+        client = _AsyncClient(_ok(_llama_body("hello there")))
+        with patch(_HTTPX_PATH, return_value=client):
+            resp = await adapter.chat(ChatRequest(messages=[Message(role="user", content="hi")]))
+        assert resp.text == "hello there"
+        assert resp.stop_reason == "end_turn"
+        assert resp.usage.prompt == 7
+        assert resp.usage.completion == 4
+        assert resp.model == "meta.llama3-70b-instruct-v1:0"
+        body = json.loads(client.calls[0]["content"])
+        # Llama uses a prompt string, not anthropic messages.
+        assert "prompt" in body
+        assert "anthropic_version" not in body
+        assert "<|begin_of_text|>" in body["prompt"]
+
+    @pytest.mark.asyncio
+    async def test_length_stop_reason_maps_to_max_tokens(self):
+        adapter = BedrockAdapter(_bedrock_connector("meta.llama3-70b-instruct-v1:0"))
+        client = _AsyncClient(_ok(_llama_body("partial", stop_reason="length")))
+        with patch(_HTTPX_PATH, return_value=client):
+            resp = await adapter.chat(ChatRequest(messages=[Message(role="user", content="hi")]))
+        assert resp.stop_reason == "max_tokens"
+
+    @pytest.mark.asyncio
+    async def test_tool_call_parsed_from_generation_json(self):
+        adapter = BedrockAdapter(_bedrock_connector("meta.llama3-1-70b-instruct-v1:0"))
+        tool = ToolSpec(name="pick", description="pick", input_schema={"type": "object"})
+        generation = '{"name": "pick", "input": {"q": "techno"}}'
+        client = _AsyncClient(_ok(_llama_body(generation)))
+        with patch(_HTTPX_PATH, return_value=client):
+            resp = await adapter.chat(
+                ChatRequest(
+                    messages=[Message(role="user", content="hi")],
+                    tools=[tool],
+                    force_tool="pick",
+                )
+            )
+        assert resp.stop_reason == "tool_use"
+        assert resp.tool_calls[0].name == "pick"
+        assert resp.tool_calls[0].input == {"q": "techno"}
+        # Tool instructions are embedded in the prompt for Llama.
+        body = json.loads(client.calls[0]["content"])
+        assert "pick" in body["prompt"]
+
+    @pytest.mark.asyncio
+    async def test_unknown_tool_name_in_generation_is_plain_text(self):
+        adapter = BedrockAdapter(_bedrock_connector("meta.llama3-70b-instruct-v1:0"))
+        tool = ToolSpec(name="pick", description="pick", input_schema={"type": "object"})
+        generation = '{"name": "other", "input": {}}'
+        client = _AsyncClient(_ok(_llama_body(generation)))
+        with patch(_HTTPX_PATH, return_value=client):
+            resp = await adapter.chat(
+                ChatRequest(messages=[Message(role="user", content="hi")], tools=[tool])
+            )
+        assert resp.tool_calls == []
+        assert resp.text == generation
+
+
+# ---------------------------------------------------------------------------
+# Error mapping (shared) — exercised via the Claude family
+# ---------------------------------------------------------------------------
+class TestBedrockErrorMapping:
+    @pytest.mark.parametrize(
+        ("response", "expected"),
+        [
+            (_err(401), AuthInvalid),
+            (_err(403), AuthInvalid),
+            # 400 + ThrottlingException error-type header → treated as rate limiting.
+            (_err(400, {"x-amzn-errortype": "ThrottlingException"}), RateLimited),
+            (_err(402), QuotaExceeded),
+            (_err(503), ProviderUnavailable),
+            (httpx.TimeoutException("timeout"), ProviderUnavailable),
+            # 400 without a throttle header → malformed input.
+            (_err(400), ToolTranslationError),
+        ],
+    )
+    @pytest.mark.asyncio
+    async def test_status_maps_to_exception(self, response, expected):
+        adapter = BedrockAdapter(_bedrock_connector())
+        client = _AsyncClient(response)
+        with patch(_HTTPX_PATH, return_value=client):
+            with pytest.raises(expected):
+                await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+
+    @pytest.mark.asyncio
+    async def test_429_maps_to_rate_limited_with_retry_after(self):
+        adapter = BedrockAdapter(_bedrock_connector())
+        client = _AsyncClient(_err(429, headers={"Retry-After": "12"}))
+        with patch(_HTTPX_PATH, return_value=client):
+            with pytest.raises(RateLimited) as info:
+                await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+        assert info.value.retry_after_seconds == 12
+
+
+# ---------------------------------------------------------------------------
+# Credential extraction
+# ---------------------------------------------------------------------------
+class TestBedrockCredentials:
+    @pytest.mark.asyncio
+    async def test_malformed_credentials_raise_auth_invalid(self):
+        connector = SimpleNamespace(
+            connector_type="bedrock",
+            credentials="not json",
+            model_hint=None,
+            base_url_plain=None,
+        )
+        adapter = BedrockAdapter(connector)
+        with pytest.raises(AuthInvalid):
+            await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+
+    @pytest.mark.asyncio
+    async def test_missing_field_raises_auth_invalid(self):
+        connector = SimpleNamespace(
+            connector_type="bedrock",
+            credentials=json.dumps(
+                {
+                    "aws_access_key_id": "AKID",
+                    "aws_secret_access_key": "secret",
+                    "aws_region": "us-east-1",
+                    # missing aws_model_id
+                }
+            ),
+            model_hint=None,
+            base_url_plain=None,
+        )
+        adapter = BedrockAdapter(connector)
+        with pytest.raises(AuthInvalid):
+            await adapter.chat(ChatRequest(messages=[Message(role="user", content="x")]))
+
+    @pytest.mark.asyncio
+    async def test_health_check_pings(self):
+        adapter = BedrockAdapter(_bedrock_connector())
+        client = _AsyncClient(_ok(_anthropic_body("ok")))
+        with patch(_HTTPX_PATH, return_value=client):
+            await adapter.health_check()
+        assert len(client.calls) == 1
diff --git a/server/tests/test_llm_call_log_retention.py b/server/tests/test_llm_call_log_retention.py
new file mode 100644
index 00000000..5413b4e3
--- /dev/null
+++ b/server/tests/test_llm_call_log_retention.py
@@ -0,0 +1,150 @@
+"""Tests for configurable llm_call_log retention (issue #342).
+
+Covers:
+- The purge helper deletes only rows older than the supplied window.
+- The daily cleanup job reads the retention window from system settings each
+  run (no hardcoded constant), so an admin change takes effect on the next pass.
+"""
+
+from __future__ import annotations
+
+import json
+from datetime import timedelta
+
+import pytest
+from sqlalchemy.orm import Session
+
+from app.core.time import utcnow
+from app.models.llm_connector import LlmCallLog, LlmConnector
+from app.services.llm.connector_storage import purge_call_log_older_than
+from app.services.system_settings import update_system_settings
+
+
+def _make_connector(db: Session, user_id: int) -> LlmConnector:
+    row = LlmConnector(
+        user_id=user_id,
+        connector_type="openai_apikey",
+        display_name="Mine",
+        status="active",
+        credentials=json.dumps({"api_key": "sk-x"}),
+    )
+    db.add(row)
+    db.commit()
+    db.refresh(row)
+    return row
+
+
+def _seed_call_log(db: Session, connector_id: int, *, age_days: int) -> LlmCallLog:
+    # Set created_at explicitly at construction so the backdated timestamp wins
+    # over the column's server_default.
+    row = LlmCallLog(
+        connector_id=connector_id,
+        purpose="recommendation",
+        status="ok",
+        latency_ms=100,
+        tokens_in=10,
+        tokens_out=5,
+        created_at=utcnow() - timedelta(days=age_days),
+    )
+    db.add(row)
+    db.commit()
+    db.refresh(row)
+    return row
+
+
+class TestPurgeHelper:
+    def test_deletes_only_older_than_window(self, db: Session, test_user):
+        connector = _make_connector(db, test_user.id)
+        old = _seed_call_log(db, connector.id, age_days=40)
+        recent = _seed_call_log(db, connector.id, age_days=5)
+        # Capture ids before the bulk delete — accessing attributes on a deleted
+        # ORM instance afterwards would trigger a reload error.
+        old_id, recent_id = old.id, recent.id
+
+        deleted = purge_call_log_older_than(db, retention_days=30)
+        db.commit()
+
+        assert deleted == 1
+        ids = {r.id for r in db.query(LlmCallLog.id).all()}
+        assert recent_id in ids
+        assert old_id not in ids
+
+    def test_no_rows_to_delete_returns_zero(self, db: Session, test_user):
+        connector = _make_connector(db, test_user.id)
+        _seed_call_log(db, connector.id, age_days=5)
+
+        deleted = purge_call_log_older_than(db, retention_days=30)
+        db.commit()
+
+        assert deleted == 0
+        assert db.query(LlmCallLog).count() == 1
+
+    def test_rejects_out_of_bounds_window_without_deleting(self, db: Session, test_user):
+        # A corrupt/tampered persisted value outside the 7-365 contract must fail
+        # closed: raise before deleting, never push the cutoff to now/future and
+        # wipe history. The daily cleanup loop catches this and retries next pass.
+        connector = _make_connector(db, test_user.id)
+        _seed_call_log(db, connector.id, age_days=5)
+
+        for bad in (0, -1, 6, 366, 100000):
+            with pytest.raises(ValueError):
+                purge_call_log_older_than(db, retention_days=bad)
+            db.rollback()
+
+        assert db.query(LlmCallLog).count() == 1
+
+    def test_boundary_row_at_exactly_window_kept(self, db: Session, test_user):
+        # A row aged just under the window must be kept; just over must go.
+        connector = _make_connector(db, test_user.id)
+        just_under = _seed_call_log(db, connector.id, age_days=29)
+        just_over = _seed_call_log(db, connector.id, age_days=31)
+        under_id, over_id = just_under.id, just_over.id
+
+        purge_call_log_older_than(db, retention_days=30)
+        db.commit()
+
+        ids = {r.id for r in db.query(LlmCallLog.id).all()}
+        assert under_id in ids
+        assert over_id not in ids
+
+
+class TestCleanupReadsSettings:
+    """The daily cleanup job must read the retention window from settings each
+    run, not from a hardcoded constant."""
+
+    def test_cleanup_honors_admin_changed_window(self, db: Session, test_user, monkeypatch):
+        connector = _make_connector(db, test_user.id)
+        # A row aged 20 days survives the default 30-day window but should be
+        # purged once the admin shortens retention to 7 days.
+        _seed_call_log(db, connector.id, age_days=20)
+
+        # Admin shortens retention.
+        update_system_settings(db, llm_call_log_retention_days=7)
+
+        # The cleanup job opens its own session via `from app.db.session import
+        # SessionLocal`; point that factory at the test session so the in-memory
+        # SQLite state is shared.
+        import app.main as main_module
+
+        monkeypatch.setattr("app.db.session.SessionLocal", lambda: db, raising=False)
+
+        # Prevent the job's db.close() from tearing down the shared test session.
+        monkeypatch.setattr(db, "close", lambda: None)
+
+        main_module._run_llm_call_log_cleanup()
+
+        assert db.query(LlmCallLog).count() == 0
+
+    def test_cleanup_keeps_rows_within_window(self, db: Session, test_user, monkeypatch):
+        connector = _make_connector(db, test_user.id)
+        _seed_call_log(db, connector.id, age_days=20)
+
+        # Default window (30) keeps the 20-day-old row.
+        import app.main as main_module
+
+        monkeypatch.setattr("app.db.session.SessionLocal", lambda: db, raising=False)
+        monkeypatch.setattr(db, "close", lambda: None)
+
+        main_module._run_llm_call_log_cleanup()
+
+        assert db.query(LlmCallLog).count() == 1
diff --git a/server/tests/test_llm_client.py b/server/tests/test_llm_client.py
index 0165b45f..1b55431a 100644
--- a/server/tests/test_llm_client.py
+++ b/server/tests/test_llm_client.py
@@ -4,6 +4,7 @@
 
 import pytest
 
+from app.services.llm.base import ChatResponse, ToolCall
 from app.services.recommendation.llm_client import (
     SEARCH_QUERIES_TOOL,
     SYSTEM_PROMPT,
@@ -155,79 +156,176 @@ def test_mixed_content_blocks(self):
         assert "Here are my suggestions" in result.raw_response
 
 
-class TestCallLLM:
+class TestParseToolResponseMalformedPayloads:
+    """Defensive parsing — a malformed provider payload must not crash the flow.
+
+    Custom OpenAI-compatible endpoints (Ollama, vLLM) may not enforce the forced
+    tool JSON schema. Regression for the CodeRabbit "harden tool payload parsing"
+    finding on PR #362: bad items are skipped, valid ones still parse.
+    """
+
+    def _tool_block(self, tool_input):
+        block = MagicMock()
+        block.type = "tool_use"
+        block.name = "search_queries"
+        block.input = tool_input
+        return block
+
+    def test_input_not_a_dict_is_skipped(self):
+        response = MagicMock()
+        response.content = [self._tool_block(["not", "a", "dict"])]
+        result = _parse_tool_response(response)
+        assert result.queries == []
+
+    def test_queries_not_a_list_is_skipped(self):
+        response = MagicMock()
+        response.content = [self._tool_block({"queries": "oops"})]
+        result = _parse_tool_response(response)
+        assert result.queries == []
+
+    def test_non_dict_query_item_is_skipped(self):
+        response = MagicMock()
+        response.content = [
+            self._tool_block(
+                {
+                    "queries": [
+                        "garbage",
+                        {"search_query": "valid query", "reasoning": "ok"},
+                    ]
+                }
+            )
+        ]
+        result = _parse_tool_response(response)
+        assert len(result.queries) == 1
+        assert result.queries[0].search_query == "valid query"
+
+    def test_missing_or_blank_search_query_is_skipped(self):
+        response = MagicMock()
+        response.content = [
+            self._tool_block(
+                {
+                    "queries": [
+                        {"reasoning": "no search_query key"},
+                        {"search_query": "", "reasoning": "blank"},
+                        {"search_query": "   ", "reasoning": "whitespace"},
+                        {"search_query": 123, "reasoning": "not a string"},
+                        {"search_query": "keep me", "reasoning": "good"},
+                    ]
+                }
+            )
+        ]
+        result = _parse_tool_response(response)
+        assert len(result.queries) == 1
+        assert result.queries[0].search_query == "keep me"
+
+    def test_non_string_reasoning_coerced_to_empty(self):
+        response = MagicMock()
+        response.content = [
+            self._tool_block(
+                {"queries": [{"search_query": "valid", "reasoning": {"unexpected": "dict"}}]}
+            )
+        ]
+        result = _parse_tool_response(response)
+        assert len(result.queries) == 1
+        assert result.queries[0].reasoning == ""
+
     @pytest.mark.asyncio
-    @patch("app.services.recommendation.llm_client.AsyncAnthropic")
-    @patch("app.services.recommendation.llm_client.get_settings")
-    async def test_calls_api_correctly(self, mock_settings, mock_anthropic_cls):
-        settings = MagicMock()
-        settings.anthropic_api_key = "sk-ant-test-key"
-        settings.anthropic_model = "claude-haiku-4-5-20251001"
-        settings.anthropic_max_tokens = 1024
-        settings.anthropic_timeout_seconds = 15
-        mock_settings.return_value = settings
-
-        # Mock API response
-        tool_block = MagicMock()
-        tool_block.type = "tool_use"
-        tool_block.name = "search_queries"
-        tool_block.input = {
-            "queries": [{"search_query": "chill house", "reasoning": "DJ wants chill vibes"}]
-        }
-        mock_response = MagicMock()
-        mock_response.content = [tool_block]
+    @patch("app.services.recommendation.llm_client.Gateway")
+    async def test_chatresponse_path_skips_malformed_items(self, mock_gateway):
+        response = ChatResponse(
+            tool_calls=[
+                ToolCall(
+                    id="t1",
+                    name="search_queries",
+                    input={
+                        "queries": [
+                            "garbage",
+                            {"search_query": "good one", "reasoning": "ok"},
+                            {"reasoning": "missing search_query"},
+                        ]
+                    },
+                )
+            ],
+            stop_reason="tool_use",
+        )
+        mock_gateway.dispatch = AsyncMock(return_value=response)
+        result = await call_llm(
+            EventProfile(track_count=0), "test", db=MagicMock(), actor=MagicMock()
+        )
+        assert len(result.queries) == 1
+        assert result.queries[0].search_query == "good one"
 
-        mock_client = MagicMock()
-        mock_client.messages.create = AsyncMock(return_value=mock_response)
-        mock_anthropic_cls.return_value = mock_client
 
-        profile = EventProfile(
-            avg_bpm=120.0,
-            dominant_genres=["House"],
-            track_count=5,
+class TestCallLLM:
+    """``call_llm`` always routes through the LLM Gateway.
+
+    The legacy direct-Anthropic env-var fallback was removed in #343 — every
+    production caller supplies ``db`` + ``actor`` and the connector system is
+    the sole source of credentials. These tests patch ``Gateway.dispatch``.
+    """
+
+    @pytest.mark.asyncio
+    @patch("app.services.recommendation.llm_client.Gateway")
+    async def test_dispatches_via_gateway(self, mock_gateway):
+        response = ChatResponse(
+            tool_calls=[
+                ToolCall(
+                    id="t1",
+                    name="search_queries",
+                    input={
+                        "queries": [
+                            {"search_query": "chill house", "reasoning": "DJ wants chill vibes"}
+                        ]
+                    },
+                )
+            ],
+            stop_reason="tool_use",
+            model="claude-haiku-4-5-20251001",
         )
+        mock_gateway.dispatch = AsyncMock(return_value=response)
+
+        db = MagicMock()
+        actor = MagicMock()
+        profile = EventProfile(avg_bpm=120.0, dominant_genres=["House"], track_count=5)
 
-        result = await call_llm(profile, "chill vibes")
+        result = await call_llm(profile, "chill vibes", db=db, actor=actor)
 
         assert len(result.queries) == 1
         assert result.queries[0].search_query == "chill house"
-
-        # Verify API call parameters
-        mock_client.messages.create.assert_called_once()
-        call_kwargs = mock_client.messages.create.call_args[1]
-        assert call_kwargs["model"] == "claude-haiku-4-5-20251001"
-        assert call_kwargs["max_tokens"] == 1024
-        assert call_kwargs["tool_choice"] == {"type": "tool", "name": "search_queries"}
+        assert result.model == "claude-haiku-4-5-20251001"
+
+        mock_gateway.dispatch.assert_awaited_once()
+        # Positional args: (db, actor, chat_request); keyword: purpose.
+        args, kwargs = mock_gateway.dispatch.call_args
+        assert args[0] is db
+        assert args[1] is actor
+        chat_request = args[2]
+        assert chat_request.force_tool == "search_queries"
+        assert chat_request.max_tokens == 1024
+        assert kwargs["purpose"] == "recommendation"
 
     @pytest.mark.asyncio
-    @patch("app.services.recommendation.llm_client.AsyncAnthropic")
-    @patch("app.services.recommendation.llm_client.get_settings")
-    async def test_trims_to_max_queries(self, mock_settings, mock_anthropic_cls):
-        settings = MagicMock()
-        settings.anthropic_api_key = "sk-ant-test-key"
-        settings.anthropic_model = "claude-haiku-4-5-20251001"
-        settings.anthropic_max_tokens = 1024
-        settings.anthropic_timeout_seconds = 15
-        mock_settings.return_value = settings
-
-        # Return 5 queries, request max 2
-        tool_block = MagicMock()
-        tool_block.type = "tool_use"
-        tool_block.name = "search_queries"
-        tool_block.input = {
-            "queries": [
-                {"search_query": f"query {i}", "reasoning": f"reason {i}"} for i in range(5)
-            ]
-        }
-        mock_response = MagicMock()
-        mock_response.content = [tool_block]
-
-        mock_client = MagicMock()
-        mock_client.messages.create = AsyncMock(return_value=mock_response)
-        mock_anthropic_cls.return_value = mock_client
+    @patch("app.services.recommendation.llm_client.Gateway")
+    async def test_trims_to_max_queries(self, mock_gateway):
+        response = ChatResponse(
+            tool_calls=[
+                ToolCall(
+                    id="t1",
+                    name="search_queries",
+                    input={
+                        "queries": [
+                            {"search_query": f"query {i}", "reasoning": f"reason {i}"}
+                            for i in range(5)
+                        ]
+                    },
+                )
+            ],
+            stop_reason="tool_use",
+        )
+        mock_gateway.dispatch = AsyncMock(return_value=response)
 
         profile = EventProfile(track_count=0)
-        result = await call_llm(profile, "test", max_queries=2)
+        result = await call_llm(profile, "test", max_queries=2, db=MagicMock(), actor=MagicMock())
 
         assert len(result.queries) == 2
         assert result.queries[0].search_query == "query 0"
diff --git a/server/tests/test_llm_default_connector.py b/server/tests/test_llm_default_connector.py
new file mode 100644
index 00000000..44b788a4
--- /dev/null
+++ b/server/tests/test_llm_default_connector.py
@@ -0,0 +1,538 @@
+"""Tests for per-DJ explicit default connector (issue #336).
+
+Covers:
+- Gateway resolution prefers the pinned default over MRU.
+- Falls through to MRU when no default is set.
+- Falls through to MRU when the pinned default is no longer active.
+- API endpoints: POST /default sets and atomically clears siblings.
+- API endpoints: DELETE /default clears the flag.
+- Ownership scoping: 404 for other DJ's connectors.
+- Audit events written for set / unset.
+- Setting an inactive connector as default is rejected with 400.
+"""
+
+from __future__ import annotations
+
+import json
+from unittest.mock import AsyncMock, patch
+
+import pytest
+from fastapi.testclient import TestClient
+from sqlalchemy.orm import Session
+
+from app.models.llm_connector import LlmAuditEvent, LlmConnector
+from app.models.user import User
+from app.services.auth import get_password_hash
+from app.services.llm.base import ChatRequest, ChatResponse, Message, TokenUsage
+from app.services.llm.exceptions import NoLlmConfigured
+from app.services.llm.gateway import Gateway
+
+
+# ---------- helpers ----------
+def _login(client: TestClient, username: str, password: str) -> dict[str, str]:
+    resp = client.post("/api/auth/login", data={"username": username, "password": password})
+    assert resp.status_code == 200, resp.json()
+    return {"Authorization": f"Bearer {resp.json()['access_token']}"}
+
+
+def _make_connector(
+    db: Session,
+    user: User,
+    *,
+    display_name: str = "Test connector",
+    status: str = "active",
+    is_default: bool = False,
+) -> LlmConnector:
+    row = LlmConnector(
+        user_id=user.id,
+        connector_type="openai_apikey",
+        display_name=display_name,
+        status=status,
+        credentials=json.dumps({"api_key": "sk-fake-key"}),
+        model_hint="gpt-5-mini",
+        is_default=is_default,
+    )
+    db.add(row)
+    db.commit()
+    db.refresh(row)
+    return row
+
+
+@pytest.fixture
+def dj_user(db) -> User:
+    user = User(
+        username="djdefault",
+        password_hash=get_password_hash("password123"),
+        role="dj",
+    )
+    db.add(user)
+    db.commit()
+    db.refresh(user)
+    return user
+
+
+@pytest.fixture
+def other_dj(db) -> User:
+    user = User(
+        username="otherdjdefault",
+        password_hash=get_password_hash("password123"),
+        role="dj",
+    )
+    db.add(user)
+    db.commit()
+    db.refresh(user)
+    return user
+
+
+# ---------- gateway resolver behavior ----------
+class TestGatewayResolverPrefersDefault:
+    @pytest.mark.asyncio
+    async def test_default_picked_over_mru(self, db, dj_user):
+        """An explicit default beats the MRU heuristic even when MRU is more recent."""
+        from datetime import timedelta
+
+        from app.core.time import utcnow
+
+        # Pinned default — older last_used_at to prove the pin wins.
+        pinned = _make_connector(db, dj_user, display_name="pinned", is_default=True)
+        pinned.last_used_at = utcnow() - timedelta(hours=1)
+        # MRU candidate — more recent activity but not pinned.
+        mru = _make_connector(db, dj_user, display_name="mru-but-not-default")
+        mru.last_used_at = utcnow()
+        db.commit()
+
+        fake = ChatResponse(text="ok", tool_calls=[], stop_reason="end_turn", usage=None)
+        with patch.object(
+            __import__(
+                "app.services.llm.adapters.openai_apikey",
+                fromlist=["OpenAIApiKeyAdapter"],
+            ).OpenAIApiKeyAdapter,
+            "chat",
+            new=AsyncMock(return_value=fake),
+        ):
+            await Gateway.dispatch(
+                db,
+                dj_user,
+                ChatRequest(messages=[Message(role="user", content="hi")]),
+                purpose="test",
+            )
+
+        # The pinned row got its last_used_at bumped — the MRU sibling didn't.
+        db.refresh(pinned)
+        db.refresh(mru)
+        prior_mru_ts = mru.last_used_at
+        assert pinned.last_used_at is not None
+        # The MRU row's timestamp should be older than pinned's (i.e. the pin
+        # was used, not the MRU). We compare via prior_mru_ts which was set
+        # before dispatch — pinned was dispatched so its ts > prior_mru_ts.
+        assert pinned.last_used_at >= prior_mru_ts
+
+    @pytest.mark.asyncio
+    async def test_default_skipped_when_inactive_falls_back_to_mru(self, db, dj_user):
+        """A disabled / auth_invalid default doesn't block MRU resolution."""
+        # Pinned but auth_invalid — gateway must skip it.
+        _make_connector(
+            db, dj_user, display_name="pinned-broken", is_default=True, status="auth_invalid"
+        )
+        mru = _make_connector(db, dj_user, display_name="mru-active")
+
+        fake = ChatResponse(
+            text="from-mru",
+            tool_calls=[],
+            stop_reason="end_turn",
+            usage=TokenUsage(prompt=1, completion=1),
+        )
+        with patch.object(
+            __import__(
+                "app.services.llm.adapters.openai_apikey",
+                fromlist=["OpenAIApiKeyAdapter"],
+            ).OpenAIApiKeyAdapter,
+            "chat",
+            new=AsyncMock(return_value=fake),
+        ):
+            resp = await Gateway.dispatch(
+                db,
+                dj_user,
+                ChatRequest(messages=[Message(role="user", content="hi")]),
+                purpose="test",
+            )
+
+        assert resp.text == "from-mru"
+        db.refresh(mru)
+        assert mru.last_used_at is not None
+
+    @pytest.mark.asyncio
+    async def test_no_default_uses_mru_unchanged(self, db, dj_user):
+        """Existing MRU semantics still apply when no default is pinned."""
+        from datetime import timedelta
+
+        from app.core.time import utcnow
+
+        older = _make_connector(db, dj_user, display_name="older")
+        newer = _make_connector(db, dj_user, display_name="newer")
+        older.last_used_at = utcnow() - timedelta(hours=1)
+        newer.last_used_at = utcnow()
+        db.commit()
+
+        fake = ChatResponse(text="ok", tool_calls=[], stop_reason="end_turn", usage=None)
+        with patch.object(
+            __import__(
+                "app.services.llm.adapters.openai_apikey",
+                fromlist=["OpenAIApiKeyAdapter"],
+            ).OpenAIApiKeyAdapter,
+            "chat",
+            new=AsyncMock(return_value=fake),
+        ):
+            await Gateway.dispatch(
+                db,
+                dj_user,
+                ChatRequest(messages=[Message(role="user", content="hi")]),
+                purpose="test",
+            )
+
+        db.refresh(newer)
+        db.refresh(older)
+        # newer has the bumped ts because MRU picked it.
+        assert newer.last_used_at is not None
+        assert newer.last_used_at >= older.last_used_at
+
+    @pytest.mark.asyncio
+    async def test_all_inactive_raises_no_llm_configured(self, db, dj_user):
+        """Pinned-but-broken + no other active = NoLlmConfigured."""
+        _make_connector(
+            db, dj_user, display_name="pinned-broken", is_default=True, status="disabled"
+        )
+        with pytest.raises(NoLlmConfigured):
+            await Gateway.dispatch(
+                db,
+                dj_user,
+                ChatRequest(messages=[Message(role="user", content="hi")]),
+                purpose="test",
+            )
+
+
+# ---------- POST /default ----------
+class TestSetDefault:
+    def test_set_default_marks_row(self, client: TestClient, auth_headers, db, test_user):
+        row = _make_connector(db, test_user, display_name="A")
+
+        resp = client.post(f"/api/llm/connectors/{row.id}/default", headers=auth_headers)
+        assert resp.status_code == 200, resp.json()
+        assert resp.json()["is_default"] is True
+
+        db.refresh(row)
+        assert row.is_default is True
+
+    def test_set_default_clears_other_defaults_for_same_user(
+        self, client: TestClient, auth_headers, db, test_user
+    ):
+        a = _make_connector(db, test_user, display_name="A", is_default=True)
+        b = _make_connector(db, test_user, display_name="B")
+
+        resp = client.post(f"/api/llm/connectors/{b.id}/default", headers=auth_headers)
+        assert resp.status_code == 200
+
+        db.refresh(a)
+        db.refresh(b)
+        assert a.is_default is False
+        assert b.is_default is True
+
+    def test_set_default_does_not_touch_other_dj(
+        self, client: TestClient, auth_headers, db, test_user, other_dj
+    ):
+        their_default = _make_connector(db, other_dj, display_name="theirs", is_default=True)
+        mine = _make_connector(db, test_user, display_name="mine")
+
+        client.post(f"/api/llm/connectors/{mine.id}/default", headers=auth_headers)
+
+        db.refresh(their_default)
+        assert their_default.is_default is True  # Untouched
+
+    def test_set_default_404_for_other_users_connector(
+        self, client: TestClient, auth_headers, db, other_dj
+    ):
+        theirs = _make_connector(db, other_dj, display_name="not yours")
+
+        resp = client.post(f"/api/llm/connectors/{theirs.id}/default", headers=auth_headers)
+        assert resp.status_code == 404
+
+        # The other DJ's connector wasn't flipped.
+        db.refresh(theirs)
+        assert theirs.is_default is False
+
+    def test_set_default_404_for_unknown_id(self, client: TestClient, auth_headers):
+        resp = client.post("/api/llm/connectors/999999/default", headers=auth_headers)
+        assert resp.status_code == 404
+
+    def test_set_default_rejects_inactive_connector(
+        self, client: TestClient, auth_headers, db, test_user
+    ):
+        row = _make_connector(db, test_user, display_name="broken", status="auth_invalid")
+        resp = client.post(f"/api/llm/connectors/{row.id}/default", headers=auth_headers)
+        assert resp.status_code == 400
+
+        db.refresh(row)
+        assert row.is_default is False
+
+    def test_set_default_writes_audit_event(self, client: TestClient, auth_headers, db, test_user):
+        row = _make_connector(db, test_user, display_name="A")
+        client.post(f"/api/llm/connectors/{row.id}/default", headers=auth_headers)
+
+        audit = (
+            db.query(LlmAuditEvent)
+            .filter(
+                LlmAuditEvent.target_connector_id == row.id,
+                LlmAuditEvent.event_type == "connector_default_set",
+            )
+            .one_or_none()
+        )
+        assert audit is not None
+        assert audit.actor_user_id == test_user.id
+
+    def test_set_default_requires_auth(self, client: TestClient, db, test_user):
+        row = _make_connector(db, test_user, display_name="A")
+        resp = client.post(f"/api/llm/connectors/{row.id}/default")
+        assert resp.status_code == 401
+
+    def test_set_default_persists_across_list_calls(
+        self, client: TestClient, auth_headers, db, test_user
+    ):
+        """Acceptance criterion: setting a default sticks across sessions."""
+        row = _make_connector(db, test_user, display_name="sticks")
+        client.post(f"/api/llm/connectors/{row.id}/default", headers=auth_headers)
+
+        # Simulate a fresh page load: list connectors.
+        listed = client.get("/api/llm/connectors", headers=auth_headers).json()
+        match = next(c for c in listed if c["id"] == row.id)
+        assert match["is_default"] is True
+
+
+# ---------- DELETE /default ----------
+class TestUnsetDefault:
+    def test_unset_default_clears_flag(self, client: TestClient, auth_headers, db, test_user):
+        row = _make_connector(db, test_user, display_name="A", is_default=True)
+        resp = client.delete(f"/api/llm/connectors/{row.id}/default", headers=auth_headers)
+        assert resp.status_code == 200, resp.json()
+        assert resp.json()["is_default"] is False
+
+        db.refresh(row)
+        assert row.is_default is False
+
+    def test_unset_default_is_noop_when_not_default(
+        self, client: TestClient, auth_headers, db, test_user
+    ):
+        row = _make_connector(db, test_user, display_name="A", is_default=False)
+        resp = client.delete(f"/api/llm/connectors/{row.id}/default", headers=auth_headers)
+        # Successful no-op — no error, no audit row.
+        assert resp.status_code == 200
+        assert resp.json()["is_default"] is False
+        assert (
+            db.query(LlmAuditEvent)
+            .filter(LlmAuditEvent.event_type == "connector_default_unset")
+            .count()
+            == 0
+        )
+
+    def test_unset_default_writes_audit_event(
+        self, client: TestClient, auth_headers, db, test_user
+    ):
+        row = _make_connector(db, test_user, display_name="A", is_default=True)
+        client.delete(f"/api/llm/connectors/{row.id}/default", headers=auth_headers)
+
+        audit = (
+            db.query(LlmAuditEvent)
+            .filter(
+                LlmAuditEvent.target_connector_id == row.id,
+                LlmAuditEvent.event_type == "connector_default_unset",
+            )
+            .one_or_none()
+        )
+        assert audit is not None
+        assert audit.actor_user_id == test_user.id
+
+    def test_unset_default_404_for_other_users_connector(
+        self, client: TestClient, auth_headers, db, other_dj
+    ):
+        theirs = _make_connector(db, other_dj, display_name="not yours", is_default=True)
+        resp = client.delete(f"/api/llm/connectors/{theirs.id}/default", headers=auth_headers)
+        assert resp.status_code == 404
+        db.refresh(theirs)
+        assert theirs.is_default is True
+
+    def test_unset_falls_back_to_mru_on_next_dispatch(
+        self, client: TestClient, auth_headers, db, test_user
+    ):
+        """Acceptance criterion: unsetting falls back to MRU."""
+        from datetime import timedelta
+
+        from app.core.time import utcnow
+
+        pinned = _make_connector(db, test_user, display_name="pinned", is_default=True)
+        pinned.last_used_at = utcnow() - timedelta(hours=2)
+        mru = _make_connector(db, test_user, display_name="mru-recent")
+        mru.last_used_at = utcnow()
+        db.commit()
+
+        client.delete(f"/api/llm/connectors/{pinned.id}/default", headers=auth_headers)
+        db.refresh(pinned)
+        assert pinned.is_default is False
+
+        # After unsetting, gateway picks the MRU.
+        import asyncio
+
+        fake = ChatResponse(text="mru-served", tool_calls=[], stop_reason="end_turn", usage=None)
+        with patch.object(
+            __import__(
+                "app.services.llm.adapters.openai_apikey",
+                fromlist=["OpenAIApiKeyAdapter"],
+            ).OpenAIApiKeyAdapter,
+            "chat",
+            new=AsyncMock(return_value=fake),
+        ):
+            resp = asyncio.run(
+                Gateway.dispatch(
+                    db,
+                    test_user,
+                    ChatRequest(messages=[Message(role="user", content="hi")]),
+                    purpose="test",
+                )
+            )
+
+        assert resp.text == "mru-served"
+        db.refresh(mru)
+        # MRU got the bump; pinned did not because it wasn't chosen this time.
+        assert mru.last_used_at is not None
+
+
+# ---------- ConnectorOut surfaces is_default ----------
+class TestListSurfacesIsDefault:
+    def test_list_exposes_is_default_flag(self, client: TestClient, auth_headers, db, test_user):
+        _make_connector(db, test_user, display_name="A", is_default=True)
+        _make_connector(db, test_user, display_name="B")
+
+        rows = client.get("/api/llm/connectors", headers=auth_headers).json()
+        by_name = {r["display_name"]: r for r in rows}
+        assert by_name["A"]["is_default"] is True
+        assert by_name["B"]["is_default"] is False
+
+
+# ---------- service layer invariants ----------
+class TestServiceLayer:
+    def test_set_default_for_user_clears_siblings(self, db, dj_user):
+        from app.services.llm.connector_storage import set_default_for_user
+
+        a = _make_connector(db, dj_user, display_name="A", is_default=True)
+        b = _make_connector(db, dj_user, display_name="B")
+
+        set_default_for_user(db, connector=b)
+        db.commit()
+
+        db.refresh(a)
+        db.refresh(b)
+        assert a.is_default is False
+        assert b.is_default is True
+
+    def test_set_default_idempotent_when_already_default(self, db, dj_user):
+        """Calling set on a row that's already default is a quiet no-op."""
+        from app.services.llm.connector_storage import set_default_for_user
+
+        a = _make_connector(db, dj_user, display_name="A", is_default=True)
+        result = set_default_for_user(db, connector=a)
+        db.commit()
+
+        assert result.id == a.id
+        db.refresh(a)
+        assert a.is_default is True
+
+    def test_unset_default_clears_flag(self, db, dj_user):
+        from app.services.llm.connector_storage import unset_default_for_user
+
+        a = _make_connector(db, dj_user, display_name="A", is_default=True)
+        unset_default_for_user(db, connector=a)
+        db.commit()
+        db.refresh(a)
+        assert a.is_default is False
+
+
+def _load_migration_049():
+    """Import the 049 migration module by file path so the backfill helper is
+    callable from tests (alembic versions/ has no ``__init__.py``).
+    """
+    import importlib.util
+    from pathlib import Path
+
+    path = (
+        Path(__file__).resolve().parent.parent
+        / "alembic"
+        / "versions"
+        / "049_llm_connector_is_default.py"
+    )
+    spec = importlib.util.spec_from_file_location("_migration_049", path)
+    assert spec is not None and spec.loader is not None
+    module = importlib.util.module_from_spec(spec)
+    spec.loader.exec_module(module)
+    return module
+
+
+class TestMigrationBackfill:
+    """Smoke-test the migration's backfill helper against an in-memory DB.
+
+    The helper picks the MRU active connector per user. The migration runs
+    against a bind connection, so we exercise it the same way here. Skipped
+    users (no active connector, or already has a default) must be untouched.
+    """
+
+    def test_backfill_marks_mru_for_each_user(self, db, dj_user, other_dj):
+        from datetime import timedelta
+
+        from app.core.time import utcnow
+
+        migration = _load_migration_049()
+
+        # User A: two active connectors, neither default. MRU = newer.
+        older_a = _make_connector(db, dj_user, display_name="A-older")
+        newer_a = _make_connector(db, dj_user, display_name="A-newer")
+        older_a.last_used_at = utcnow() - timedelta(hours=2)
+        newer_a.last_used_at = utcnow()
+
+        # User B: one active connector with no last_used_at — gets defaulted.
+        only_b = _make_connector(db, other_dj, display_name="B-only")
+        only_b.last_used_at = None
+
+        db.commit()
+
+        migration._backfill_mru_defaults(db.connection())
+        db.commit()
+
+        db.refresh(older_a)
+        db.refresh(newer_a)
+        db.refresh(only_b)
+        assert newer_a.is_default is True
+        assert older_a.is_default is False
+        assert only_b.is_default is True
+
+    def test_backfill_skips_users_with_existing_default(self, db, dj_user):
+        migration = _load_migration_049()
+
+        already = _make_connector(db, dj_user, display_name="already", is_default=True)
+        also = _make_connector(db, dj_user, display_name="also")
+
+        migration._backfill_mru_defaults(db.connection())
+        db.commit()
+
+        db.refresh(already)
+        db.refresh(also)
+        assert already.is_default is True
+        assert also.is_default is False  # Untouched
+
+    def test_backfill_skips_inactive_only(self, db, dj_user):
+        migration = _load_migration_049()
+
+        broken = _make_connector(db, dj_user, display_name="only-broken", status="auth_invalid")
+
+        migration._backfill_mru_defaults(db.connection())
+        db.commit()
+
+        db.refresh(broken)
+        # No active connector → user is skipped, no default created.
+        assert broken.is_default is False
diff --git a/server/tests/test_llm_feature_preference.py b/server/tests/test_llm_feature_preference.py
new file mode 100644
index 00000000..6122ecb6
--- /dev/null
+++ b/server/tests/test_llm_feature_preference.py
@@ -0,0 +1,361 @@
+"""Tests for per-feature connector preference (issue #337)."""
+
+from __future__ import annotations
+
+import json
+from unittest.mock import patch
+
+import pytest
+from sqlalchemy.exc import IntegrityError
+
+from app.models.llm_connector import LlmConnector
+from app.models.llm_feature_preference import KNOWN_FEATURES, LlmFeaturePreference
+from app.models.user import User
+from app.services.auth import get_password_hash
+from app.services.llm.adapters.openai_apikey import OpenAIApiKeyAdapter
+from app.services.llm.base import ChatRequest, ChatResponse, Message, TokenUsage
+from app.services.llm.gateway import Gateway
+
+
+@pytest.fixture
+def dj_user(db) -> User:
+    user = User(
+        username="prefdj",
+        password_hash=get_password_hash("password123"),
+        role="dj",
+    )
+    db.add(user)
+    db.commit()
+    db.refresh(user)
+    return user
+
+
+def _make_connector(db, user, *, display_name="Pref connector", status="active"):
+    row = LlmConnector(
+        user_id=user.id,
+        connector_type="openai_apikey",
+        display_name=display_name,
+        status=status,
+        credentials=json.dumps({"api_key": "sk-fake-key"}),
+        model_hint="gpt-5-mini",
+    )
+    db.add(row)
+    db.commit()
+    db.refresh(row)
+    return row
+
+
+def test_known_features_contains_recommendation_and_set_builder():
+    assert "recommendation" in KNOWN_FEATURES
+    assert "set_builder" in KNOWN_FEATURES
+
+
+def test_unique_constraint_one_pref_per_user_feature(db, dj_user):
+    c1 = _make_connector(db, dj_user, display_name="A")
+    c2 = _make_connector(db, dj_user, display_name="B")
+    db.add(LlmFeaturePreference(user_id=dj_user.id, feature="recommendation", connector_id=c1.id))
+    db.commit()
+    db.add(LlmFeaturePreference(user_id=dj_user.id, feature="recommendation", connector_id=c2.id))
+    with pytest.raises(IntegrityError):
+        db.commit()
+    db.rollback()
+
+
+def test_set_feature_preference_upserts(db, dj_user):
+    from app.services.llm.connector_storage import (
+        get_feature_preferences_for_user,
+        set_feature_preference,
+    )
+
+    c1 = _make_connector(db, dj_user, display_name="A")
+    c2 = _make_connector(db, dj_user, display_name="B")
+
+    set_feature_preference(db, user_id=dj_user.id, feature="recommendation", connector_id=c1.id)
+    db.commit()
+    prefs = get_feature_preferences_for_user(db, dj_user.id)
+    assert {p.feature: p.connector_id for p in prefs} == {"recommendation": c1.id}
+
+    # Re-set the same feature → replace, not duplicate.
+    set_feature_preference(db, user_id=dj_user.id, feature="recommendation", connector_id=c2.id)
+    db.commit()
+    prefs = get_feature_preferences_for_user(db, dj_user.id)
+    assert {p.feature: p.connector_id for p in prefs} == {"recommendation": c2.id}
+
+
+def test_set_feature_preference_is_conflict_safe_upsert(db, dj_user):
+    """Regression: a re-pin must not trip the UNIQUE constraint (CodeRabbit PR #378).
+
+    ``set_feature_preference`` is a DB-native ``ON CONFLICT DO UPDATE`` upsert,
+    so re-pinning an already-pinned (user, feature) — the case a concurrent
+    second request would hit — resolves to last-writer-wins in one atomic
+    statement instead of raising ``IntegrityError`` (which previously bubbled a
+    500). It must leave exactly one row and return the re-pinned connector.
+    """
+    from app.services.llm.connector_storage import (
+        get_feature_preferences_for_user,
+        set_feature_preference,
+    )
+
+    c1 = _make_connector(db, dj_user, display_name="first")
+    c2 = _make_connector(db, dj_user, display_name="second")
+
+    # A row already exists for (dj_user, "recommendation") — exactly the state a
+    # concurrent winner would have committed before the loser's upsert lands.
+    db.add(LlmFeaturePreference(user_id=dj_user.id, feature="recommendation", connector_id=c1.id))
+    db.commit()
+
+    result = set_feature_preference(
+        db, user_id=dj_user.id, feature="recommendation", connector_id=c2.id
+    )
+    db.commit()
+
+    # Last writer wins, and there is still exactly one row for the pair.
+    assert result.connector_id == c2.id
+    prefs = get_feature_preferences_for_user(db, dj_user.id)
+    assert {p.feature: p.connector_id for p in prefs} == {"recommendation": c2.id}
+
+
+def test_clear_feature_preference_removes_row(db, dj_user):
+    from app.services.llm.connector_storage import (
+        clear_feature_preference,
+        get_feature_preferences_for_user,
+        set_feature_preference,
+    )
+
+    c1 = _make_connector(db, dj_user, display_name="A")
+    set_feature_preference(db, user_id=dj_user.id, feature="recommendation", connector_id=c1.id)
+    db.commit()
+
+    removed = clear_feature_preference(db, user_id=dj_user.id, feature="recommendation")
+    db.commit()
+    assert removed is True
+    assert get_feature_preferences_for_user(db, dj_user.id) == []
+
+    # Clearing a non-existent preference is a no-op (returns False).
+    assert clear_feature_preference(db, user_id=dj_user.id, feature="recommendation") is False
+
+
+# ---------- gateway resolution ----------
+def _ok_response() -> ChatResponse:
+    return ChatResponse(
+        text="ok",
+        tool_calls=[],
+        stop_reason="end_turn",
+        usage=TokenUsage(prompt=1, completion=1),
+    )
+
+
+@pytest.mark.asyncio
+async def test_gateway_prefers_feature_pin_over_default(db, dj_user):
+    from app.services.llm.connector_storage import set_default_for_user, set_feature_preference
+
+    pinned = _make_connector(db, dj_user, display_name="pinned")
+    other = _make_connector(db, dj_user, display_name="default")
+    set_default_for_user(db, connector=other)  # per-DJ default points elsewhere
+    set_feature_preference(db, user_id=dj_user.id, feature="recommendation", connector_id=pinned.id)
+    db.commit()
+
+    captured = {}
+
+    async def fake_chat(self, request):  # noqa: ANN001
+        captured["connector_id"] = self.connector.id
+        return _ok_response()
+
+    with patch.object(OpenAIApiKeyAdapter, "chat", new=fake_chat):
+        await Gateway.dispatch(
+            db,
+            dj_user,
+            ChatRequest(messages=[Message(role="user", content="hi")]),
+            purpose="recommendation",
+        )
+    assert captured["connector_id"] == pinned.id
+
+
+@pytest.mark.asyncio
+async def test_gateway_falls_back_when_pinned_connector_auth_invalid(db, dj_user):
+    from app.services.llm.connector_storage import set_default_for_user, set_feature_preference
+
+    pinned = _make_connector(db, dj_user, display_name="pinned", status="auth_invalid")
+    fallback = _make_connector(db, dj_user, display_name="fallback")
+    set_default_for_user(db, connector=fallback)
+    set_feature_preference(db, user_id=dj_user.id, feature="recommendation", connector_id=pinned.id)
+    db.commit()
+
+    captured = {}
+
+    async def fake_chat(self, request):  # noqa: ANN001
+        captured["connector_id"] = self.connector.id
+        return _ok_response()
+
+    with patch.object(OpenAIApiKeyAdapter, "chat", new=fake_chat):
+        await Gateway.dispatch(
+            db,
+            dj_user,
+            ChatRequest(messages=[Message(role="user", content="hi")]),
+            purpose="recommendation",
+        )
+    # Skips the auth_invalid pin, falls through to the per-DJ default.
+    assert captured["connector_id"] == fallback.id
+
+
+@pytest.mark.asyncio
+async def test_gateway_falls_back_when_pinned_connector_deleted(db, dj_user):
+    """A pin whose connector was deleted is skipped (graceful fallback)."""
+    from app.services.llm.connector_storage import set_default_for_user, set_feature_preference
+
+    pinned = _make_connector(db, dj_user, display_name="pinned")
+    fallback = _make_connector(db, dj_user, display_name="fallback")
+    set_default_for_user(db, connector=fallback)
+    set_feature_preference(db, user_id=dj_user.id, feature="recommendation", connector_id=pinned.id)
+    db.commit()
+
+    # Delete the pinned connector directly (simulating a stale FK target). The
+    # ON DELETE CASCADE removes the preference row too, so this exercises the
+    # "pref row gone" path; the status-flip test above covers "pref points at
+    # an inactive connector".
+    db.delete(pinned)
+    db.commit()
+
+    captured = {}
+
+    async def fake_chat(self, request):  # noqa: ANN001
+        captured["connector_id"] = self.connector.id
+        return _ok_response()
+
+    with patch.object(OpenAIApiKeyAdapter, "chat", new=fake_chat):
+        await Gateway.dispatch(
+            db,
+            dj_user,
+            ChatRequest(messages=[Message(role="user", content="hi")]),
+            purpose="recommendation",
+        )
+    assert captured["connector_id"] == fallback.id
+
+
+@pytest.mark.asyncio
+async def test_gateway_ignores_pin_for_unknown_feature(db, dj_user):
+    """A pin set for one feature must not leak into another purpose."""
+    from app.services.llm.connector_storage import set_feature_preference
+
+    pinned = _make_connector(db, dj_user, display_name="pinned")
+    mru = _make_connector(db, dj_user, display_name="mru")
+    set_feature_preference(db, user_id=dj_user.id, feature="recommendation", connector_id=pinned.id)
+    db.commit()
+
+    captured = {}
+
+    async def fake_chat(self, request):  # noqa: ANN001
+        captured["connector_id"] = self.connector.id
+        return _ok_response()
+
+    with patch.object(OpenAIApiKeyAdapter, "chat", new=fake_chat):
+        await Gateway.dispatch(
+            db,
+            dj_user,
+            ChatRequest(messages=[Message(role="user", content="hi")]),
+            purpose="set_builder",
+        )
+    # No pin for set_builder → MRU resolution (most recently created here is `mru`).
+    assert captured["connector_id"] == mru.id
+
+
+# ---------- API endpoints ----------
+def test_set_list_clear_feature_preference_endpoints(client, db, test_user, auth_headers):
+    c = _make_connector(db, test_user, display_name="Endpoint connector")
+
+    # Set
+    resp = client.post(
+        "/api/llm/feature-preferences",
+        json={"feature": "recommendation", "connector_id": c.id},
+        headers=auth_headers,
+    )
+    assert resp.status_code == 200, resp.json()
+    body = resp.json()
+    assert {p["feature"]: p["connector_id"] for p in body["preferences"]} == {
+        "recommendation": c.id
+    }
+    assert "set_builder" in body["known_features"]
+
+    # List
+    resp = client.get("/api/llm/feature-preferences", headers=auth_headers)
+    assert resp.status_code == 200
+    assert resp.json()["preferences"][0]["connector_id"] == c.id
+
+    # Change (re-pin same feature to a second connector → replace, not duplicate)
+    c2 = _make_connector(db, test_user, display_name="Second connector")
+    resp = client.post(
+        "/api/llm/feature-preferences",
+        json={"feature": "recommendation", "connector_id": c2.id},
+        headers=auth_headers,
+    )
+    assert resp.status_code == 200
+    assert {p["feature"]: p["connector_id"] for p in resp.json()["preferences"]} == {
+        "recommendation": c2.id
+    }
+
+    # Clear
+    resp = client.delete("/api/llm/feature-preferences/recommendation", headers=auth_headers)
+    assert resp.status_code == 200
+    assert resp.json()["preferences"] == []
+
+
+def test_set_feature_preference_rejects_unknown_feature(client, db, test_user, auth_headers):
+    c = _make_connector(db, test_user, display_name="X")
+    resp = client.post(
+        "/api/llm/feature-preferences",
+        json={"feature": "totally_made_up", "connector_id": c.id},
+        headers=auth_headers,
+    )
+    assert resp.status_code == 422  # Pydantic Literal rejects it
+
+
+def test_set_feature_preference_rejects_other_djs_connector(client, db, test_user, auth_headers):
+    # Another DJ owns this connector.
+    other = User(username="otherdj", password_hash=get_password_hash("password123"), role="dj")
+    db.add(other)
+    db.commit()
+    db.refresh(other)
+    foreign = _make_connector(db, other, display_name="Not yours")
+
+    resp = client.post(
+        "/api/llm/feature-preferences",
+        json={"feature": "recommendation", "connector_id": foreign.id},
+        headers=auth_headers,
+    )
+    assert resp.status_code == 404  # ownership not leaked
+
+
+def test_set_feature_preference_rejects_inactive_connector(client, db, test_user, auth_headers):
+    c = _make_connector(db, test_user, display_name="Broken", status="auth_invalid")
+    resp = client.post(
+        "/api/llm/feature-preferences",
+        json={"feature": "recommendation", "connector_id": c.id},
+        headers=auth_headers,
+    )
+    assert resp.status_code == 400
+
+
+def test_clear_unknown_feature_returns_422(client, auth_headers):
+    resp = client.delete("/api/llm/feature-preferences/bogus", headers=auth_headers)
+    assert resp.status_code == 422
+
+
+def test_feature_preference_requires_auth(client, db, test_user):
+    c = _make_connector(db, test_user, display_name="Y")
+    # No auth headers → 401.
+    resp = client.post(
+        "/api/llm/feature-preferences",
+        json={"feature": "recommendation", "connector_id": c.id},
+    )
+    assert resp.status_code == 401
+
+
+# ---------- consistency guard ----------
+def test_feature_key_literal_matches_known_features():
+    """FeatureKey (the OpenAPI enum) must stay in sync with KNOWN_FEATURES."""
+    import typing
+
+    from app.schemas.llm import FeatureKey
+
+    literal_values = set(typing.get_args(FeatureKey))
+    assert literal_values == set(KNOWN_FEATURES)
diff --git a/server/tests/test_llm_gateway.py b/server/tests/test_llm_gateway.py
index 38f17f4e..b35de609 100644
--- a/server/tests/test_llm_gateway.py
+++ b/server/tests/test_llm_gateway.py
@@ -1,77 +1,475 @@
-"""Tests for the provider-agnostic LLM gateway stub (Phase 0).
+"""Tests for the LLM gateway dispatch + connector resolution."""
 
-The gateway is the single surface WrzDJSet codes against. Phase 0 ships an
-interface + a temporary delegating implementation. These tests pin the
-interface shape and the normalization contract, NOT the live LLM.
-"""
+from __future__ import annotations
 
-import ast
-from pathlib import Path
+import json
+from unittest.mock import AsyncMock, patch
 
 import pytest
 
-from app.services.llm import gateway
+from app.models.llm_connector import LlmConnector
+from app.models.system_settings import SystemSettings
+from app.models.user import User
+from app.services.auth import get_password_hash
+from app.services.llm.adapters.openai_apikey import OpenAIApiKeyAdapter
+from app.services.llm.base import ChatRequest, ChatResponse, Message, TokenUsage
+from app.services.llm.exceptions import (
+    AuthInvalid,
+    NoLlmConfigured,
+    ProviderUnavailable,
+    RateLimited,
+)
+from app.services.llm.gateway import Gateway
 
 
-def test_gateway_response_shape():
-    resp = gateway.GatewayResponse(tool_calls=[{"name": "x", "input": {}}], text="hi")
-    assert resp.tool_calls == [{"name": "x", "input": {}}]
-    assert resp.text == "hi"
+def _patch_chat(mock):
+    """Patch the (only) adapter the gateway dispatches to in these tests."""
+    return patch.object(OpenAIApiKeyAdapter, "chat", new=mock)
 
 
-def test_gateway_response_defaults():
-    resp = gateway.GatewayResponse()
-    assert resp.tool_calls == []
-    assert resp.text == ""
+@pytest.fixture
+def dj_user(db) -> User:
+    user = User(
+        username="djuser",
+        password_hash=get_password_hash("password123"),
+        role="dj",
+    )
+    db.add(user)
+    db.commit()
+    db.refresh(user)
+    return user
+
+
+@pytest.fixture
+def admin_user_actor(db) -> User:
+    user = User(
+        username="adminactor",
+        password_hash=get_password_hash("password123"),
+        role="admin",
+    )
+    db.add(user)
+    db.commit()
+    db.refresh(user)
+    return user
+
+
+def _make_connector(
+    db,
+    user: User,
+    *,
+    connector_type: str = "openai_apikey",
+    display_name: str = "Test connector",
+    status: str = "active",
+    model_hint: str = "gpt-5-mini",
+) -> LlmConnector:
+    row = LlmConnector(
+        user_id=user.id,
+        connector_type=connector_type,
+        display_name=display_name,
+        status=status,
+        credentials=json.dumps({"api_key": "sk-fake-key"}),
+        model_hint=model_hint,
+    )
+    db.add(row)
+    db.commit()
+    db.refresh(row)
+    return row
+
+
+@pytest.fixture
+def gateway_request() -> ChatRequest:
+    return ChatRequest(messages=[Message(role="user", content="hi")])
+
+
+@pytest.mark.asyncio
+async def test_no_actor_no_default_raises(db, gateway_request):
+    with pytest.raises(NoLlmConfigured):
+        await Gateway.dispatch(db, None, gateway_request, purpose="test")
+
+
+@pytest.mark.asyncio
+async def test_actor_with_active_connector_dispatches(db, dj_user, gateway_request):
+    connector = _make_connector(db, dj_user)
+
+    fake_response = ChatResponse(
+        text="ok",
+        tool_calls=[],
+        stop_reason="end_turn",
+        usage=TokenUsage(prompt=5, completion=2),
+    )
+
+    with _patch_chat(AsyncMock(return_value=fake_response)):
+        resp = await Gateway.dispatch(db, dj_user, gateway_request, purpose="test")
+
+    assert resp.text == "ok"
+    db.refresh(connector)
+    assert connector.last_used_at is not None
+    # call log row was inserted
+    from app.models.llm_connector import LlmCallLog
+
+    log = db.query(LlmCallLog).filter(LlmCallLog.connector_id == connector.id).one()
+    assert log.status == "ok"
+    assert log.tokens_in == 5
+    assert log.tokens_out == 2
+
+
+@pytest.mark.asyncio
+async def test_auth_invalid_marks_connector(db, dj_user, gateway_request):
+    connector = _make_connector(db, dj_user)
+    with _patch_chat(AsyncMock(side_effect=AuthInvalid("nope"))):
+        with pytest.raises(AuthInvalid):
+            await Gateway.dispatch(db, dj_user, gateway_request, purpose="test")
+
+    db.refresh(connector)
+    assert connector.status == "auth_invalid"
+
+    from app.models.llm_connector import LlmAuditEvent, LlmCallLog
+
+    log = db.query(LlmCallLog).one()
+    assert log.status == "auth_invalid"
+
+    audit = db.query(LlmAuditEvent).one()
+    assert audit.event_type == "auth_invalid_observed"
+    assert audit.target_connector_id == connector.id
+
+
+@pytest.mark.asyncio
+async def test_rate_limited_logs_and_raises(db, dj_user, gateway_request):
+    _make_connector(db, dj_user)
+    with _patch_chat(AsyncMock(side_effect=RateLimited("slow", retry_after_seconds=12))):
+        with pytest.raises(RateLimited) as exc_info:
+            await Gateway.dispatch(db, dj_user, gateway_request, purpose="test")
+    assert exc_info.value.retry_after_seconds == 12
+
+    from app.models.llm_connector import LlmCallLog
+
+    log = db.query(LlmCallLog).one()
+    assert log.status == "rate_limited"
+
+
+@pytest.mark.asyncio
+async def test_provider_unavailable_logs_and_raises(db, dj_user, gateway_request):
+    _make_connector(db, dj_user)
+    with _patch_chat(AsyncMock(side_effect=ProviderUnavailable("nope"))):
+        with pytest.raises(ProviderUnavailable):
+            await Gateway.dispatch(db, dj_user, gateway_request, purpose="test")
+
+    from app.models.llm_connector import LlmCallLog
+
+    log = db.query(LlmCallLog).one()
+    assert log.status == "provider_unavailable"
+
+
+@pytest.mark.asyncio
+async def test_disabled_connector_skipped_in_resolution(db, dj_user, gateway_request):
+    # Disabled connector should NOT be returned by the resolver — no default → raise.
+    _make_connector(db, dj_user, status="disabled", display_name="Disabled")
+    with pytest.raises(NoLlmConfigured):
+        await Gateway.dispatch(db, dj_user, gateway_request, purpose="test")
+
+
+@pytest.mark.asyncio
+async def test_falls_back_to_system_default(db, admin_user_actor, gateway_request):
+    # admin has no connector of their own — falls back to system default.
+    other_admin = User(
+        username="otheradmin",
+        password_hash=get_password_hash("password123"),
+        role="admin",
+    )
+    db.add(other_admin)
+    db.commit()
+    db.refresh(other_admin)
+    default_connector = _make_connector(db, other_admin, display_name="default-org-connector")
+
+    # Wire the system default
+    ss = db.query(SystemSettings).first()
+    if ss is None:
+        ss = SystemSettings(id=1, llm_default_connector_id=default_connector.id)
+        db.add(ss)
+    else:
+        ss.llm_default_connector_id = default_connector.id
+    db.commit()
+
+    fake_response = ChatResponse(
+        text="ok",
+        tool_calls=[],
+        stop_reason="end_turn",
+        usage=TokenUsage(prompt=1, completion=1),
+    )
+
+    with _patch_chat(AsyncMock(return_value=fake_response)):
+        resp = await Gateway.dispatch(db, None, gateway_request, purpose="test")
+
+    assert resp.text == "ok"
+
+
+def _wire_system_default(db, connector: LlmConnector) -> None:
+    ss = db.query(SystemSettings).first()
+    if ss is None:
+        ss = SystemSettings(id=1, llm_default_connector_id=connector.id)
+        db.add(ss)
+    else:
+        ss.llm_default_connector_id = connector.id
+    db.commit()
+
+
+def _make_org_default(db, username: str) -> LlmConnector:
+    """Create an admin-owned org connector and wire it as the system default."""
+    owner = User(
+        username=username,
+        password_hash=get_password_hash("password123"),
+        role="admin",
+    )
+    db.add(owner)
+    db.commit()
+    db.refresh(owner)
+    connector = _make_connector(db, owner, display_name="org-default")
+    _wire_system_default(db, connector)
+    return connector
+
+
+@pytest.mark.asyncio
+async def test_fallback_org_default_on_rate_limit(db, dj_user):
+    """429 on DJ connector → falls back to org default → audit event written."""
+    from app.models.llm_connector import LlmAuditEvent
+
+    _make_connector(db, dj_user, display_name="dj-primary")
 
+    org_connector = _make_org_default(db, "orgowner")
 
-def test_model_hint_literal_values_documented():
-    # The two documented hints from the exec summary.
-    assert gateway.MODEL_HINTS == ("fast", "strong")
+    fallback_response = ChatResponse(
+        text="from-fallback",
+        tool_calls=[],
+        stop_reason="end_turn",
+        usage=TokenUsage(prompt=3, completion=4),
+    )
+
+    # First call (DJ connector) → 429; second call (org default) → success.
+    chat_mock = AsyncMock(
+        side_effect=[RateLimited("slow", retry_after_seconds=5), fallback_response]
+    )
+    with _patch_chat(chat_mock):
+        req = ChatRequest(
+            messages=[Message(role="user", content="hi")],
+            fallback_policy="org_default",
+        )
+        resp = await Gateway.dispatch(db, dj_user, req, purpose="test")
+
+    assert resp.text == "from-fallback"
+    assert chat_mock.await_count == 2
+
+    # A fallback_triggered audit event referencing the fallback connector + trigger.
+    audit = (
+        db.query(LlmAuditEvent).filter(LlmAuditEvent.event_type.like("fallback_triggered%")).one()
+    )
+    assert audit.event_type == "fallback_triggered:rate_limited"
+    assert audit.target_connector_id == org_connector.id
+    assert audit.actor_user_id == dj_user.id
+
+
+@pytest.mark.asyncio
+async def test_fallback_none_surfaces_original_error(db, dj_user):
+    """fallback_policy='none' (default) surfaces the original error, no fallback."""
+    from app.models.llm_connector import LlmAuditEvent
+
+    _make_connector(db, dj_user, display_name="dj-primary")
+
+    _make_org_default(db, "orgowner2")
+
+    chat_mock = AsyncMock(side_effect=RateLimited("slow", retry_after_seconds=5))
+    with _patch_chat(chat_mock):
+        req = ChatRequest(
+            messages=[Message(role="user", content="hi")],
+            fallback_policy="none",
+        )
+        with pytest.raises(RateLimited):
+            await Gateway.dispatch(db, dj_user, req, purpose="test")
+
+    # Only one attempt — no fallback.
+    assert chat_mock.await_count == 1
+    assert (
+        db.query(LlmAuditEvent).filter(LlmAuditEvent.event_type.like("fallback_triggered%")).count()
+        == 0
+    )
+
+
+@pytest.mark.asyncio
+async def test_fallback_org_default_when_no_default_reraises(db, dj_user):
+    """org_default policy with no org default configured → original error surfaces."""
+    _make_connector(db, dj_user, display_name="dj-primary")
+
+    chat_mock = AsyncMock(side_effect=ProviderUnavailable("down"))
+    with _patch_chat(chat_mock):
+        req = ChatRequest(
+            messages=[Message(role="user", content="hi")],
+            fallback_policy="org_default",
+        )
+        with pytest.raises(ProviderUnavailable):
+            await Gateway.dispatch(db, dj_user, req, purpose="test")
+
+    assert chat_mock.await_count == 1
+
+
+@pytest.mark.asyncio
+async def test_fallback_skipped_when_primary_is_org_default(db, dj_user):
+    """If the failing connector IS the org default, there is nothing to fall back to."""
+    dj_connector = _make_connector(db, dj_user, display_name="dj-and-org-default")
+    _wire_system_default(db, dj_connector)
+
+    chat_mock = AsyncMock(side_effect=RateLimited("slow"))
+    with _patch_chat(chat_mock):
+        req = ChatRequest(
+            messages=[Message(role="user", content="hi")],
+            fallback_policy="org_default",
+        )
+        with pytest.raises(RateLimited):
+            await Gateway.dispatch(db, dj_user, req, purpose="test")
+
+    assert chat_mock.await_count == 1
+
+
+@pytest.mark.asyncio
+async def test_retry_then_org_default_retries_same_then_falls_back(db, dj_user):
+    """retry_then_org_default: same connector retried once, then org default."""
+    _make_connector(db, dj_user, display_name="dj-primary")
+
+    _make_org_default(db, "orgowner3")
+
+    ok = ChatResponse(text="recovered", tool_calls=[], stop_reason="end_turn", usage=None)
+    # attempt 1 (primary) 429, attempt 2 (primary retry) 429, attempt 3 (org default) ok
+    chat_mock = AsyncMock(side_effect=[RateLimited("slow"), RateLimited("slow"), ok])
+    with _patch_chat(chat_mock):
+        req = ChatRequest(
+            messages=[Message(role="user", content="hi")],
+            fallback_policy="retry_then_org_default",
+        )
+        resp = await Gateway.dispatch(db, dj_user, req, purpose="test")
+
+    assert resp.text == "recovered"
+    # Bounded: exactly 3 attempts (1 primary + 1 retry + 1 fallback). Never loops.
+    assert chat_mock.await_count == 3
 
 
 @pytest.mark.asyncio
-async def test_dispatch_normalizes_delegated_response(monkeypatch):
-    """dispatch() returns a GatewayResponse normalized from the provider call."""
+async def test_retry_then_org_default_succeeds_on_retry(db, dj_user):
+    """retry_then_org_default: same-connector retry succeeds → no fallback needed."""
+    _make_connector(db, dj_user, display_name="dj-primary")
+
+    ok = ChatResponse(text="retry-ok", tool_calls=[], stop_reason="end_turn", usage=None)
+    chat_mock = AsyncMock(side_effect=[ProviderUnavailable("blip"), ok])
+    with _patch_chat(chat_mock):
+        req = ChatRequest(
+            messages=[Message(role="user", content="hi")],
+            fallback_policy="retry_then_org_default",
+        )
+        resp = await Gateway.dispatch(db, dj_user, req, purpose="test")
+
+    assert resp.text == "retry-ok"
+    assert chat_mock.await_count == 2
+
 
-    class _FakeBlock:
-        def __init__(self, type, **kw):
-            self.type = type
-            for k, v in kw.items():
-                setattr(self, k, v)
+@pytest.mark.asyncio
+async def test_fallback_not_triggered_for_auth_invalid_when_policy_org_default(db, dj_user):
+    """auth_invalid is fallback-eligible: marks primary invalid, falls back."""
+    from app.models.llm_connector import LlmAuditEvent
 
-    class _FakeResponse:
-        content = [
-            _FakeBlock("text", text="thinking"),
-            _FakeBlock("tool_use", name="critique_set", input={"grade": "A"}),
-        ]
+    dj_connector = _make_connector(db, dj_user, display_name="dj-primary")
 
-    async def _fake_raw_call(*, model, system, tools, tool_choice, messages, max_tokens):
-        # Assert the gateway passed a concrete model string (data, not import).
-        assert isinstance(model, str) and model
-        return _FakeResponse()
+    org_connector = _make_org_default(db, "orgowner4")
 
-    monkeypatch.setattr(gateway, "_raw_provider_call", _fake_raw_call)
+    ok = ChatResponse(text="recovered", tool_calls=[], stop_reason="end_turn", usage=None)
+    chat_mock = AsyncMock(side_effect=[AuthInvalid("expired"), ok])
+    with _patch_chat(chat_mock):
+        req = ChatRequest(
+            messages=[Message(role="user", content="hi")],
+            fallback_policy="org_default",
+        )
+        resp = await Gateway.dispatch(db, dj_user, req, purpose="test")
 
-    result = await gateway.dispatch(
-        messages=[{"role": "user", "content": "grade this set"}],
-        tool={"name": "critique_set", "input_schema": {"type": "object"}},
-        model_hint="strong",
+    assert resp.text == "recovered"
+    # Primary connector marked auth_invalid; fallback audit + the auth_invalid audit both present.
+    db.refresh(dj_connector)
+    assert dj_connector.status == "auth_invalid"
+    fallback_audit = (
+        db.query(LlmAuditEvent)
+        .filter(LlmAuditEvent.event_type == "fallback_triggered:auth_invalid")
+        .one()
     )
-    assert isinstance(result, gateway.GatewayResponse)
-    assert result.text == "thinking"
-    assert result.tool_calls == [{"name": "critique_set", "input": {"grade": "A"}}]
-
-
-def test_no_provider_sdk_import_in_gateway_module():
-    """gateway.py must not import a provider SDK directly (anthropic/openai/etc.)."""
-    src = Path(gateway.__file__).read_text()
-    tree = ast.parse(src)
-    banned = {"anthropic", "openai", "google", "cohere", "mistralai", "litellm"}
-    for node in ast.walk(tree):
-        if isinstance(node, ast.Import):
-            for alias in node.names:
-                assert alias.name.split(".")[0] not in banned
-        elif isinstance(node, ast.ImportFrom):
-            root = (node.module or "").split(".")[0]
-            assert root not in banned
+    assert fallback_audit.target_connector_id == org_connector.id
+
+
+@pytest.mark.asyncio
+async def test_fallback_not_eligible_for_tool_translation_error(db, dj_user):
+    """ToolTranslationError is NOT fallback-eligible — a different connector won't help."""
+    from app.services.llm.exceptions import ToolTranslationError
+
+    _make_connector(db, dj_user, display_name="dj-primary")
+
+    _make_org_default(db, "orgowner5")
+
+    chat_mock = AsyncMock(side_effect=ToolTranslationError("bad schema"))
+    with _patch_chat(chat_mock):
+        req = ChatRequest(
+            messages=[Message(role="user", content="hi")],
+            fallback_policy="retry_then_org_default",
+        )
+        with pytest.raises(ToolTranslationError):
+            await Gateway.dispatch(db, dj_user, req, purpose="test")
+
+    assert chat_mock.await_count == 1
+
+
+@pytest.mark.asyncio
+async def test_fallback_failure_surfaces_fallback_error(db, dj_user):
+    """If the fallback connector also fails, the fallback's error surfaces."""
+    _make_connector(db, dj_user, display_name="dj-primary")
+
+    _make_org_default(db, "orgowner6")
+
+    chat_mock = AsyncMock(
+        side_effect=[RateLimited("primary-slow"), ProviderUnavailable("fallback-down")]
+    )
+    with _patch_chat(chat_mock):
+        req = ChatRequest(
+            messages=[Message(role="user", content="hi")],
+            fallback_policy="org_default",
+        )
+        with pytest.raises(ProviderUnavailable):
+            await Gateway.dispatch(db, dj_user, req, purpose="test")
+
+    # primary + fallback, bounded.
+    assert chat_mock.await_count == 2
+
+
+@pytest.mark.asyncio
+async def test_mru_resolution_picks_recent(db, dj_user, gateway_request):
+    """Resolver picks the connector with the most recent last_used_at."""
+    from app.core.time import utcnow
+
+    older = _make_connector(db, dj_user, display_name="older")
+    newer = _make_connector(db, dj_user, display_name="newer")
+
+    older.last_used_at = None
+    from datetime import timedelta
+
+    newer.last_used_at = utcnow() - timedelta(seconds=10)
+    db.commit()
+
+    fake_response = ChatResponse(
+        text="ok",
+        tool_calls=[],
+        stop_reason="end_turn",
+        usage=None,
+    )
+
+    chat_mock = AsyncMock(return_value=fake_response)
+    with _patch_chat(chat_mock):
+        await Gateway.dispatch(db, dj_user, gateway_request, purpose="test")
+
+    chat_mock.assert_awaited_once()
+    # Make sure the newer one was chosen
+    db.refresh(newer)
+    db.refresh(older)
+    assert newer.last_used_at is not None
+    # older.last_used_at was never set so should still be None
+    assert older.last_used_at is None
diff --git a/server/tests/test_llm_gateway_stream.py b/server/tests/test_llm_gateway_stream.py
new file mode 100644
index 00000000..0b203d12
--- /dev/null
+++ b/server/tests/test_llm_gateway_stream.py
@@ -0,0 +1,164 @@
+"""Tests for Gateway.stream — resolution mirrors dispatch, counts-only logging."""
+
+from __future__ import annotations
+
+import json
+
+import pytest
+
+from app.models.llm_connector import LlmCallLog, LlmConnector
+from app.models.user import User
+from app.services.auth import get_password_hash
+from app.services.llm.adapters.openai_apikey import OpenAIApiKeyAdapter
+from app.services.llm.base import ChatRequest, ChatResponseChunk, Message, TokenUsage
+from app.services.llm.exceptions import (
+    AuthInvalid,
+    NoLlmConfigured,
+    ProviderUnavailable,
+)
+from app.services.llm.gateway import Gateway
+
+
+@pytest.fixture
+def dj_user(db) -> User:
+    user = User(
+        username="streamdj",
+        password_hash=get_password_hash("password123"),
+        role="dj",
+    )
+    db.add(user)
+    db.commit()
+    db.refresh(user)
+    return user
+
+
+def _make_connector(db, user, **kw) -> LlmConnector:
+    row = LlmConnector(
+        user_id=user.id,
+        connector_type=kw.get("connector_type", "openai_apikey"),
+        display_name=kw.get("display_name", "Test"),
+        status=kw.get("status", "active"),
+        credentials=json.dumps({"api_key": "sk-fake"}),
+        model_hint="gpt-5-mini",
+    )
+    db.add(row)
+    db.commit()
+    db.refresh(row)
+    return row
+
+
+def _fake_stream(chunks):
+    async def _gen(self, request):
+        for c in chunks:
+            yield c
+
+    return _gen
+
+
+async def test_stream_no_actor_no_default_raises(db):
+    req = ChatRequest(messages=[Message(role="user", content="hi")])
+    with pytest.raises(NoLlmConfigured):
+        async for _ in Gateway.stream(db, None, req, purpose="test"):
+            pass
+
+
+async def test_stream_dispatches_and_logs_counts_only(db, dj_user, monkeypatch):
+    connector = _make_connector(db, dj_user)
+    chunks = [
+        ChatResponseChunk(text_delta="Hel"),
+        ChatResponseChunk(text_delta="lo"),
+        ChatResponseChunk(
+            stop_reason="end_turn",
+            usage=TokenUsage(prompt=4, completion=2),
+            done=True,
+        ),
+    ]
+    monkeypatch.setattr(OpenAIApiKeyAdapter, "stream", _fake_stream(chunks))
+
+    req = ChatRequest(messages=[Message(role="user", content="hi")])
+    out = [c async for c in Gateway.stream(db, dj_user, req, purpose="recommendation")]
+    assert "".join(c.text_delta for c in out) == "Hello"
+
+    log = db.query(LlmCallLog).filter(LlmCallLog.connector_id == connector.id).one()
+    assert log.status == "ok"
+    assert log.purpose == "recommendation"
+    assert log.tokens_in == 4
+    assert log.tokens_out == 2
+    db.refresh(connector)
+    assert connector.last_used_at is not None
+
+
+async def test_stream_error_logs_provider_unavailable(db, dj_user, monkeypatch):
+    connector = _make_connector(db, dj_user)
+
+    async def _boom(self, request):
+        raise ProviderUnavailable("down")
+        yield  # pragma: no cover
+
+    monkeypatch.setattr(OpenAIApiKeyAdapter, "stream", _boom)
+
+    req = ChatRequest(messages=[Message(role="user", content="hi")])
+    with pytest.raises(ProviderUnavailable):
+        async for _ in Gateway.stream(db, dj_user, req, purpose="test"):
+            pass
+
+    log = db.query(LlmCallLog).filter(LlmCallLog.connector_id == connector.id).one()
+    assert log.status == "provider_unavailable"
+
+
+async def test_stream_auth_error_marks_connector_and_audits(db, dj_user, monkeypatch):
+    from app.models.llm_connector import (
+        AUDIT_AUTH_INVALID_OBSERVED,
+        STATUS_AUTH_INVALID,
+        LlmAuditEvent,
+    )
+
+    connector = _make_connector(db, dj_user)
+
+    async def _auth(self, request):
+        raise AuthInvalid("nope")
+        yield  # pragma: no cover
+
+    monkeypatch.setattr(OpenAIApiKeyAdapter, "stream", _auth)
+
+    req = ChatRequest(messages=[Message(role="user", content="hi")])
+    with pytest.raises(AuthInvalid):
+        async for _ in Gateway.stream(db, dj_user, req, purpose="test"):
+            pass
+
+    db.refresh(connector)
+    assert connector.status == STATUS_AUTH_INVALID
+    log = db.query(LlmCallLog).filter(LlmCallLog.connector_id == connector.id).one()
+    assert log.status == "auth_invalid"
+    audit = (
+        db.query(LlmAuditEvent)
+        .filter(
+            LlmAuditEvent.target_connector_id == connector.id,
+            LlmAuditEvent.event_type == AUDIT_AUTH_INVALID_OBSERVED,
+        )
+        .one()
+    )
+    assert audit is not None
+
+
+async def test_stream_consumer_cancel_logs_and_propagates(db, dj_user, monkeypatch):
+    """Consumer stops early (client disconnect) → GeneratorExit, log written once."""
+    connector = _make_connector(db, dj_user)
+
+    async def _infinite(self, request):
+        i = 0
+        while True:
+            yield ChatResponseChunk(text_delta=str(i))
+            i += 1
+
+    monkeypatch.setattr(OpenAIApiKeyAdapter, "stream", _infinite)
+
+    req = ChatRequest(messages=[Message(role="user", content="hi")])
+    agen = Gateway.stream(db, dj_user, req, purpose="test")
+    first = await agen.__anext__()
+    assert first.text_delta == "0"
+    await agen.aclose()  # simulate client disconnect
+
+    log = db.query(LlmCallLog).filter(LlmCallLog.connector_id == connector.id).one()
+    assert log.status == "cancelled"
+    assert log.error_code == "client_disconnect"
diff --git a/server/tests/test_llm_health_check.py b/server/tests/test_llm_health_check.py
new file mode 100644
index 00000000..8eb1c66c
--- /dev/null
+++ b/server/tests/test_llm_health_check.py
@@ -0,0 +1,304 @@
+"""Tests for the shared connector health-check helper (issues #340 + #346).
+
+Covers:
+- ``last_health_check_at`` / ``last_health_check_status`` are written on every
+  invocation (success and failure).
+- AuthInvalid flips ``status`` to ``auth_invalid`` and writes the
+  ``connector_health_check_failed`` audit row only on the active→invalid
+  transition (not when already invalid).
+- Transient failures (rate_limited, provider_unavailable, quota_exceeded) do
+  NOT flip the connector status — they only record the outcome.
+- The manual /test endpoint produces the same observability columns and
+  audit rows as the background monitor (no behavior drift between the two).
+"""
+
+from __future__ import annotations
+
+import json
+from datetime import timedelta
+from unittest.mock import AsyncMock, patch
+
+import pytest
+from fastapi.testclient import TestClient
+
+from app.core.time import utcnow
+from app.models.llm_connector import (
+    AUDIT_AUTH_INVALID_OBSERVED,
+    AUDIT_HEALTH_CHECK,
+    AUDIT_HEALTH_CHECK_FAILED,
+    HEALTH_CHECK_AUTH_INVALID,
+    HEALTH_CHECK_ERROR,
+    HEALTH_CHECK_OK,
+    HEALTH_CHECK_PROVIDER_UNAVAILABLE,
+    HEALTH_CHECK_QUOTA_EXCEEDED,
+    HEALTH_CHECK_RATE_LIMITED,
+    STATUS_ACTIVE,
+    STATUS_AUTH_INVALID,
+    STATUS_DISABLED,
+    LlmAuditEvent,
+    LlmConnector,
+)
+from app.services.llm.exceptions import (
+    AuthInvalid,
+    ProviderUnavailable,
+    QuotaExceeded,
+    RateLimited,
+)
+
+
+def _make_connector(db, user_id: int, *, status: str = STATUS_ACTIVE) -> LlmConnector:
+    row = LlmConnector(
+        user_id=user_id,
+        connector_type="openai_apikey",
+        display_name="Tested",
+        status=status,
+        credentials=json.dumps({"api_key": "sk-key12345678901234567890"}),
+    )
+    db.add(row)
+    db.commit()
+    db.refresh(row)
+    return row
+
+
+def _audit_types(db, connector_id: int) -> list[str]:
+    rows = (
+        db.query(LlmAuditEvent)
+        .filter(LlmAuditEvent.target_connector_id == connector_id)
+        .order_by(LlmAuditEvent.id.asc())
+        .all()
+    )
+    return [r.event_type for r in rows]
+
+
+# ---------- helper API (shared between manual + background) ----------
+
+
+class TestRunHealthCheckHelper:
+    @pytest.mark.asyncio
+    async def test_success_writes_columns_and_audit(self, db, test_user):
+        from app.services.llm.health_check import run_health_check
+
+        row = _make_connector(db, test_user.id)
+        before = utcnow() - timedelta(seconds=1)
+
+        with patch(
+            "app.services.llm.adapters.openai_apikey.OpenAIApiKeyAdapter.health_check",
+            new=AsyncMock(return_value=None),
+        ):
+            outcome = await run_health_check(db, row, actor_user_id=test_user.id)
+        db.commit()
+
+        assert outcome.ok is True
+        assert outcome.status == HEALTH_CHECK_OK
+        assert outcome.status_flipped_to_auth_invalid is False
+
+        db.refresh(row)
+        assert row.last_health_check_status == HEALTH_CHECK_OK
+        assert row.last_health_check_at is not None
+        assert row.last_health_check_at >= before
+        assert row.status == STATUS_ACTIVE
+        assert row.last_error is None
+
+        assert _audit_types(db, row.id) == [AUDIT_HEALTH_CHECK]
+
+    @pytest.mark.asyncio
+    async def test_auth_invalid_flips_status_and_emits_flipped_audit(self, db, test_user):
+        from app.services.llm.health_check import run_health_check
+
+        row = _make_connector(db, test_user.id, status=STATUS_ACTIVE)
+
+        with patch(
+            "app.services.llm.adapters.openai_apikey.OpenAIApiKeyAdapter.health_check",
+            new=AsyncMock(side_effect=AuthInvalid("nope")),
+        ):
+            outcome = await run_health_check(db, row, actor_user_id=test_user.id)
+        db.commit()
+
+        assert outcome.ok is False
+        assert outcome.status == HEALTH_CHECK_AUTH_INVALID
+        assert outcome.status_flipped_to_auth_invalid is True
+
+        db.refresh(row)
+        assert row.status == STATUS_AUTH_INVALID
+        assert row.last_health_check_status == HEALTH_CHECK_AUTH_INVALID
+        assert row.last_error == "auth_invalid"
+
+        types = _audit_types(db, row.id)
+        assert AUDIT_HEALTH_CHECK in types
+        assert AUDIT_AUTH_INVALID_OBSERVED in types
+        assert AUDIT_HEALTH_CHECK_FAILED in types
+
+    @pytest.mark.asyncio
+    async def test_auth_invalid_does_not_re_emit_flipped_when_already_invalid(self, db, test_user):
+        from app.services.llm.health_check import run_health_check
+
+        row = _make_connector(db, test_user.id, status=STATUS_AUTH_INVALID)
+
+        with patch(
+            "app.services.llm.adapters.openai_apikey.OpenAIApiKeyAdapter.health_check",
+            new=AsyncMock(side_effect=AuthInvalid("still broken")),
+        ):
+            outcome = await run_health_check(db, row, actor_user_id=test_user.id)
+        db.commit()
+
+        assert outcome.status_flipped_to_auth_invalid is False
+        db.refresh(row)
+        assert row.status == STATUS_AUTH_INVALID
+        # health_check_failed should NOT be present — already broken on prior pass.
+        types = _audit_types(db, row.id)
+        assert AUDIT_HEALTH_CHECK_FAILED not in types
+
+    @pytest.mark.asyncio
+    async def test_auth_invalid_leaves_disabled_connector_disabled(self, db, test_user):
+        from app.services.llm.health_check import run_health_check
+
+        row = _make_connector(db, test_user.id, status=STATUS_DISABLED)
+
+        with patch(
+            "app.services.llm.adapters.openai_apikey.OpenAIApiKeyAdapter.health_check",
+            new=AsyncMock(side_effect=AuthInvalid("nope")),
+        ):
+            await run_health_check(db, row, actor_user_id=test_user.id)
+        db.commit()
+
+        db.refresh(row)
+        # Disabled must stay disabled — admin force-revoke takes precedence.
+        assert row.status == STATUS_DISABLED
+
+    @pytest.mark.parametrize(
+        ("exc", "expected_status"),
+        [
+            (RateLimited("slow down"), HEALTH_CHECK_RATE_LIMITED),
+            (QuotaExceeded("quota"), HEALTH_CHECK_QUOTA_EXCEEDED),
+            (ProviderUnavailable("5xx"), HEALTH_CHECK_PROVIDER_UNAVAILABLE),
+        ],
+    )
+    @pytest.mark.asyncio
+    async def test_transient_failures_record_outcome_but_do_not_flip_status(
+        self, db, test_user, exc, expected_status
+    ):
+        from app.services.llm.health_check import run_health_check
+
+        row = _make_connector(db, test_user.id, status=STATUS_ACTIVE)
+
+        with patch(
+            "app.services.llm.adapters.openai_apikey.OpenAIApiKeyAdapter.health_check",
+            new=AsyncMock(side_effect=exc),
+        ):
+            outcome = await run_health_check(db, row, actor_user_id=test_user.id)
+        db.commit()
+
+        assert outcome.ok is False
+        assert outcome.status == expected_status
+
+        db.refresh(row)
+        # Transient — status stays active so the gateway will still try it.
+        assert row.status == STATUS_ACTIVE
+        assert row.last_health_check_status == expected_status
+
+    @pytest.mark.asyncio
+    async def test_unexpected_exception_records_error_and_does_not_raise(self, db, test_user):
+        from app.services.llm.health_check import run_health_check
+
+        row = _make_connector(db, test_user.id, status=STATUS_ACTIVE)
+
+        with patch(
+            "app.services.llm.adapters.openai_apikey.OpenAIApiKeyAdapter.health_check",
+            new=AsyncMock(side_effect=RuntimeError("totally unexpected")),
+        ):
+            outcome = await run_health_check(db, row, actor_user_id=test_user.id)
+        db.commit()
+
+        assert outcome.ok is False
+        assert outcome.status == HEALTH_CHECK_ERROR
+        db.refresh(row)
+        # Status not flipped on truly unknown errors — DJ retries.
+        assert row.status == STATUS_ACTIVE
+        assert row.last_health_check_status == HEALTH_CHECK_ERROR
+
+    @pytest.mark.asyncio
+    async def test_success_after_auth_invalid_clears_status(self, db, test_user):
+        from app.services.llm.health_check import run_health_check
+
+        row = _make_connector(db, test_user.id, status=STATUS_AUTH_INVALID)
+        row.last_error = "auth_invalid"
+        db.commit()
+
+        with patch(
+            "app.services.llm.adapters.openai_apikey.OpenAIApiKeyAdapter.health_check",
+            new=AsyncMock(return_value=None),
+        ):
+            outcome = await run_health_check(db, row, actor_user_id=test_user.id)
+        db.commit()
+
+        assert outcome.ok is True
+        db.refresh(row)
+        assert row.status == STATUS_ACTIVE
+        assert row.last_error is None
+        assert row.last_health_check_status == HEALTH_CHECK_OK
+
+
+# ---------- manual /test endpoint parity ----------
+
+
+class TestManualTestEndpointParity:
+    """The DJ-triggered test button must produce the same observability + audit
+    rows as the background monitor — that's the whole point of issue #346.
+    """
+
+    def test_test_endpoint_writes_health_columns_on_success(
+        self, client: TestClient, auth_headers, db, test_user
+    ):
+        row = _make_connector(db, test_user.id)
+
+        with patch(
+            "app.services.llm.adapters.openai_apikey.OpenAIApiKeyAdapter.health_check",
+            new=AsyncMock(return_value=None),
+        ):
+            resp = client.post(f"/api/llm/connectors/{row.id}/test", headers=auth_headers)
+        assert resp.status_code == 200
+        assert resp.json()["ok"] is True
+
+        db.refresh(row)
+        assert row.last_health_check_status == HEALTH_CHECK_OK
+        assert row.last_health_check_at is not None
+        assert AUDIT_HEALTH_CHECK in _audit_types(db, row.id)
+
+    def test_test_endpoint_writes_health_columns_on_auth_invalid(
+        self, client: TestClient, auth_headers, db, test_user
+    ):
+        row = _make_connector(db, test_user.id)
+
+        with patch(
+            "app.services.llm.adapters.openai_apikey.OpenAIApiKeyAdapter.health_check",
+            new=AsyncMock(side_effect=AuthInvalid("nope")),
+        ):
+            resp = client.post(f"/api/llm/connectors/{row.id}/test", headers=auth_headers)
+        assert resp.status_code == 200
+        body = resp.json()
+        assert body["ok"] is False
+        assert body["error_code"] == "auth_invalid"
+
+        db.refresh(row)
+        assert row.status == STATUS_AUTH_INVALID
+        assert row.last_health_check_status == HEALTH_CHECK_AUTH_INVALID
+
+    def test_test_endpoint_response_exposes_new_columns_via_listing(
+        self, client: TestClient, auth_headers, db, test_user
+    ):
+        row = _make_connector(db, test_user.id)
+
+        with patch(
+            "app.services.llm.adapters.openai_apikey.OpenAIApiKeyAdapter.health_check",
+            new=AsyncMock(return_value=None),
+        ):
+            client.post(f"/api/llm/connectors/{row.id}/test", headers=auth_headers)
+
+        # The DJ listing now exposes the two new columns
+        resp = client.get("/api/llm/connectors", headers=auth_headers)
+        assert resp.status_code == 200
+        entries = resp.json()
+        assert len(entries) == 1
+        e = entries[0]
+        assert e["last_health_check_status"] == HEALTH_CHECK_OK
+        assert e["last_health_check_at"] is not None
diff --git a/server/tests/test_llm_health_monitor.py b/server/tests/test_llm_health_monitor.py
new file mode 100644
index 00000000..e01c091e
--- /dev/null
+++ b/server/tests/test_llm_health_monitor.py
@@ -0,0 +1,301 @@
+"""Tests for the background connector health monitor (issue #340).
+
+Covers:
+- Only active connectors that are overdue get checked.
+- Disabled / fresh connectors are skipped.
+- A successful pass writes ``last_health_check_at`` on each due connector.
+- A flip from active → auth_invalid triggers a notification.
+- A pass survives an adapter exception on one connector and keeps going.
+- Per-connector jitter is deterministic so the schedule doesn't shuffle.
+- The env-var interval is clamped to safe bounds.
+"""
+
+from __future__ import annotations
+
+import json
+from datetime import timedelta
+from unittest.mock import AsyncMock, patch
+
+import pytest
+
+from app.core.time import utcnow
+from app.models.llm_connector import (
+    HEALTH_CHECK_AUTH_INVALID,
+    HEALTH_CHECK_OK,
+    STATUS_ACTIVE,
+    STATUS_AUTH_INVALID,
+    STATUS_DISABLED,
+    LlmConnector,
+)
+from app.services.llm.exceptions import AuthInvalid
+from app.services.llm.health_monitor import (
+    _get_interval_seconds,
+    _is_due,
+    _jitter_factor,
+    _select_due_connectors,
+    run_monitor_pass,
+)
+
+_counter = {"n": 0}
+
+
+def _make(db, user_id: int, *, status: str = STATUS_ACTIVE, last_check: object = None):
+    _counter["n"] += 1
+    row = LlmConnector(
+        user_id=user_id,
+        connector_type="openai_apikey",
+        display_name=f"user{user_id}-conn-{_counter['n']}",
+        status=status,
+        credentials=json.dumps({"api_key": "sk-key12345678901234567890"}),
+        last_health_check_at=last_check,
+    )
+    db.add(row)
+    db.commit()
+    db.refresh(row)
+    return row
+
+
+# ---------- env-var interval ----------
+
+
+class TestIntervalConfig:
+    def test_default_interval_when_env_unset(self, monkeypatch):
+        monkeypatch.delenv("LLM_HEALTH_CHECK_INTERVAL_HOURS", raising=False)
+        assert _get_interval_seconds() == 6 * 3600
+
+    def test_env_override_applied(self, monkeypatch):
+        monkeypatch.setenv("LLM_HEALTH_CHECK_INTERVAL_HOURS", "12")
+        assert _get_interval_seconds() == 12 * 3600
+
+    def test_invalid_env_falls_back_to_default(self, monkeypatch):
+        monkeypatch.setenv("LLM_HEALTH_CHECK_INTERVAL_HOURS", "not-a-number")
+        assert _get_interval_seconds() == 6 * 3600
+
+    def test_too_low_clamped_to_floor(self, monkeypatch):
+        monkeypatch.setenv("LLM_HEALTH_CHECK_INTERVAL_HOURS", "0")
+        assert _get_interval_seconds() == 3600  # 1h floor
+
+    def test_too_high_clamped_to_ceiling(self, monkeypatch):
+        monkeypatch.setenv("LLM_HEALTH_CHECK_INTERVAL_HOURS", "9999")
+        assert _get_interval_seconds() == 168 * 3600  # 7d ceiling
+
+
+# ---------- jitter ----------
+
+
+class TestJitter:
+    def test_jitter_is_deterministic_per_id(self):
+        assert _jitter_factor(1) == _jitter_factor(1)
+        assert _jitter_factor(42) == _jitter_factor(42)
+
+    def test_jitter_within_bounds(self):
+        # All factors in [0.7, 1.3) per the docstring contract.
+        for i in range(1, 100):
+            f = _jitter_factor(i)
+            assert 0.7 <= f < 1.3
+
+    def test_jitter_spreads_connectors(self):
+        # Sample a few hundred ids — the band should be reasonably populated
+        # (not all clumped at one end).
+        factors = [_jitter_factor(i) for i in range(1, 300)]
+        low = sum(1 for f in factors if f < 1.0)
+        high = sum(1 for f in factors if f >= 1.0)
+        # Not a statistics test — just confirms the hash isn't a constant.
+        assert low > 50
+        assert high > 50
+
+
+# ---------- _is_due / _select_due_connectors ----------
+
+
+class TestDueSelection:
+    def test_never_checked_is_due(self, db, test_user):
+        row = _make(db, test_user.id, last_check=None)
+        assert _is_due(row) is True
+
+    def test_recently_checked_is_not_due(self, db, test_user):
+        row = _make(db, test_user.id, last_check=utcnow() - timedelta(minutes=5))
+        assert _is_due(row) is False
+
+    def test_overdue_is_due(self, db, test_user, monkeypatch):
+        # Force a tight interval so overdue triggers reliably regardless of jitter.
+        monkeypatch.setenv("LLM_HEALTH_CHECK_INTERVAL_HOURS", "1")
+        row = _make(db, test_user.id, last_check=utcnow() - timedelta(hours=24))
+        assert _is_due(row) is True
+
+    def test_select_due_skips_disabled(self, db, test_user):
+        active = _make(db, test_user.id, status=STATUS_ACTIVE, last_check=None)
+        _make(db, test_user.id, status=STATUS_DISABLED, last_check=None)
+        _make(db, test_user.id, status=STATUS_AUTH_INVALID, last_check=None)
+
+        due = _select_due_connectors(db)
+        due_ids = [c.id for c in due]
+        assert active.id in due_ids
+        # auth_invalid + disabled are excluded — the monitor only re-checks
+        # active connectors. (auth_invalid stays invalid until the DJ rotates.)
+        assert len(due) == 1
+
+
+# ---------- run_monitor_pass ----------
+
+
+@pytest.mark.asyncio
+async def test_monitor_pass_checks_every_due_connector(db, test_user):
+    a = _make(db, test_user.id, last_check=None)
+    b = _make(db, test_user.id, last_check=None)
+    c = _make(db, test_user.id, status=STATUS_DISABLED, last_check=None)
+
+    with (
+        patch(
+            "app.services.llm.adapters.openai_apikey.OpenAIApiKeyAdapter.health_check",
+            new=AsyncMock(return_value=None),
+        ),
+        patch(
+            "app.services.llm.health_monitor._PER_CHECK_SLEEP_SECONDS",
+            0,
+        ),
+    ):
+        checked = await run_monitor_pass(db)
+
+    assert checked == 2
+    db.refresh(a)
+    db.refresh(b)
+    db.refresh(c)
+    assert a.last_health_check_status == HEALTH_CHECK_OK
+    assert b.last_health_check_status == HEALTH_CHECK_OK
+    assert c.last_health_check_at is None  # disabled — skipped
+
+
+@pytest.mark.asyncio
+async def test_monitor_pass_notifies_on_first_flip_to_auth_invalid(db, test_user):
+    row = _make(db, test_user.id, last_check=None)
+
+    with (
+        patch(
+            "app.services.llm.adapters.openai_apikey.OpenAIApiKeyAdapter.health_check",
+            new=AsyncMock(side_effect=AuthInvalid("revoked upstream")),
+        ),
+        patch(
+            "app.services.llm.health_monitor._PER_CHECK_SLEEP_SECONDS",
+            0,
+        ),
+        patch(
+            "app.services.llm.health_monitor._notify_dj_auth_invalid",
+        ) as notify,
+    ):
+        await run_monitor_pass(db)
+
+    db.refresh(row)
+    assert row.status == STATUS_AUTH_INVALID
+    assert row.last_health_check_status == HEALTH_CHECK_AUTH_INVALID
+    notify.assert_called_once()
+    notified_connector = notify.call_args.args[1]
+    assert notified_connector.id == row.id
+
+
+@pytest.mark.asyncio
+async def test_monitor_pass_survives_individual_failure(db, test_user):
+    good = _make(db, test_user.id, last_check=None)
+    bad = _make(db, test_user.id, last_check=None)
+
+    call_count = {"n": 0}
+
+    async def fake_check(*args, **kwargs):
+        call_count["n"] += 1
+        if call_count["n"] == 1:
+            raise RuntimeError("first one explodes")
+        return None
+
+    with (
+        patch(
+            "app.services.llm.adapters.openai_apikey.OpenAIApiKeyAdapter.health_check",
+            new=fake_check,
+        ),
+        patch(
+            "app.services.llm.health_monitor._PER_CHECK_SLEEP_SECONDS",
+            0,
+        ),
+    ):
+        checked = await run_monitor_pass(db)
+
+    # Both checks were attempted (even after the first one's adapter raised).
+    assert checked == 2
+    # At least one of the two was successfully updated.
+    db.refresh(good)
+    db.refresh(bad)
+    statuses = [good.last_health_check_status, bad.last_health_check_status]
+    assert HEALTH_CHECK_OK in statuses
+
+
+@pytest.mark.asyncio
+async def test_monitor_pass_no_due_connectors_returns_zero(db, test_user):
+    # Just-checked connector — not due.
+    _make(db, test_user.id, last_check=utcnow() - timedelta(minutes=1))
+
+    with patch(
+        "app.services.llm.adapters.openai_apikey.OpenAIApiKeyAdapter.health_check",
+        new=AsyncMock(return_value=None),
+    ):
+        checked = await run_monitor_pass(db)
+    assert checked == 0
+
+
+# ---------- notification ----------
+
+
+def test_notify_dj_falls_back_to_log_when_email_not_configured(db, test_user, caplog):
+    from app.services.email_sender import EmailNotConfiguredError
+    from app.services.llm.health_monitor import _notify_dj_auth_invalid
+
+    # User HAS an email — the failure is at the sender layer (no Resend key).
+    test_user.email = "dj@example.com"
+    db.commit()
+    row = _make(db, test_user.id)
+
+    with patch(
+        "app.services.email_sender.send_connector_auth_invalid_notification",
+        side_effect=EmailNotConfiguredError("nope"),
+    ):
+        with caplog.at_level("WARNING"):
+            _notify_dj_auth_invalid(db, row)
+
+    assert any("email not configured" in r.message.lower() for r in caplog.records)
+
+
+def test_notify_dj_logs_when_user_has_no_email(db, caplog):
+    from app.models.user import User
+    from app.services.llm.health_monitor import _notify_dj_auth_invalid
+
+    user_noemail = User(
+        username="silent",
+        password_hash="x",
+        email=None,
+        role="dj",
+    )
+    db.add(user_noemail)
+    db.commit()
+    db.refresh(user_noemail)
+    row = _make(db, user_noemail.id)
+
+    with caplog.at_level("WARNING"):
+        _notify_dj_auth_invalid(db, row)
+    assert any("no email on file" in r.message.lower() for r in caplog.records)
+
+
+def test_notify_dj_sends_email_when_configured(db, test_user):
+    from app.services.llm.health_monitor import _notify_dj_auth_invalid
+
+    test_user.email = "dj@example.com"
+    db.commit()
+    row = _make(db, test_user.id)
+
+    with patch(
+        "app.services.email_sender.send_connector_auth_invalid_notification",
+    ) as sender:
+        _notify_dj_auth_invalid(db, row)
+
+    sender.assert_called_once()
+    kwargs = sender.call_args.kwargs
+    assert kwargs["to_address"] == "dj@example.com"
+    assert kwargs["display_name"] == row.display_name
+    assert kwargs["connector_type"] == row.connector_type
diff --git a/server/tests/test_llm_hooks.py b/server/tests/test_llm_hooks.py
index 0b4a8be0..62c9d542 100644
--- a/server/tests/test_llm_hooks.py
+++ b/server/tests/test_llm_hooks.py
@@ -19,36 +19,66 @@
 from app.services.recommendation.scorer import EventProfile
 
 
+def _add_active_connector(db, user):
+    """Insert an active LLM connector owned by ``user`` so the gateway resolver
+    (and therefore ``is_llm_available``) sees an available connector."""
+    import json
+
+    from app.models.llm_connector import LlmConnector
+
+    connector = LlmConnector(
+        user_id=user.id,
+        connector_type="anthropic_apikey",
+        display_name="Test",
+        status="active",
+        credentials=json.dumps({"api_key": "sk-ant-fakefakefakefakefakefakefakefakefakefake"}),
+        model_hint="claude-haiku-4-5-20251001",
+    )
+    db.add(connector)
+    db.commit()
+    db.refresh(connector)
+    return connector
+
+
 class TestIsLLMAvailable:
-    @patch("app.core.config.get_settings")
-    def test_returns_true_when_key_set(self, mock_settings):
-        mock_settings.return_value.anthropic_api_key = "sk-ant-test"
-        assert is_llm_available() is True
-
-    @patch("app.core.config.get_settings")
-    def test_returns_false_when_key_empty(self, mock_settings):
-        mock_settings.return_value.anthropic_api_key = ""
+    """``is_llm_available`` is connector-backed only.
+
+    The legacy ``ANTHROPIC_API_KEY`` env-var fallback was removed in #343, so a
+    call without ``db`` can never resolve a connector and returns ``False``.
+    """
+
+    def test_returns_false_without_db(self):
         assert is_llm_available() is False
 
-    @patch("app.core.config.get_settings")
-    def test_returns_false_when_llm_disabled_in_settings(self, mock_settings, db: Session):
-        """When API key is set but llm_enabled is False in DB, returns False."""
-        mock_settings.return_value.anthropic_api_key = "sk-ant-test"
+    def test_returns_false_without_db_even_with_actor(self):
+        from unittest.mock import MagicMock
+
+        assert is_llm_available(actor=MagicMock()) is False
+
+    def test_returns_false_when_llm_disabled_in_settings(self, db: Session, test_user):
+        """When a connector exists but llm_enabled is False in DB, returns False."""
         from app.services.system_settings import update_system_settings
 
+        _add_active_connector(db, test_user)
         update_system_settings(db, llm_enabled=False)
-        assert is_llm_available(db) is False
+        assert is_llm_available(db, actor=test_user) is False
         # Reset
         update_system_settings(db, llm_enabled=True)
 
-    @patch("app.core.config.get_settings")
-    def test_returns_true_when_llm_enabled_and_key_set(self, mock_settings, db: Session):
-        """When API key is set and llm_enabled is True in DB, returns True."""
-        mock_settings.return_value.anthropic_api_key = "sk-ant-test"
+    def test_returns_true_when_llm_enabled_and_actor_connector(self, db: Session, test_user):
+        """When the actor owns an active connector and llm_enabled is True, returns True."""
+        from app.services.system_settings import update_system_settings
+
+        _add_active_connector(db, test_user)
+        update_system_settings(db, llm_enabled=True)
+        assert is_llm_available(db, actor=test_user) is True
+
+    def test_returns_false_without_connector(self, db: Session, test_user):
+        """No connector and no org default -> not available."""
         from app.services.system_settings import update_system_settings
 
         update_system_settings(db, llm_enabled=True)
-        assert is_llm_available(db) is True
+        assert is_llm_available(db, actor=test_user) is False
 
 
 class TestGenerateLLMSuggestions:
@@ -72,6 +102,8 @@ async def test_delegates_to_llm_client(self, mock_call_llm):
             tracks=None,
             rejected_tracks=None,
             currently_playing=None,
+            db=None,
+            actor=None,
         )
 
     @pytest.mark.asyncio
@@ -97,6 +129,8 @@ async def test_passes_tracks_to_llm_client(self, mock_call_llm):
             tracks=tracks,
             rejected_tracks=None,
             currently_playing=None,
+            db=None,
+            actor=None,
         )
 
 
diff --git a/server/tests/test_llm_openrouter_models.py b/server/tests/test_llm_openrouter_models.py
new file mode 100644
index 00000000..8707cec4
--- /dev/null
+++ b/server/tests/test_llm_openrouter_models.py
@@ -0,0 +1,143 @@
+"""Tests for the OpenRouter model-catalogue fetcher + TTL cache."""
+
+from __future__ import annotations
+
+from unittest.mock import patch
+
+import httpx
+import pytest
+
+from app.services.llm import openrouter_models as om
+
+_HTTPX_PATH = "app.services.llm.openrouter_models.httpx.AsyncClient"
+
+
+class _AsyncClient:
+    """Minimal httpx.AsyncClient stub supporting .get()."""
+
+    def __init__(self, response: httpx.Response | Exception):
+        self._response = response
+        self.calls = 0
+
+    async def __aenter__(self):
+        return self
+
+    async def __aexit__(self, *args):
+        return None
+
+    async def get(self, url):
+        self.calls += 1
+        if isinstance(self._response, Exception):
+            raise self._response
+        return self._response
+
+
+def _models_body(*ids):
+    return {"data": [{"id": i, "name": i.split("/")[-1]} for i in ids]}
+
+
+def _ok(json_body):
+    return httpx.Response(
+        200,
+        request=httpx.Request("GET", om.OPENROUTER_MODELS_URL),
+        json=json_body,
+    )
+
+
+@pytest.fixture(autouse=True)
+def _clear_cache():
+    om._reset_cache_for_tests()
+    yield
+    om._reset_cache_for_tests()
+
+
+@pytest.mark.asyncio
+async def test_fetches_and_parses_models():
+    client = _AsyncClient(_ok(_models_body("openai/gpt-4o-mini", "anthropic/claude-3.5-sonnet")))
+    with patch(_HTTPX_PATH, return_value=client):
+        models = await om.get_openrouter_models()
+    ids = [m.id for m in models]
+    assert ids == ["openai/gpt-4o-mini", "anthropic/claude-3.5-sonnet"]
+    assert models[0].name == "gpt-4o-mini"
+
+
+@pytest.mark.asyncio
+async def test_second_call_uses_cache_no_refetch():
+    client = _AsyncClient(_ok(_models_body("openai/gpt-4o-mini")))
+    with patch(_HTTPX_PATH, return_value=client):
+        await om.get_openrouter_models()
+        await om.get_openrouter_models()
+    # Second call should be served from cache — only one HTTP fetch.
+    assert client.calls == 1
+
+
+@pytest.mark.asyncio
+async def test_expired_cache_refetches():
+    client = _AsyncClient(_ok(_models_body("openai/gpt-4o-mini")))
+    with patch(_HTTPX_PATH, return_value=client):
+        await om.get_openrouter_models()
+        # Force the cache to look stale.
+        fetched_at, models = om._cache
+        om._cache = (fetched_at - om.CACHE_TTL_SECONDS - 1, models)
+        await om.get_openrouter_models()
+    assert client.calls == 2
+
+
+@pytest.mark.asyncio
+async def test_force_refresh_bypasses_cache():
+    client = _AsyncClient(_ok(_models_body("openai/gpt-4o-mini")))
+    with patch(_HTTPX_PATH, return_value=client):
+        await om.get_openrouter_models()
+        await om.get_openrouter_models(force_refresh=True)
+    assert client.calls == 2
+
+
+@pytest.mark.asyncio
+async def test_fetch_failure_returns_empty_when_no_cache():
+    client = _AsyncClient(httpx.TimeoutException("timeout"))
+    with patch(_HTTPX_PATH, return_value=client):
+        models = await om.get_openrouter_models()
+    assert models == []
+
+
+@pytest.mark.asyncio
+async def test_fetch_failure_returns_stale_cache():
+    good = _AsyncClient(_ok(_models_body("openai/gpt-4o-mini")))
+    with patch(_HTTPX_PATH, return_value=good):
+        await om.get_openrouter_models()
+
+    # Now expire the cache and make the next fetch fail — stale cache served.
+    fetched_at, models = om._cache
+    om._cache = (fetched_at - om.CACHE_TTL_SECONDS - 1, models)
+    bad = _AsyncClient(httpx.ConnectError("boom"))
+    with patch(_HTTPX_PATH, return_value=bad):
+        out = await om.get_openrouter_models()
+    assert [m.id for m in out] == ["openai/gpt-4o-mini"]
+
+
+@pytest.mark.asyncio
+async def test_http_5xx_returns_empty_when_no_cache():
+    resp = httpx.Response(
+        503, request=httpx.Request("GET", om.OPENROUTER_MODELS_URL), json={"error": "down"}
+    )
+    client = _AsyncClient(resp)
+    with patch(_HTTPX_PATH, return_value=client):
+        models = await om.get_openrouter_models()
+    assert models == []
+
+
+@pytest.mark.asyncio
+async def test_malformed_body_returns_empty():
+    client = _AsyncClient(_ok({"unexpected": "shape"}))
+    with patch(_HTTPX_PATH, return_value=client):
+        models = await om.get_openrouter_models()
+    assert models == []
+
+
+@pytest.mark.asyncio
+async def test_entries_missing_id_are_skipped():
+    body = {"data": [{"name": "no id"}, {"id": "openai/gpt-4o-mini"}]}
+    client = _AsyncClient(_ok(body))
+    with patch(_HTTPX_PATH, return_value=client):
+        models = await om.get_openrouter_models()
+    assert [m.id for m in models] == ["openai/gpt-4o-mini"]
diff --git a/server/tests/test_llm_plugin_loader.py b/server/tests/test_llm_plugin_loader.py
new file mode 100644
index 00000000..30762960
--- /dev/null
+++ b/server/tests/test_llm_plugin_loader.py
@@ -0,0 +1,116 @@
+"""Tests for the ``LLM_PLUGIN_DIR`` filesystem plug-in loader.
+
+The loader is an optional surface — production deploys typically leave the
+env var unset and ship trusted adapters as ordinary Python modules. These
+tests pin its documented behaviour:
+
+- Importable ``.py`` files are loaded.
+- Files starting with ``_`` and any non-``.py`` files are skipped.
+- A single broken plug-in logs an error and does **not** stop loading the
+  rest of the directory.
+- The loader does not mutate ``sys.path`` (no namespace leakage).
+"""
+
+from __future__ import annotations
+
+import logging
+import sys
+
+import pytest
+
+from app.services.llm import plugin_loader
+
+
+@pytest.fixture
+def isolated_sys_path():
+    """Snapshot and restore ``sys.path`` around each loader test.
+
+    The loader is explicitly documented to *not* add the plug-in directory to
+    ``sys.path``. Snapshotting here lets us assert that no entry leaks out.
+    """
+    before = list(sys.path)
+    yield
+    sys.path[:] = before
+
+
+@pytest.fixture
+def cleanup_test_modules():
+    """Drop any ``llm_plugins.*`` modules between tests so re-imports re-execute."""
+    yield
+    for name in list(sys.modules):
+        if name.startswith("llm_plugins."):
+            sys.modules.pop(name, None)
+
+
+def _write_plugin(dir_path, name: str, body: str) -> None:
+    (dir_path / name).write_text(body)
+
+
+def test_no_env_var_loads_nothing(monkeypatch):
+    monkeypatch.delenv(plugin_loader.ENV_VAR, raising=False)
+    assert plugin_loader.load_plugins_from_env() == []
+
+
+def test_nonexistent_directory_is_skipped_with_warning(monkeypatch, tmp_path, caplog):
+    missing = tmp_path / "does-not-exist"
+    monkeypatch.setenv(plugin_loader.ENV_VAR, str(missing))
+    with caplog.at_level(logging.WARNING):
+        assert plugin_loader.load_plugins_from_env() == []
+    assert any("does not exist" in r.message for r in caplog.records)
+
+
+def test_loads_py_files_skipping_underscore_and_non_py(
+    monkeypatch, tmp_path, isolated_sys_path, cleanup_test_modules
+):
+    # A loadable plug-in — registers nothing, just imports cleanly. We use a
+    # noop body to keep the assertion focused on file selection rather than
+    # registry side-effects (the contract test in test_llm_adapter_contract.py
+    # already covers the end-to-end registration path via the docs skeleton).
+    _write_plugin(tmp_path, "good.py", "X = 1\n")
+    # Anything starting with ``_`` is skipped (e.g. shared helpers).
+    _write_plugin(tmp_path, "_helper.py", "raise RuntimeError('should not load')\n")
+    # Non-``.py`` files are skipped.
+    _write_plugin(tmp_path, "README.md", "not python\n")
+    # Subdirectories are skipped (no recursion).
+    (tmp_path / "subdir").mkdir()
+    (tmp_path / "subdir" / "nested.py").write_text("X = 2\n")
+
+    monkeypatch.setenv(plugin_loader.ENV_VAR, str(tmp_path))
+    loaded = plugin_loader.load_plugins_from_env()
+    assert loaded == ["llm_plugins.good"]
+    # The loader must not contaminate sys.path with the plug-in directory.
+    assert str(tmp_path) not in sys.path
+
+
+def test_one_broken_plugin_does_not_block_others(
+    monkeypatch, tmp_path, isolated_sys_path, cleanup_test_modules, caplog
+):
+    # Sorted load order: 'a' then 'z'. 'a' is broken; 'z' must still load.
+    _write_plugin(tmp_path, "a_broken.py", "raise ValueError('boom at import')\n")
+    _write_plugin(tmp_path, "z_good.py", "X = 1\n")
+
+    monkeypatch.setenv(plugin_loader.ENV_VAR, str(tmp_path))
+    with caplog.at_level(logging.ERROR):
+        loaded = plugin_loader.load_plugins_from_env()
+
+    assert loaded == ["llm_plugins.z_good"]
+    # The error log should include the offending file name AND the stack
+    # trace; operators rely on this to diagnose third-party imports.
+    error_messages = [r.message for r in caplog.records if r.levelno >= logging.ERROR]
+    assert any("a_broken.py" in m for m in error_messages)
+    assert any("ValueError" in m and "boom at import" in m for m in error_messages)
+
+
+def test_failed_plugin_does_not_leak_into_sys_modules(
+    monkeypatch, tmp_path, isolated_sys_path, cleanup_test_modules
+):
+    _write_plugin(tmp_path, "broken.py", "raise RuntimeError('nope')\n")
+    monkeypatch.setenv(plugin_loader.ENV_VAR, str(tmp_path))
+    plugin_loader.load_plugins_from_env()
+    assert "llm_plugins.broken" not in sys.modules
+
+
+def test_load_from_dir_accepts_explicit_path(tmp_path, isolated_sys_path, cleanup_test_modules):
+    _write_plugin(tmp_path, "direct.py", "X = 1\n")
+    loaded = plugin_loader.load_plugins_from_dir(tmp_path)
+    assert loaded == ["llm_plugins.direct"]
diff --git a/server/tests/test_llm_quota_cap.py b/server/tests/test_llm_quota_cap.py
new file mode 100644
index 00000000..4b4c7ba8
--- /dev/null
+++ b/server/tests/test_llm_quota_cap.py
@@ -0,0 +1,287 @@
+"""Tests for per-DJ monthly token caps (issue #339)."""
+
+from __future__ import annotations
+
+import json
+from datetime import timedelta
+from unittest.mock import AsyncMock, patch
+
+import pytest
+
+from app.core.time import utcnow
+from app.models.llm_connector import LlmCallLog, LlmConnector
+from app.models.user import User
+from app.services.auth import get_password_hash
+from app.services.llm.adapters.openai_apikey import OpenAIApiKeyAdapter
+from app.services.llm.base import ChatRequest, ChatResponse, Message, TokenUsage
+from app.services.llm.connector_storage import (
+    current_month_token_usage,
+    current_month_token_usage_bulk,
+    set_monthly_cap,
+)
+from app.services.llm.exceptions import LlmError, QuotaCapReached
+from app.services.llm.gateway import Gateway
+
+
+def _make_dj(db, username="capdj"):
+    user = User(username=username, password_hash=get_password_hash("password123"), role="dj")
+    db.add(user)
+    db.commit()
+    db.refresh(user)
+    return user
+
+
+def _make_connector(db, user, *, monthly_token_cap=None, display_name="Cap connector"):
+    row = LlmConnector(
+        user_id=user.id,
+        connector_type="openai_apikey",
+        display_name=display_name,
+        status="active",
+        credentials=json.dumps({"api_key": "sk-fake-key"}),
+        model_hint="gpt-5-mini",
+        monthly_token_cap=monthly_token_cap,
+    )
+    db.add(row)
+    db.commit()
+    db.refresh(row)
+    return row
+
+
+def _log(db, connector_id, *, tokens_in, tokens_out, when=None):
+    row = LlmCallLog(
+        connector_id=connector_id,
+        purpose="test",
+        status="ok",
+        latency_ms=10,
+        tokens_in=tokens_in,
+        tokens_out=tokens_out,
+    )
+    db.add(row)
+    db.flush()
+    if when is not None:
+        row.created_at = when
+    db.commit()
+    return row
+
+
+def _req() -> ChatRequest:
+    return ChatRequest(messages=[Message(role="user", content="hi")])
+
+
+# --- Exception ---------------------------------------------------------------
+
+
+def test_quota_cap_reached_is_llm_error():
+    exc = QuotaCapReached("cap reached")
+    assert isinstance(exc, LlmError)
+    assert str(exc) == "cap reached"
+
+
+# --- Model column ------------------------------------------------------------
+
+
+def test_connector_defaults_to_no_cap(db):
+    user = _make_dj(db)
+    connector = _make_connector(db, user)
+    assert connector.monthly_token_cap is None
+
+
+def test_connector_stores_cap(db):
+    user = _make_dj(db, username="capdj2")
+    connector = _make_connector(db, user, monthly_token_cap=100_000)
+    db.refresh(connector)
+    assert connector.monthly_token_cap == 100_000
+
+
+def test_db_rejects_negative_cap(db):
+    """The DB CHECK constraint backstops the app-layer ``ge=0`` guard (#354).
+
+    The API schema (``ge=0``) and ``set_monthly_cap`` already reject negatives;
+    this proves ``ck_llm_connectors_monthly_token_cap_nonnegative`` refuses to
+    persist one even if those layers were bypassed (defence-in-depth).
+    """
+    from sqlalchemy.exc import IntegrityError
+
+    user = _make_dj(db, username="capneg")
+    row = LlmConnector(
+        user_id=user.id,
+        connector_type="openai_apikey",
+        display_name="neg cap",
+        status="active",
+        credentials=json.dumps({"api_key": "sk-fake-key"}),
+        model_hint="gpt-5-mini",
+        monthly_token_cap=-1,
+    )
+    db.add(row)
+    with pytest.raises(IntegrityError):
+        db.commit()
+    db.rollback()
+
+
+# --- Aggregation + setter helpers --------------------------------------------
+
+
+def test_current_month_usage_sums_in_and_out(db):
+    user = _make_dj(db, username="usagedj")
+    connector = _make_connector(db, user)
+    _log(db, connector.id, tokens_in=100, tokens_out=50)
+    _log(db, connector.id, tokens_in=10, tokens_out=5)
+    assert current_month_token_usage(db, connector.id) == 165
+
+
+def test_current_month_usage_excludes_prior_months(db):
+    user = _make_dj(db, username="usagedj2")
+    connector = _make_connector(db, user)
+    # 40 days ago — previous month, must be excluded.
+    _log(db, connector.id, tokens_in=1000, tokens_out=1000, when=utcnow() - timedelta(days=40))
+    _log(db, connector.id, tokens_in=7, tokens_out=3)
+    assert current_month_token_usage(db, connector.id) == 10
+
+
+def test_current_month_usage_treats_null_tokens_as_zero(db):
+    user = _make_dj(db, username="usagedj3")
+    connector = _make_connector(db, user)
+    _log(db, connector.id, tokens_in=None, tokens_out=None)
+    _log(db, connector.id, tokens_in=5, tokens_out=None)
+    assert current_month_token_usage(db, connector.id) == 5
+
+
+def test_current_month_usage_zero_when_no_rows(db):
+    user = _make_dj(db, username="usagedj4")
+    connector = _make_connector(db, user)
+    assert current_month_token_usage(db, connector.id) == 0
+
+
+def test_bulk_usage_aggregates_per_connector(db):
+    # The bulk helper backs the admin list endpoint: one grouped query for many
+    # connectors instead of N+1 (CodeRabbit #377). It must match the per-row
+    # helper, scope to the current month, and key results by connector id.
+    user = _make_dj(db, username="bulkdj")
+    c1 = _make_connector(db, user, display_name="bulk-c1")
+    c2 = _make_connector(db, user, display_name="bulk-c2")
+    c3 = _make_connector(db, user, display_name="bulk-c3")  # no rows this month
+    _log(db, c1.id, tokens_in=100, tokens_out=50)
+    _log(db, c1.id, tokens_in=10, tokens_out=5)
+    _log(db, c2.id, tokens_in=7, tokens_out=3)
+    # Prior-month row on c2 must be excluded.
+    _log(db, c2.id, tokens_in=999, tokens_out=999, when=utcnow() - timedelta(days=40))
+
+    usage = current_month_token_usage_bulk(db, [c1.id, c2.id, c3.id])
+    assert usage[c1.id] == 165
+    assert usage[c2.id] == 10
+    # Connectors with no current-month rows are absent (caller defaults to 0).
+    assert c3.id not in usage
+    # Parity with the per-row helper.
+    assert usage[c1.id] == current_month_token_usage(db, c1.id)
+
+
+def test_bulk_usage_empty_input_returns_empty_dict(db):
+    assert current_month_token_usage_bulk(db, []) == {}
+
+
+def test_set_monthly_cap_accepts_positive_int(db):
+    user = _make_dj(db, username="capset")
+    connector = _make_connector(db, user)
+    set_monthly_cap(connector, 50_000)
+    assert connector.monthly_token_cap == 50_000
+
+
+def test_set_monthly_cap_accepts_none_to_clear(db):
+    user = _make_dj(db, username="capclear")
+    connector = _make_connector(db, user, monthly_token_cap=10)
+    set_monthly_cap(connector, None)
+    assert connector.monthly_token_cap is None
+
+
+def test_set_monthly_cap_rejects_negative(db):
+    user = _make_dj(db, username="capneg")
+    connector = _make_connector(db, user)
+    with pytest.raises(ValueError):
+        set_monthly_cap(connector, -1)
+
+
+# --- Gateway pre-flight enforcement ------------------------------------------
+
+
+@pytest.mark.asyncio
+async def test_dispatch_allows_when_under_cap(db):
+    user = _make_dj(db, username="undercap")
+    connector = _make_connector(db, user, monthly_token_cap=1_000)
+    _log(db, connector.id, tokens_in=100, tokens_out=100)  # 200 used, under 1000
+
+    fake = ChatResponse(
+        text="ok",
+        tool_calls=[],
+        stop_reason="end_turn",
+        usage=TokenUsage(prompt=5, completion=2),
+    )
+    with patch.object(OpenAIApiKeyAdapter, "chat", new=AsyncMock(return_value=fake)):
+        resp = await Gateway.dispatch(db, user, _req(), purpose="test")
+    assert resp.text == "ok"
+
+
+@pytest.mark.asyncio
+async def test_dispatch_refuses_when_cap_reached(db):
+    user = _make_dj(db, username="atcap")
+    connector = _make_connector(db, user, monthly_token_cap=200)
+    _log(db, connector.id, tokens_in=150, tokens_out=50)  # 200 used, == cap
+
+    # The adapter must NOT be called — refusal is pre-flight.
+    chat_mock = AsyncMock()
+    with patch.object(OpenAIApiKeyAdapter, "chat", new=chat_mock):
+        with pytest.raises(QuotaCapReached):
+            await Gateway.dispatch(db, user, _req(), purpose="test")
+    chat_mock.assert_not_called()
+
+
+@pytest.mark.asyncio
+async def test_dispatch_unlimited_when_cap_none(db):
+    user = _make_dj(db, username="nolimit")
+    connector = _make_connector(db, user, monthly_token_cap=None)
+    _log(db, connector.id, tokens_in=10_000, tokens_out=10_000)
+
+    fake = ChatResponse(
+        text="ok",
+        tool_calls=[],
+        stop_reason="end_turn",
+        usage=TokenUsage(prompt=1, completion=1),
+    )
+    with patch.object(OpenAIApiKeyAdapter, "chat", new=AsyncMock(return_value=fake)):
+        resp = await Gateway.dispatch(db, user, _req(), purpose="test")
+    assert resp.text == "ok"
+
+
+# --- API endpoint surfaces QuotaCapReached as a 429 with DJ-facing message ---
+
+
+def test_llm_recommendation_endpoint_returns_429_when_cap_reached(
+    client, db, test_user, test_event, auth_headers
+):
+    """The /recommendations/llm endpoint maps QuotaCapReached to a 429 with the
+    fixed DJ-facing message (issue #339), not the generic 502 catch-all."""
+    # The endpoint requires a connected music service on the event owner.
+    test_user.tidal_access_token = "fake-tidal-token"  # noqa: S105 (test stub)
+    db.commit()
+
+    with (
+        patch(
+            "app.services.recommendation.llm_hooks.is_llm_available",
+            return_value=True,
+        ),
+        patch(
+            "app.services.recommendation.service.generate_recommendations_from_llm",
+            new=AsyncMock(
+                side_effect=QuotaCapReached(
+                    "Your monthly token cap is reached. Contact your admin to raise it."
+                )
+            ),
+        ),
+    ):
+        resp = client.post(
+            f"/api/events/{test_event.code}/recommendations/llm",
+            headers=auth_headers,
+            json={"prompt": "more energy"},
+        )
+
+    assert resp.status_code == 429
+    assert "monthly token cap is reached" in resp.json()["detail"].lower()
diff --git a/server/tests/test_llm_recommendation_via_gateway.py b/server/tests/test_llm_recommendation_via_gateway.py
new file mode 100644
index 00000000..86a0d40e
--- /dev/null
+++ b/server/tests/test_llm_recommendation_via_gateway.py
@@ -0,0 +1,182 @@
+"""Regression: recommendation engine produces canonical output when routed
+through the LLM gateway.
+
+The gateway is the sole credential path — the legacy direct-Anthropic env-var
+fallback was removed in #343. These tests pin that gateway-dispatched output is
+identical to a direct parse of the equivalent provider response, and that
+``call_llm`` now requires a ``db`` session.
+"""
+
+from __future__ import annotations
+
+import json
+from unittest.mock import AsyncMock, patch
+
+import pytest
+
+from app.services.llm.base import ChatResponse, TokenUsage, ToolCall
+from app.services.recommendation.llm_client import call_llm
+from app.services.recommendation.scorer import EventProfile
+
+
+@pytest.fixture
+def event_profile() -> EventProfile:
+    return EventProfile(
+        avg_bpm=128.0,
+        bpm_range=(120.0, 134.0),
+        dominant_keys=["8A", "9A"],
+        dominant_genres=["Tech House"],
+        track_count=10,
+    )
+
+
+GATEWAY_RESPONSE = ChatResponse(
+    text="",
+    tool_calls=[
+        ToolCall(
+            id="tu_1",
+            name="search_queries",
+            input={
+                "queries": [
+                    {
+                        "search_query": "deadmau5 progressive house",
+                        "target_bpm": 128.0,
+                        "target_key": "8A",
+                        "target_genre": "Progressive House",
+                        "reasoning": "Anchor track style",
+                    },
+                    {
+                        "search_query": "eric prydz",
+                        "reasoning": "Similar artist",
+                    },
+                ]
+            },
+        )
+    ],
+    stop_reason="tool_use",
+    usage=TokenUsage(prompt=50, completion=20),
+)
+
+
+def _legacy_anthropic_response():
+    """Return a mock that mimics the Anthropic SDK response shape."""
+    from types import SimpleNamespace
+
+    tool_block = SimpleNamespace(
+        type="tool_use",
+        name="search_queries",
+        input=GATEWAY_RESPONSE.tool_calls[0].input,
+    )
+    return SimpleNamespace(content=[tool_block])
+
+
+def test_parse_tool_response_propagates_provider_model():
+    """The actual provider model from the gateway response must survive parsing,
+    so the UI badge reflects the connector that ran (not a hardcoded default)."""
+    from app.services.recommendation.llm_client import _parse_tool_response
+
+    resp = ChatResponse(
+        text="",
+        tool_calls=[
+            ToolCall(id="t", name="search_queries", input={"queries": [{"search_query": "x"}]})
+        ],
+        stop_reason="tool_use",
+        model="gpt-5.4-mini",
+    )
+    result = _parse_tool_response(resp)
+    assert result.model == "gpt-5.4-mini"
+    assert result.queries[0].search_query == "x"
+
+
+@pytest.mark.asyncio
+async def test_gateway_path_matches_canonical_parse(db, test_user, event_profile):
+    """The gateway path yields the same canonical ``LLMSuggestionResult`` as a
+    direct parse of the equivalent provider response.
+
+    The legacy direct-Anthropic env-var path was removed in #343 — the connector
+    system is the sole credential source. This pins that the gateway-dispatched
+    output is identical to what ``_parse_tool_response`` produces for the same
+    model output regardless of the (defensive) input shape it receives.
+    """
+    # Insert a connector for the actor so the gateway has something to resolve.
+    from app.models.llm_connector import LlmConnector
+    from app.services.recommendation.llm_client import _parse_tool_response
+
+    connector = LlmConnector(
+        user_id=test_user.id,
+        connector_type="anthropic_apikey",
+        display_name="Test",
+        status="active",
+        credentials=json.dumps({"api_key": "sk-ant-fakefakefakefakefakefakefakefakefakefake"}),
+        model_hint="claude-haiku-4-5-20251001",
+    )
+    db.add(connector)
+    db.commit()
+    db.refresh(connector)
+
+    # Gateway path: mock the adapter's chat method directly.
+    with patch(
+        "app.services.llm.adapters.anthropic_apikey.AnthropicApiKeyAdapter.chat",
+        new=AsyncMock(return_value=GATEWAY_RESPONSE),
+    ):
+        gateway_result = await call_llm(
+            event_profile,
+            "deeper progressive house",
+            db=db,
+            actor=test_user,
+        )
+
+    # Canonical parse of the equivalent Anthropic-SDK-shaped response.
+    canonical_result = _parse_tool_response(_legacy_anthropic_response())
+
+    # Identical structured output regardless of response shape.
+    assert len(gateway_result.queries) == len(canonical_result.queries) == 2
+    for gq, cq in zip(gateway_result.queries, canonical_result.queries):
+        assert gq.search_query == cq.search_query
+        assert gq.target_bpm == cq.target_bpm
+        assert gq.target_key == cq.target_key
+        assert gq.target_genre == cq.target_genre
+        assert gq.reasoning == cq.reasoning
+
+
+@pytest.mark.asyncio
+async def test_call_llm_requires_db(event_profile):
+    """The legacy no-``db`` env-var fallback is gone (#343): callers must supply a
+    db session so the gateway can resolve a connector."""
+    with pytest.raises(ValueError, match="requires a db session"):
+        await call_llm(event_profile, "anything")
+
+
+@pytest.mark.asyncio
+async def test_gateway_routes_gemini_connector(db, test_user, event_profile):
+    """When the active DJ connector is Gemini, the recommendation engine routes
+    through the Gemini adapter and produces structured queries.
+    """
+    from app.models.llm_connector import LlmConnector
+
+    connector = LlmConnector(
+        user_id=test_user.id,
+        connector_type="gemini_apikey",
+        display_name="Gemini",
+        status="active",
+        # Built at runtime so no scanner-matchable "AIza…" literal is committed.
+        credentials=json.dumps({"api_key": "AIza" + ("A" * 35)}),
+        model_hint="gemini-2.5-flash",
+    )
+    db.add(connector)
+    db.commit()
+    db.refresh(connector)
+
+    with patch(
+        "app.services.llm.adapters.gemini_apikey.GeminiApiKeyAdapter.chat",
+        new=AsyncMock(return_value=GATEWAY_RESPONSE),
+    ):
+        result = await call_llm(
+            event_profile,
+            "deeper progressive house",
+            db=db,
+            actor=test_user,
+        )
+
+    assert len(result.queries) == 2
+    assert result.queries[0].search_query == "deadmau5 progressive house"
diff --git a/server/tests/test_llm_sigv4.py b/server/tests/test_llm_sigv4.py
new file mode 100644
index 00000000..3b2a19a1
--- /dev/null
+++ b/server/tests/test_llm_sigv4.py
@@ -0,0 +1,78 @@
+"""Tests for the dependency-free AWS SigV4 signer (``services/llm/sigv4.py``).
+
+The signing-key derivation is pinned against AWS's published test vector, and
+a full request signature is pinned to a deterministic fixture so any change to
+the canonicalization or signing logic is caught.
+"""
+
+from __future__ import annotations
+
+from datetime import UTC, datetime
+
+from app.services.llm.sigv4 import _canonicalize_uri, _signing_key, sign_request
+
+
+def test_signing_key_matches_aws_published_vector():
+    # https://docs.aws.amazon.com/general/latest/gr/signature-v4-examples.html
+    key = _signing_key("wJalrXUtnFEMI/K7MDENG+bPxRfiCYEXAMPLEKEY", "20150830", "us-east-1", "iam")
+    assert key.hex() == "c4afb1cc5771d871763a393e44b703571b55cc28424d1a5e86da6ed3c154a4b9"
+
+
+def test_sign_request_is_deterministic_fixture():
+    body = b'{"prompt": "hi"}'
+    headers = sign_request(
+        access_key_id="AKIDEXAMPLE",
+        secret_access_key="wJalrXUtnFEMI/K7MDENG+bPxRfiCYEXAMPLEKEY",
+        region="us-east-1",
+        host="bedrock-runtime.us-east-1.amazonaws.com",
+        canonical_uri="/model/anthropic.claude-3-5-sonnet-20241022-v2:0/invoke",
+        body=body,
+        now=datetime(2025, 1, 1, 0, 0, 0, tzinfo=UTC),
+    )
+    assert headers["X-Amz-Date"] == "20250101T000000Z"
+    assert headers["X-Amz-Content-Sha256"] == (
+        "bbab304eadd046fe16c34bcfe99be2e82011d02a07dfb1974414bd13c0e34720"
+    )
+    assert headers["Authorization"] == (
+        "AWS4-HMAC-SHA256 "
+        "Credential=AKIDEXAMPLE/20250101/us-east-1/bedrock/aws4_request, "
+        "SignedHeaders=content-type;host;x-amz-content-sha256;x-amz-date, "
+        "Signature=8941eee088c2d5ff883e65e9aba29f3b653bea15791a13874201fccefe768fa9"
+    )
+
+
+def test_sign_request_includes_security_token_when_present():
+    headers = sign_request(
+        access_key_id="AKIDEXAMPLE",
+        secret_access_key="secret",
+        region="us-west-2",
+        host="bedrock-runtime.us-west-2.amazonaws.com",
+        canonical_uri="/model/meta.llama3-70b-instruct-v1:0/invoke",
+        body=b"{}",
+        now=datetime(2025, 1, 1, tzinfo=UTC),
+        session_token="FwoGZXIvYXdz",
+    )
+    assert headers["X-Amz-Security-Token"] == "FwoGZXIvYXdz"
+    assert "x-amz-security-token" in headers["Authorization"]
+
+
+def test_signature_changes_when_body_changes():
+    common = dict(
+        access_key_id="AKIDEXAMPLE",
+        secret_access_key="secret",
+        region="us-east-1",
+        host="bedrock-runtime.us-east-1.amazonaws.com",
+        canonical_uri="/model/anthropic.claude-3-5-sonnet-20241022-v2:0/invoke",
+        now=datetime(2025, 1, 1, tzinfo=UTC),
+    )
+    a = sign_request(body=b'{"a":1}', **common)["Authorization"]
+    b = sign_request(body=b'{"a":2}', **common)["Authorization"]
+    assert a != b
+
+
+def test_canonicalize_uri_encodes_colon_in_model_id():
+    # The ':' in "...-v2:0" must be percent-encoded in the canonical URI.
+    encoded = _canonicalize_uri("/model/anthropic.claude-3-5-sonnet-v2:0/invoke")
+    assert "%3A0" in encoded
+    assert encoded.startswith("/model/")
+    assert encoded.endswith("/invoke")
diff --git a/server/tests/test_llm_stream_endpoint.py b/server/tests/test_llm_stream_endpoint.py
new file mode 100644
index 00000000..17ef832a
--- /dev/null
+++ b/server/tests/test_llm_stream_endpoint.py
@@ -0,0 +1,95 @@
+"""SSE stream-test endpoint: auth, ownership, content-type, body shape."""
+
+from __future__ import annotations
+
+import json
+
+from app.models.llm_connector import LlmConnector
+from app.models.user import User
+from app.services.auth import get_password_hash
+from app.services.llm.adapters.openai_apikey import OpenAIApiKeyAdapter
+from app.services.llm.base import ChatResponseChunk, TokenUsage
+
+
+def _make_connector(db, user) -> LlmConnector:
+    row = LlmConnector(
+        user_id=user.id,
+        connector_type="openai_apikey",
+        display_name="Test",
+        status="active",
+        credentials=json.dumps({"api_key": "sk-fake"}),
+        model_hint="gpt-5-mini",
+    )
+    db.add(row)
+    db.commit()
+    db.refresh(row)
+    return row
+
+
+def _parse_sse(body: str) -> list[dict]:
+    return [
+        json.loads(line[len("data:") :].strip())
+        for line in body.splitlines()
+        if line.startswith("data:")
+    ]
+
+
+def test_stream_test_requires_auth(client, db, test_user):
+    connector = _make_connector(db, test_user)
+    resp = client.post(f"/api/llm/connectors/{connector.id}/stream-test")
+    assert resp.status_code == 401
+
+
+def test_stream_test_404_for_unowned(client, db, test_user, auth_headers):
+    other = User(username="other", password_hash=get_password_hash("x123456789"), role="dj")
+    db.add(other)
+    db.commit()
+    db.refresh(other)
+    connector = _make_connector(db, other)
+    resp = client.post(f"/api/llm/connectors/{connector.id}/stream-test", headers=auth_headers)
+    assert resp.status_code == 404
+
+
+def test_stream_test_streams_chunks(client, db, test_user, auth_headers, monkeypatch):
+    connector = _make_connector(db, test_user)
+
+    async def _fake_stream(self, request):
+        yield ChatResponseChunk(text_delta="Hi")
+        yield ChatResponseChunk(text_delta=" there")
+        yield ChatResponseChunk(
+            stop_reason="end_turn", usage=TokenUsage(prompt=2, completion=2), done=True
+        )
+
+    monkeypatch.setattr(OpenAIApiKeyAdapter, "stream", _fake_stream)
+
+    resp = client.post(f"/api/llm/connectors/{connector.id}/stream-test", headers=auth_headers)
+    assert resp.status_code == 200
+    assert resp.headers["content-type"].startswith("text/event-stream")
+
+    payloads = _parse_sse(resp.text)
+    text = "".join(p.get("text_delta", "") for p in payloads)
+    assert "Hi there" in text
+    assert any(p.get("done") for p in payloads)
+
+
+def test_stream_test_error_emits_sanitised_error_frame(
+    client, db, test_user, auth_headers, monkeypatch
+):
+    from app.services.llm.exceptions import ProviderUnavailable
+
+    connector = _make_connector(db, test_user)
+
+    async def _boom(self, request):
+        raise ProviderUnavailable("upstream secret detail")
+        yield  # pragma: no cover
+
+    monkeypatch.setattr(OpenAIApiKeyAdapter, "stream", _boom)
+
+    resp = client.post(f"/api/llm/connectors/{connector.id}/stream-test", headers=auth_headers)
+    assert resp.status_code == 200
+    # An error frame is emitted as event: error with a sanitised code only.
+    body = resp.text
+    assert "event: error" in body
+    assert "ProviderUnavailable" in body
+    # The raw upstream message is never leaked.
+    assert "upstream secret detail" not in body
diff --git a/server/tests/test_llm_streaming.py b/server/tests/test_llm_streaming.py
new file mode 100644
index 00000000..710f910b
--- /dev/null
+++ b/server/tests/test_llm_streaming.py
@@ -0,0 +1,677 @@
+"""Tests for streaming primitives: ChatResponseChunk + SSE helpers + adapters."""
+
+from __future__ import annotations
+
+import json as _json
+
+import pytest
+
+from app.models.llm_connector import LlmConnector
+from app.services.llm.base import (
+    ChatRequest,
+    ChatResponseChunk,
+    LlmAdapter,
+    Message,
+    TokenUsage,
+    ToolCallDelta,
+)
+from app.services.llm.exceptions import StreamingUnsupported
+
+
+# ---------------------------------------------------------------------------
+# Task 1 — ChatResponseChunk + ToolCallDelta models
+# ---------------------------------------------------------------------------
+def test_chunk_defaults_are_empty():
+    chunk = ChatResponseChunk()
+    assert chunk.text_delta == ""
+    assert chunk.tool_call_deltas == []
+    assert chunk.stop_reason is None
+    assert chunk.usage is None
+    assert chunk.done is False
+
+
+def test_chunk_final_carries_stop_reason_and_usage():
+    chunk = ChatResponseChunk(
+        stop_reason="end_turn",
+        usage=TokenUsage(prompt=3, completion=5),
+        done=True,
+    )
+    assert chunk.done is True
+    assert chunk.stop_reason == "end_turn"
+    assert chunk.usage.completion == 5
+
+
+def test_tool_call_delta_fragment_shape():
+    delta = ToolCallDelta(index=0, id="call_1", name="search", input_json_fragment='{"q":')
+    assert delta.index == 0
+    assert delta.id == "call_1"
+    assert delta.name == "search"
+    assert delta.input_json_fragment == '{"q":'
+
+
+# ---------------------------------------------------------------------------
+# Task 2 — default stream() raises StreamingUnsupported
+# ---------------------------------------------------------------------------
+class _BareAdapter(LlmAdapter):
+    connector_type = "bare"
+
+    async def chat(self, request):  # pragma: no cover
+        raise NotImplementedError
+
+    async def health_check(self):  # pragma: no cover
+        raise NotImplementedError
+
+
+async def test_default_stream_raises_streaming_unsupported():
+    adapter = _BareAdapter(connector=None)
+    req = ChatRequest(messages=[Message(role="user", content="hi")])
+    with pytest.raises(StreamingUnsupported):
+        async for _ in adapter.stream(req):
+            pass
+
+
+# ---------------------------------------------------------------------------
+# Task 3 — OpenAI streaming event parser
+# ---------------------------------------------------------------------------
+def test_parse_openai_stream_line_text():
+    from app.services.llm.streaming import parse_openai_stream_event
+
+    chunk = parse_openai_stream_event(
+        {"choices": [{"delta": {"content": "Hello"}, "finish_reason": None}]}
+    )
+    assert chunk is not None
+    assert chunk.text_delta == "Hello"
+    assert chunk.tool_call_deltas == []
+    assert chunk.done is False
+
+
+def test_parse_openai_stream_line_tool_call_fragment():
+    from app.services.llm.streaming import parse_openai_stream_event
+
+    chunk = parse_openai_stream_event(
+        {
+            "choices": [
+                {
+                    "delta": {
+                        "tool_calls": [
+                            {
+                                "index": 0,
+                                "id": "call_1",
+                                "function": {"name": "search", "arguments": '{"q":'},
+                            }
+                        ]
+                    },
+                    "finish_reason": None,
+                }
+            ]
+        }
+    )
+    assert chunk is not None
+    assert chunk.text_delta == ""
+    assert len(chunk.tool_call_deltas) == 1
+    d = chunk.tool_call_deltas[0]
+    assert d.index == 0 and d.id == "call_1" and d.name == "search"
+    assert d.input_json_fragment == '{"q":'
+
+
+def test_parse_openai_stream_line_finish():
+    from app.services.llm.streaming import parse_openai_stream_event
+
+    chunk = parse_openai_stream_event(
+        {
+            "choices": [{"delta": {}, "finish_reason": "tool_calls"}],
+            "usage": {"prompt_tokens": 7, "completion_tokens": 11},
+        }
+    )
+    assert chunk is not None
+    assert chunk.done is True
+    assert chunk.stop_reason == "tool_use"
+    assert chunk.usage is not None and chunk.usage.prompt == 7
+
+
+def test_parse_openai_stream_line_role_only_returns_none():
+    from app.services.llm.streaming import parse_openai_stream_event
+
+    chunk = parse_openai_stream_event(
+        {"choices": [{"delta": {"role": "assistant"}, "finish_reason": None}]}
+    )
+    assert chunk is None
+
+
+def test_parse_openai_stream_line_unknown_finish_reason_maps_error():
+    from app.services.llm.streaming import parse_openai_stream_event
+
+    chunk = parse_openai_stream_event(
+        {"choices": [{"delta": {}, "finish_reason": "content_filter"}]}
+    )
+    assert chunk is not None
+    assert chunk.done is True
+    assert chunk.stop_reason == "error"
+
+
+def test_parse_openai_stream_tolerates_non_numeric_tool_index():
+    """A null/non-numeric tool-call ``index`` must not abort the stream (#379)."""
+    from app.services.llm.streaming import parse_openai_stream_event
+
+    chunk = parse_openai_stream_event(
+        {
+            "choices": [
+                {
+                    "delta": {
+                        "tool_calls": [
+                            {
+                                "index": None,
+                                "id": "call_1",
+                                "function": {"name": "search", "arguments": "{}"},
+                            }
+                        ]
+                    },
+                    "finish_reason": None,
+                }
+            ]
+        }
+    )
+    assert chunk is not None
+    assert chunk.tool_call_deltas[0].index == 0  # fell back to default, no raise
+
+
+def test_parse_openai_stream_tolerates_non_numeric_usage():
+    """Malformed/null token counts must not abort the terminal chunk (#379)."""
+    from app.services.llm.streaming import parse_openai_stream_event
+
+    chunk = parse_openai_stream_event(
+        {
+            "choices": [{"delta": {}, "finish_reason": "stop"}],
+            "usage": {"prompt_tokens": None, "completion_tokens": "oops"},
+        }
+    )
+    assert chunk is not None
+    assert chunk.done is True
+    # Non-numeric counts coerce to 0 rather than raising mid-stream; the terminal
+    # chunk is still delivered with a (zeroed) usage block.
+    assert chunk.usage is not None
+    assert chunk.usage.prompt == 0
+    assert chunk.usage.completion == 0
+
+
+def test_parse_openai_stream_usage_only_terminal_event_preserved():
+    """A usage-only terminal event (empty ``choices``) must not be dropped (#354).
+
+    With ``stream_options.include_usage`` OpenAI emits a final frame carrying only
+    ``usage`` and ``choices: []`` — no delta, no ``finish_reason``. Previously the
+    parser returned ``None`` for it (``done`` is driven solely by ``finish_reason``)
+    so token accounting was silently lost. It must now yield a usage-bearing chunk.
+    """
+    from app.services.llm.streaming import parse_openai_stream_event
+
+    chunk = parse_openai_stream_event(
+        {"choices": [], "usage": {"prompt_tokens": 9, "completion_tokens": 4}}
+    )
+    assert chunk is not None
+    assert chunk.done is False
+    assert chunk.text_delta == ""
+    assert chunk.tool_call_deltas == []
+    assert chunk.usage is not None
+    assert chunk.usage.prompt == 9
+    assert chunk.usage.completion == 4
+
+
+# ---------------------------------------------------------------------------
+# Task 4 — httpx OpenAI streaming generator
+# ---------------------------------------------------------------------------
+class _FakeStreamResponse:
+    """Minimal stand-in for an httpx streaming response."""
+
+    def __init__(self, lines: list[str], status_code: int = 200):
+        self._lines = lines
+        self.status_code = status_code
+        self.headers: dict[str, str] = {}
+
+    async def aiter_lines(self):
+        for line in self._lines:
+            yield line
+
+    async def aread(self):
+        return b""
+
+
+class _FakeStreamClient:
+    def __init__(self, response):
+        self._response = response
+
+    async def __aenter__(self):
+        return self
+
+    async def __aexit__(self, *exc):
+        return False
+
+    def stream(self, method, url, **kwargs):
+        client = self
+
+        class _Ctx:
+            async def __aenter__(self_inner):
+                return client._response
+
+            async def __aexit__(self_inner, *exc):
+                return False
+
+        return _Ctx()
+
+
+async def test_stream_openai_chat_yields_text_then_final(monkeypatch):
+    from app.services.llm.adapters import _httpx_openai
+
+    # SSE events are blank-line delimited (``aiter_lines`` yields "" for a blank
+    # line). Real OpenAI frames each ``data:`` line that way.
+    sse_lines = [
+        'data: {"choices":[{"delta":{"role":"assistant"},"finish_reason":null}]}',
+        "",
+        'data: {"choices":[{"delta":{"content":"Hi"},"finish_reason":null}]}',
+        "",
+        'data: {"choices":[{"delta":{"content":" there"},"finish_reason":null}]}',
+        "",
+        'data: {"choices":[{"delta":{},"finish_reason":"stop"}],'
+        '"usage":{"prompt_tokens":4,"completion_tokens":2}}',
+        "",
+        "data: [DONE]",
+        "",
+    ]
+    fake_resp = _FakeStreamResponse(sse_lines)
+    monkeypatch.setattr(
+        _httpx_openai.httpx, "AsyncClient", lambda *a, **k: _FakeStreamClient(fake_resp)
+    )
+
+    req = ChatRequest(messages=[Message(role="user", content="hi")], model="gpt-x")
+    chunks = []
+    async for c in _httpx_openai.stream_openai_chat(
+        base_url="https://api.openai.com/v1",
+        api_key="sk-test",
+        request=req,
+        fallback_model="gpt-x",
+    ):
+        chunks.append(c)
+
+    text = "".join(c.text_delta for c in chunks)
+    assert text == "Hi there"
+    assert chunks[-1].done is True
+    assert chunks[-1].stop_reason == "end_turn"
+    assert chunks[-1].usage.prompt == 4
+
+
+async def test_stream_openai_chat_maps_auth_error(monkeypatch):
+    from app.services.llm.adapters import _httpx_openai
+    from app.services.llm.exceptions import AuthInvalid
+
+    fake_resp = _FakeStreamResponse([], status_code=401)
+    monkeypatch.setattr(
+        _httpx_openai.httpx, "AsyncClient", lambda *a, **k: _FakeStreamClient(fake_resp)
+    )
+
+    req = ChatRequest(messages=[Message(role="user", content="hi")], model="gpt-x")
+    with pytest.raises(AuthInvalid):
+        async for _ in _httpx_openai.stream_openai_chat(
+            base_url="https://api.openai.com/v1",
+            api_key="sk-test",
+            request=req,
+            fallback_model="gpt-x",
+        ):
+            pass
+
+
+async def test_stream_openai_chat_malformed_data_raises(monkeypatch):
+    """A malformed ``data:`` frame surfaces a typed error, not a silent truncation (#379)."""
+    from app.services.llm.adapters import _httpx_openai
+    from app.services.llm.exceptions import ToolTranslationError
+
+    sse_lines = [
+        'data: {"choices":[{"delta":{"content":"Hi"},"finish_reason":null}]}',
+        "",
+        "data: {not valid json",
+        "",
+    ]
+    fake_resp = _FakeStreamResponse(sse_lines)
+    monkeypatch.setattr(
+        _httpx_openai.httpx, "AsyncClient", lambda *a, **k: _FakeStreamClient(fake_resp)
+    )
+
+    req = ChatRequest(messages=[Message(role="user", content="hi")], model="gpt-x")
+    collected = []
+    with pytest.raises(ToolTranslationError):
+        async for c in _httpx_openai.stream_openai_chat(
+            base_url="https://api.openai.com/v1",
+            api_key="sk-test",
+            request=req,
+            fallback_model="gpt-x",
+        ):
+            collected.append(c)
+    # The valid leading chunk was still delivered before the fault surfaced.
+    assert collected and collected[0].text_delta == "Hi"
+
+
+async def test_stream_openai_chat_reassembles_multiline_data_event(monkeypatch):
+    """One SSE event split across multiple ``data:`` lines is reassembled (#354).
+
+    SSE permits a single event to span several ``data:`` lines (joined on
+    newlines); an OpenAI-compatible server may emit JSON that way. Decoding each
+    line on its own would raise on the first fragment and truncate the stream, so
+    the parser must buffer the whole event before JSON-decoding it.
+    """
+    from app.services.llm.adapters import _httpx_openai
+
+    sse_lines = [
+        # A single JSON object wrapped across two data lines — valid only once
+        # the two payloads are rejoined with a newline.
+        'data: {"choices":[{"delta":{"content":"Hi there"},',
+        'data: "finish_reason":null}]}',
+        "",
+        "data: [DONE]",
+        "",
+    ]
+    fake_resp = _FakeStreamResponse(sse_lines)
+    monkeypatch.setattr(
+        _httpx_openai.httpx, "AsyncClient", lambda *a, **k: _FakeStreamClient(fake_resp)
+    )
+
+    req = ChatRequest(messages=[Message(role="user", content="hi")], model="gpt-x")
+    chunks = [
+        c
+        async for c in _httpx_openai.stream_openai_chat(
+            base_url="https://api.openai.com/v1",
+            api_key="sk-test",
+            request=req,
+            fallback_model="gpt-x",
+        )
+    ]
+    assert "".join(c.text_delta for c in chunks) == "Hi there"
+
+
+# ---------------------------------------------------------------------------
+# Task 5 — OpenAI platform + compatible adapter stream()
+# ---------------------------------------------------------------------------
+async def test_openai_apikey_adapter_stream(monkeypatch):
+    from app.services.llm.adapters import openai_apikey
+
+    captured = {}
+
+    async def fake_stream(**kwargs):
+        captured.update(kwargs)
+        yield ChatResponseChunk(text_delta="ok", done=False)
+        yield ChatResponseChunk(stop_reason="end_turn", done=True)
+
+    monkeypatch.setattr(openai_apikey, "stream_openai_chat", fake_stream)
+
+    connector = LlmConnector(
+        user_id=1,
+        connector_type="openai_apikey",
+        display_name="x",
+        status="active",
+        credentials=_json.dumps({"api_key": "sk-test"}),
+        model_hint="gpt-x",
+    )
+    adapter = openai_apikey.OpenAIApiKeyAdapter(connector)
+    req = ChatRequest(messages=[Message(role="user", content="hi")])
+    chunks = [c async for c in adapter.stream(req)]
+    assert [c.text_delta for c in chunks] == ["ok", ""]
+    assert chunks[-1].done is True
+    assert captured["max_tokens_field"] == "max_completion_tokens"
+    assert captured["api_key"] == "sk-test"
+
+
+async def test_openai_compatible_adapter_stream(monkeypatch):
+    from app.services.llm.adapters import openai_compatible
+
+    async def fake_stream(**kwargs):
+        assert kwargs["base_url"] == "http://127.0.0.1:1234/v1"
+        yield ChatResponseChunk(text_delta="hey", done=False)
+        yield ChatResponseChunk(stop_reason="end_turn", done=True)
+
+    monkeypatch.setattr(openai_compatible, "stream_openai_chat", fake_stream)
+
+    connector = LlmConnector(
+        user_id=1,
+        connector_type="openai_compatible",
+        display_name="local",
+        status="active",
+        credentials=_json.dumps({"base_url": "http://127.0.0.1:1234/v1"}),
+        model_hint="local-model",
+    )
+    adapter = openai_compatible.OpenAICompatibleAdapter(connector)
+    req = ChatRequest(messages=[Message(role="user", content="hi")])
+    chunks = [c async for c in adapter.stream(req)]
+    assert "".join(c.text_delta for c in chunks) == "hey"
+    assert chunks[-1].done is True
+
+
+# ---------------------------------------------------------------------------
+# Task 6 — Anthropic adapter stream()
+# ---------------------------------------------------------------------------
+class _FakeEvent:
+    """Stand-in for an anthropic SDK stream event (attribute access)."""
+
+    def __init__(self, **kw):
+        for k, v in kw.items():
+            setattr(self, k, v)
+
+
+class _FakeAnthropicStream:
+    def __init__(self, events):
+        self._events = events
+
+    async def __aenter__(self):
+        return self
+
+    async def __aexit__(self, *exc):
+        return False
+
+    async def __aiter__(self):
+        for e in self._events:
+            yield e
+
+
+def _anthropic_text_events():
+    return [
+        _FakeEvent(type="message_start"),
+        _FakeEvent(
+            type="content_block_start",
+            index=0,
+            content_block=_FakeEvent(type="text", text=""),
+        ),
+        _FakeEvent(
+            type="content_block_delta",
+            index=0,
+            delta=_FakeEvent(type="text_delta", text="Hel"),
+        ),
+        _FakeEvent(
+            type="content_block_delta",
+            index=0,
+            delta=_FakeEvent(type="text_delta", text="lo"),
+        ),
+        _FakeEvent(type="content_block_stop", index=0),
+        _FakeEvent(
+            type="message_delta",
+            delta=_FakeEvent(stop_reason="end_turn"),
+            usage=_FakeEvent(output_tokens=5),
+        ),
+        _FakeEvent(type="message_stop"),
+    ]
+
+
+def _anthropic_tool_events():
+    return [
+        _FakeEvent(type="message_start"),
+        _FakeEvent(
+            type="content_block_start",
+            index=0,
+            content_block=_FakeEvent(type="tool_use", id="toolu_1", name="search"),
+        ),
+        _FakeEvent(
+            type="content_block_delta",
+            index=0,
+            delta=_FakeEvent(type="input_json_delta", partial_json='{"q":'),
+        ),
+        _FakeEvent(
+            type="content_block_delta",
+            index=0,
+            delta=_FakeEvent(type="input_json_delta", partial_json='"house"}'),
+        ),
+        _FakeEvent(type="content_block_stop", index=0),
+        _FakeEvent(
+            type="message_delta",
+            delta=_FakeEvent(stop_reason="tool_use"),
+            usage=_FakeEvent(output_tokens=9),
+        ),
+        _FakeEvent(type="message_stop"),
+    ]
+
+
+def _patch_fake_anthropic(monkeypatch, events):
+    from app.services.llm.adapters import anthropic_apikey
+
+    class _FakeMessages:
+        def stream(self, **kwargs):
+            return _FakeAnthropicStream(events)
+
+    class _FakeClient:
+        def __init__(self, *a, **k):
+            self.messages = _FakeMessages()
+
+        async def __aenter__(self):
+            return self
+
+        async def __aexit__(self, *exc):
+            return False
+
+    monkeypatch.setattr(anthropic_apikey, "AsyncAnthropic", _FakeClient)
+
+
+def _anthropic_connector():
+    return LlmConnector(
+        user_id=1,
+        connector_type="anthropic_apikey",
+        display_name="claude",
+        status="active",
+        credentials=_json.dumps({"api_key": "sk-ant-test"}),
+        model_hint="claude-x",
+    )
+
+
+async def test_anthropic_adapter_stream_text(monkeypatch):
+    from app.services.llm.adapters import anthropic_apikey
+
+    _patch_fake_anthropic(monkeypatch, _anthropic_text_events())
+    adapter = anthropic_apikey.AnthropicApiKeyAdapter(_anthropic_connector())
+    req = ChatRequest(messages=[Message(role="user", content="hi")])
+    chunks = [c async for c in adapter.stream(req)]
+    assert "".join(c.text_delta for c in chunks) == "Hello"
+    assert chunks[-1].done is True
+    assert chunks[-1].stop_reason == "end_turn"
+    assert chunks[-1].usage.completion == 5
+
+
+async def test_anthropic_adapter_stream_tool_use(monkeypatch):
+    from app.services.llm.adapters import anthropic_apikey
+
+    _patch_fake_anthropic(monkeypatch, _anthropic_tool_events())
+    adapter = anthropic_apikey.AnthropicApiKeyAdapter(_anthropic_connector())
+    req = ChatRequest(messages=[Message(role="user", content="hi")])
+    chunks = [c async for c in adapter.stream(req)]
+
+    frags = [d for c in chunks for d in c.tool_call_deltas]
+    assert frags[0].id == "toolu_1" and frags[0].name == "search"
+    joined = "".join(d.input_json_fragment for d in frags)
+    assert _json.loads(joined) == {"q": "house"}
+    assert chunks[-1].done is True
+    assert chunks[-1].stop_reason == "tool_use"
+
+
+@pytest.mark.parametrize("native_stop", ["refusal", "pause_turn", "something_new"])
+async def test_anthropic_stream_unmodelled_stop_matches_chat(monkeypatch, native_stop):
+    """Stream + chat must canonicalise unmodelled stop_reasons identically (#379).
+
+    Anthropic can emit ``pause_turn`` / ``refusal`` which we don't model
+    canonically; both paths must map them to ``"error"`` (not ``"end_turn"``).
+    """
+    from app.services.llm.adapters import anthropic_apikey
+    from app.services.llm.tool_translation import normalise_anthropic_stop_reason
+
+    events = [
+        _FakeEvent(type="message_start"),
+        _FakeEvent(
+            type="content_block_start", index=0, content_block=_FakeEvent(type="text", text="")
+        ),
+        _FakeEvent(
+            type="content_block_delta", index=0, delta=_FakeEvent(type="text_delta", text="x")
+        ),
+        _FakeEvent(
+            type="message_delta",
+            delta=_FakeEvent(stop_reason=native_stop),
+            usage=_FakeEvent(output_tokens=1),
+        ),
+        _FakeEvent(type="message_stop"),
+    ]
+    _patch_fake_anthropic(monkeypatch, events)
+    adapter = anthropic_apikey.AnthropicApiKeyAdapter(_anthropic_connector())
+    req = ChatRequest(messages=[Message(role="user", content="hi")])
+    chunks = [c async for c in adapter.stream(req)]
+
+    assert chunks[-1].done is True
+    # The streamed canonical stop_reason equals what the buffered path would give.
+    assert chunks[-1].stop_reason == normalise_anthropic_stop_reason(native_stop)
+    assert chunks[-1].stop_reason == "error"
+
+
+def test_translate_anthropic_event_handles_plain_dicts():
+    """Dict-backed events (not only SDK objects) must yield deltas (#354).
+
+    ``_translate_anthropic_event``'s docstring promises dict support, but the
+    original implementation read fields via ``getattr`` only — so dict events
+    silently produced empty chunks. Each branch must honour dict access.
+    """
+    from app.services.llm.adapters.anthropic_apikey import _translate_anthropic_event
+
+    # tool_use block start
+    chunk, saw_tool, stop, out_tokens = _translate_anthropic_event(
+        {
+            "type": "content_block_start",
+            "index": 0,
+            "content_block": {"type": "tool_use", "id": "toolu_1", "name": "search"},
+        }
+    )
+    assert saw_tool is True
+    assert chunk is not None
+    assert chunk.tool_call_deltas[0].id == "toolu_1"
+    assert chunk.tool_call_deltas[0].name == "search"
+
+    # text delta
+    chunk, _saw, _stop, _ot = _translate_anthropic_event(
+        {
+            "type": "content_block_delta",
+            "index": 0,
+            "delta": {"type": "text_delta", "text": "Hello"},
+        }
+    )
+    assert chunk is not None
+    assert chunk.text_delta == "Hello"
+
+    # input_json (tool argument) delta
+    chunk, _saw, _stop, _ot = _translate_anthropic_event(
+        {
+            "type": "content_block_delta",
+            "index": 0,
+            "delta": {"type": "input_json_delta", "partial_json": '{"q":'},
+        }
+    )
+    assert chunk is not None
+    assert chunk.tool_call_deltas[0].input_json_fragment == '{"q":'
+
+    # message_delta carries stop_reason + usage
+    chunk, _saw, stop, out_tokens = _translate_anthropic_event(
+        {
+            "type": "message_delta",
+            "delta": {"stop_reason": "end_turn"},
+            "usage": {"output_tokens": 7},
+        }
+    )
+    assert chunk is None
+    assert stop == "end_turn"
+    assert out_tokens == 7
diff --git a/server/tests/test_llm_tool_translation.py b/server/tests/test_llm_tool_translation.py
new file mode 100644
index 00000000..44ba644f
--- /dev/null
+++ b/server/tests/test_llm_tool_translation.py
@@ -0,0 +1,417 @@
+"""Tests for canonical ToolSpec <-> per-provider translation + response parsing."""
+
+import pytest
+
+from app.services.llm.base import ToolSpec
+from app.services.llm.exceptions import ToolTranslationError
+from app.services.llm.tool_translation import (
+    parse_anthropic_response,
+    parse_gemini_response,
+    parse_openai_response,
+    to_anthropic_tools,
+    to_gemini_tools,
+    to_openai_tools,
+)
+
+TOOL = ToolSpec(
+    name="rank_recommendations",
+    description="Rank the candidates",
+    input_schema={
+        "type": "object",
+        "properties": {"ids": {"type": "array", "items": {"type": "string"}}},
+        "required": ["ids"],
+    },
+)
+
+
+class TestOpenAITools:
+    def test_returns_none_for_no_tools(self):
+        tools, choice = to_openai_tools(None, None)
+        assert tools is None
+        assert choice is None
+
+    def test_translates_tools(self):
+        tools, choice = to_openai_tools([TOOL], None)
+        assert tools is not None
+        assert tools[0]["type"] == "function"
+        assert tools[0]["function"]["name"] == "rank_recommendations"
+        assert tools[0]["function"]["parameters"] == TOOL.input_schema
+        assert choice is None
+
+    def test_force_tool(self):
+        tools, choice = to_openai_tools([TOOL], "rank_recommendations")
+        assert choice == {
+            "type": "function",
+            "function": {"name": "rank_recommendations"},
+        }
+
+    def test_force_tool_not_in_list(self):
+        with pytest.raises(ToolTranslationError):
+            to_openai_tools([TOOL], "does_not_exist")
+
+
+class TestAnthropicTools:
+    def test_returns_none_for_no_tools(self):
+        tools, choice = to_anthropic_tools(None, None)
+        assert tools is None
+        assert choice is None
+
+    def test_translates_tools(self):
+        tools, choice = to_anthropic_tools([TOOL], None)
+        assert tools is not None
+        assert tools[0]["name"] == "rank_recommendations"
+        assert tools[0]["input_schema"] == TOOL.input_schema
+        assert choice is None
+
+    def test_force_tool(self):
+        tools, choice = to_anthropic_tools([TOOL], "rank_recommendations")
+        assert choice == {"type": "tool", "name": "rank_recommendations"}
+
+
+class TestGeminiTools:
+    def test_returns_none_for_no_tools(self):
+        tools, choice = to_gemini_tools(None, None)
+        assert tools is None
+        assert choice is None
+
+    def test_translates_tools(self):
+        tools, choice = to_gemini_tools([TOOL], None)
+        assert tools is not None
+        # Gemini nests declarations under a single tools entry.
+        assert tools[0]["function_declarations"][0]["name"] == "rank_recommendations"
+        assert tools[0]["function_declarations"][0]["parameters"] == TOOL.input_schema
+        assert choice is None
+
+    def test_force_tool(self):
+        tools, choice = to_gemini_tools([TOOL], "rank_recommendations")
+        assert choice == {
+            "function_calling_config": {
+                "mode": "ANY",
+                "allowed_function_names": ["rank_recommendations"],
+            }
+        }
+
+    def test_force_tool_not_in_list(self):
+        with pytest.raises(ToolTranslationError):
+            to_gemini_tools([TOOL], "does_not_exist")
+
+
+class TestParseGeminiResponse:
+    def test_text_response(self):
+        body = {
+            "candidates": [
+                {
+                    "content": {"role": "model", "parts": [{"text": "hello"}]},
+                    "finishReason": "STOP",
+                }
+            ],
+            "usageMetadata": {"promptTokenCount": 2, "candidatesTokenCount": 1},
+            "modelVersion": "gemini-2.5-flash",
+        }
+        resp = parse_gemini_response(body)
+        assert resp.text == "hello"
+        assert resp.stop_reason == "end_turn"
+        assert resp.tool_calls == []
+        assert resp.usage.prompt == 2
+        assert resp.usage.completion == 1
+        assert resp.model == "gemini-2.5-flash"
+
+    def test_function_call(self):
+        body = {
+            "candidates": [
+                {
+                    "content": {
+                        "role": "model",
+                        "parts": [
+                            {
+                                "functionCall": {
+                                    "name": "rank_recommendations",
+                                    "args": {"ids": ["a", "b"]},
+                                }
+                            }
+                        ],
+                    },
+                    "finishReason": "STOP",
+                }
+            ],
+            "usageMetadata": {"promptTokenCount": 10, "candidatesTokenCount": 5},
+        }
+        resp = parse_gemini_response(body)
+        assert resp.stop_reason == "tool_use"
+        assert len(resp.tool_calls) == 1
+        assert resp.tool_calls[0].name == "rank_recommendations"
+        assert resp.tool_calls[0].input == {"ids": ["a", "b"]}
+        # No native id from Gemini — falls back to the function name.
+        assert resp.tool_calls[0].id == "rank_recommendations"
+
+    def test_mixed_text_and_function_call(self):
+        body = {
+            "candidates": [
+                {
+                    "content": {
+                        "parts": [
+                            {"text": "Let me rank these."},
+                            {"functionCall": {"name": "rank", "args": {"ids": ["x"]}}},
+                        ]
+                    },
+                    "finishReason": "STOP",
+                }
+            ]
+        }
+        resp = parse_gemini_response(body)
+        assert resp.text == "Let me rank these."
+        assert resp.stop_reason == "tool_use"
+        assert resp.tool_calls[0].input == {"ids": ["x"]}
+
+    def test_max_tokens(self):
+        body = {
+            "candidates": [{"content": {"parts": [{"text": "..."}]}, "finishReason": "MAX_TOKENS"}]
+        }
+        resp = parse_gemini_response(body)
+        assert resp.stop_reason == "max_tokens"
+
+    def test_malformed_response(self):
+        with pytest.raises(ToolTranslationError):
+            parse_gemini_response({"foo": "bar"})
+
+    def test_function_call_missing_name_raises(self):
+        body = {
+            "candidates": [
+                {
+                    "content": {"parts": [{"functionCall": {"args": {"ids": ["x"]}}}]},
+                    "finishReason": "STOP",
+                }
+            ]
+        }
+        with pytest.raises(ToolTranslationError):
+            parse_gemini_response(body)
+
+    def test_function_call_non_object_raises(self):
+        # Regression: a truthy non-object ``functionCall`` (e.g. a string) must
+        # surface as ToolTranslationError, not a raw AttributeError from .get().
+        body = {
+            "candidates": [
+                {
+                    "content": {"parts": [{"functionCall": "oops"}]},
+                    "finishReason": "STOP",
+                }
+            ]
+        }
+        with pytest.raises(ToolTranslationError):
+            parse_gemini_response(body)
+
+    def test_function_call_non_object_args_raises(self):
+        # Regression: a non-object ``args`` (e.g. a list) must surface as a
+        # ToolTranslationError, not a raw TypeError/ValueError from dict(...).
+        body = {
+            "candidates": [
+                {
+                    "content": {"parts": [{"functionCall": {"name": "rank", "args": ["x"]}}]},
+                    "finishReason": "STOP",
+                }
+            ]
+        }
+        with pytest.raises(ToolTranslationError):
+            parse_gemini_response(body)
+
+    def test_function_call_missing_args_defaults_to_empty(self):
+        # Regression: omitted/null ``args`` yields an empty input dict, not a crash.
+        body = {
+            "candidates": [
+                {
+                    "content": {"parts": [{"functionCall": {"name": "rank"}}]},
+                    "finishReason": "STOP",
+                }
+            ]
+        }
+        resp = parse_gemini_response(body)
+        assert resp.tool_calls[0].name == "rank"
+        assert resp.tool_calls[0].input == {}
+
+    def test_empty_candidates_blocked_by_safety(self):
+        # Gemini can return an empty candidates list (e.g. safety block).
+        body = {"candidates": [], "promptFeedback": {"blockReason": "SAFETY"}}
+        with pytest.raises(ToolTranslationError):
+            parse_gemini_response(body)
+
+
+class TestParseOpenAIResponse:
+    def test_text_response(self):
+        body = {
+            "model": "gpt-5-mini",
+            "choices": [
+                {"finish_reason": "stop", "message": {"role": "assistant", "content": "hi"}}
+            ],
+            "usage": {"prompt_tokens": 3, "completion_tokens": 1},
+        }
+        resp = parse_openai_response(body)
+        assert resp.text == "hi"
+        assert resp.stop_reason == "end_turn"
+        assert resp.tool_calls == []
+        assert resp.usage.prompt == 3
+        assert resp.usage.completion == 1
+        assert resp.model == "gpt-5-mini"
+
+    def test_tool_call(self):
+        body = {
+            "model": "gpt-5-mini",
+            "choices": [
+                {
+                    "finish_reason": "tool_calls",
+                    "message": {
+                        "role": "assistant",
+                        "content": None,
+                        "tool_calls": [
+                            {
+                                "id": "call_1",
+                                "type": "function",
+                                "function": {
+                                    "name": "rank_recommendations",
+                                    "arguments": '{"ids": ["a", "b"]}',
+                                },
+                            }
+                        ],
+                    },
+                }
+            ],
+            "usage": {"prompt_tokens": 10, "completion_tokens": 5},
+        }
+        resp = parse_openai_response(body)
+        assert resp.stop_reason == "tool_use"
+        assert len(resp.tool_calls) == 1
+        assert resp.tool_calls[0].name == "rank_recommendations"
+        assert resp.tool_calls[0].input == {"ids": ["a", "b"]}
+        assert resp.tool_calls[0].id == "call_1"
+
+    def test_malformed_response(self):
+        with pytest.raises(ToolTranslationError):
+            parse_openai_response({"foo": "bar"})
+
+    def test_tool_arguments_invalid_json(self):
+        body = {
+            "choices": [
+                {
+                    "finish_reason": "tool_calls",
+                    "message": {
+                        "tool_calls": [
+                            {
+                                "id": "call_1",
+                                "function": {
+                                    "name": "rank",
+                                    "arguments": "{not json",
+                                },
+                            }
+                        ]
+                    },
+                }
+            ]
+        }
+        with pytest.raises(ToolTranslationError):
+            parse_openai_response(body)
+
+    @pytest.mark.parametrize("bad_args", [[], False, 0, 1, "[]", "false"])
+    def test_tool_arguments_falsy_non_object_rejected(self, bad_args):
+        """Falsy/non-object arguments must raise, not silently coerce to {}."""
+        body = {
+            "choices": [
+                {
+                    "finish_reason": "tool_calls",
+                    "message": {
+                        "tool_calls": [
+                            {
+                                "id": "call_1",
+                                "function": {"name": "rank", "arguments": bad_args},
+                            }
+                        ]
+                    },
+                }
+            ]
+        }
+        with pytest.raises(ToolTranslationError):
+            parse_openai_response(body)
+
+    @pytest.mark.parametrize("empty_args", [None, ""])
+    def test_tool_arguments_none_or_empty_string_become_empty_dict(self, empty_args):
+        """None (and empty-string, used by some compatible servers) → {} is valid."""
+        body = {
+            "choices": [
+                {
+                    "finish_reason": "tool_calls",
+                    "message": {
+                        "tool_calls": [
+                            {
+                                "id": "call_1",
+                                "function": {"name": "rank", "arguments": empty_args},
+                            }
+                        ]
+                    },
+                }
+            ]
+        }
+        resp = parse_openai_response(body)
+        assert resp.tool_calls[0].input == {}
+
+    def test_finish_reason_length(self):
+        body = {"choices": [{"finish_reason": "length", "message": {"content": "..."}}]}
+        resp = parse_openai_response(body)
+        assert resp.stop_reason == "max_tokens"
+
+
+class TestParseAnthropicResponse:
+    def test_text_response(self):
+        # Use dict shape — adapters accept either SDK objects or dicts.
+        msg = {
+            "model": "claude-haiku",
+            "stop_reason": "end_turn",
+            "content": [{"type": "text", "text": "hello"}],
+            "usage": {"input_tokens": 2, "output_tokens": 1},
+        }
+        resp = parse_anthropic_response(msg)
+        assert resp.text == "hello"
+        assert resp.stop_reason == "end_turn"
+        assert resp.usage.prompt == 2
+        assert resp.usage.completion == 1
+
+    def test_tool_use(self):
+        msg = {
+            "stop_reason": "tool_use",
+            "content": [
+                {
+                    "type": "tool_use",
+                    "id": "tu_1",
+                    "name": "rank",
+                    "input": {"ids": ["x"]},
+                }
+            ],
+        }
+        resp = parse_anthropic_response(msg)
+        assert resp.stop_reason == "tool_use"
+        assert len(resp.tool_calls) == 1
+        assert resp.tool_calls[0].input == {"ids": ["x"]}
+
+    def test_max_tokens(self):
+        msg = {"stop_reason": "max_tokens", "content": []}
+        resp = parse_anthropic_response(msg)
+        assert resp.stop_reason == "max_tokens"
+
+    def test_anthropic_tool_use_missing_id_name_raises(self):
+        """Regression: malformed tool_use without id/name must fail fast.
+
+        Pin per PR #348: previously the parser cast missing values to the
+        string "None", producing invalid canonical ToolCall objects.
+        """
+        msg = {
+            "stop_reason": "tool_use",
+            "content": [{"type": "tool_use", "input": {"ids": ["x"]}}],
+        }
+        with pytest.raises(ToolTranslationError):
+            parse_anthropic_response(msg)
+
+    def test_anthropic_tool_use_empty_name_raises(self):
+        """Empty name with no id to fall back to must raise, not emit 'None'."""
+        msg = {
+            "stop_reason": "tool_use",
+            "content": [{"type": "tool_use", "name": "", "input": {}}],
+        }
+        with pytest.raises(ToolTranslationError):
+            parse_anthropic_response(msg)
diff --git a/server/tests/test_llm_url_validator.py b/server/tests/test_llm_url_validator.py
new file mode 100644
index 00000000..2ab1a9b0
--- /dev/null
+++ b/server/tests/test_llm_url_validator.py
@@ -0,0 +1,61 @@
+"""Tests for the OpenAI-compatible base URL validator."""
+
+import pytest
+
+from app.services.llm.url_validator import (
+    InvalidBaseUrlError,
+    validate_compatible_base_url,
+)
+
+
+class TestValidateCompatibleBaseUrl:
+    @pytest.mark.parametrize(
+        ("url", "expected"),
+        [
+            ("https://api.openai.com/v1", "https://api.openai.com/v1"),
+            ("https://example.com/v1/", "https://example.com/v1"),  # strips trailing slash
+            ("http://localhost:8080", "http://localhost:8080"),  # loopback hostname
+            ("http://127.0.0.1:8000", "http://127.0.0.1:8000"),  # loopback IP
+            ("http://192.168.1.100", "http://192.168.1.100"),  # RFC1918 192.168/16
+            ("http://10.0.0.5/v1", "http://10.0.0.5/v1"),  # RFC1918 10/8
+            ("http://172.20.0.1", "http://172.20.0.1"),  # RFC1918 172.16/12
+            ("https://example.com", "https://example.com"),  # host root, no path
+            ("https://example.com/", "https://example.com"),  # empty path → no slash
+            ("http://127.0.0.1:11434/v1", "http://127.0.0.1:11434/v1"),  # preserves port
+            ("http://[::1]:8080", "http://[::1]:8080"),  # IPv6 loopback
+            ("http://[fc00::1]/v1", "http://[fc00::1]/v1"),  # IPv6 unique-local fc00::/7
+            ("http://[fe80::1]", "http://[fe80::1]"),  # IPv6 link-local fe80::/10
+            (
+                "https://example.com/v1/chat/completions",
+                "https://example.com/v1/chat/completions",
+            ),  # multi-segment path preserved
+        ],
+    )
+    def test_accepts_and_normalises(self, url, expected):
+        assert validate_compatible_base_url(url) == expected
+
+    @pytest.mark.parametrize(
+        "url",
+        [
+            "http://example.com/v1",  # public host must use HTTPS
+            "http://8.8.8.8",  # public IP must use HTTPS
+            "https://user:pass@example.com/v1",  # embedded credentials
+            "https://example.com/v1?api_key=secret",  # query string
+            "https://example.com/v1#fragment",  # fragment
+            "",  # empty
+            "example.com/v1",  # missing scheme
+            "ftp://example.com",  # invalid scheme
+            "https://",  # missing host
+            "http://[2001:4860:4860::8888]",  # public IPv6 (Google DNS)
+            "   ",  # whitespace only
+        ],
+    )
+    def test_rejects(self, url):
+        with pytest.raises(InvalidBaseUrlError):
+            validate_compatible_base_url(url)
+
+    def test_case_normalization_scheme(self):
+        # Scheme is lower-cased; netloc and path are preserved as-given.
+        result = validate_compatible_base_url("HTTPS://EXAMPLE.COM/V1")
+        assert result.startswith("https://")
+        assert result.endswith("/V1")
diff --git a/server/tests/test_sse_pool.py b/server/tests/test_sse_pool.py
new file mode 100644
index 00000000..8e77d208
--- /dev/null
+++ b/server/tests/test_sse_pool.py
@@ -0,0 +1,197 @@
+"""Regression test for issue #356 — SSE event_stream must NOT pin a pooled
+DB connection for the lifetime of the stream.
+
+Before the fix, event_stream declared `db: Session = Depends(get_db)`, so
+FastAPI held the session (and its checked-out QueuePool connection) open
+until the request finished — which for an EventSource never happens while
+the browser holds it open. ~15 concurrent guest viewers exhausted the pool
+(pool_size=5 + max_overflow=10).
+
+These tests bypass the conftest StaticPool override and drive a real
+QueuePool engine so engine.pool.checkedout() is meaningful.
+"""
+
+import asyncio
+from datetime import timedelta
+
+import pytest
+from sqlalchemy import create_engine
+from sqlalchemy.orm import sessionmaker
+from sqlalchemy.pool import QueuePool
+from starlette.requests import Request as StarletteRequest
+
+from app.core.time import utcnow
+from app.models.base import Base
+from app.models.event import Event
+from app.models.user import User
+from app.services.auth import get_password_hash
+
+
+@pytest.fixture()
+def pooled_engine(monkeypatch):
+    """A real shared-cache SQLite engine using QueuePool (default), so
+    engine.pool.checkedout() reflects actual checked-out connections.
+
+    Patches app.db.session.SessionLocal AND the name already imported into
+    app.api.sse so the endpoint resolves our pooled session factory.
+    """
+    import app.api.sse as sse_module
+    import app.db.session as db_session
+
+    engine = create_engine(
+        "sqlite:///file:sse_pool_test?mode=memory&cache=shared&uri=true",
+        poolclass=QueuePool,
+        pool_size=5,
+        max_overflow=10,
+        connect_args={"check_same_thread": False},
+    )
+    Base.metadata.create_all(bind=engine)
+    test_session = sessionmaker(autocommit=False, autoflush=False, bind=engine)
+
+    monkeypatch.setattr(db_session, "SessionLocal", test_session)
+    monkeypatch.setattr(sse_module, "SessionLocal", test_session, raising=False)
+
+    # Seed an active event using a short-lived session.
+    with test_session() as s:
+        user = User(
+            username="pooluser",
+            password_hash=get_password_hash("poolpassword123"),
+            role="dj",
+        )
+        s.add(user)
+        s.commit()
+        s.refresh(user)
+        evt = Event(
+            code="POOL01",
+            join_code="POOLJN",
+            name="Pool Event",
+            created_by_user_id=user.id,
+            expires_at=utcnow() + timedelta(hours=6),
+        )
+        s.add(evt)
+        s.commit()
+
+    try:
+        yield engine, test_session
+    finally:
+        Base.metadata.drop_all(bind=engine)
+        engine.dispose()
+
+
+def _make_request(code: str) -> StarletteRequest:
+    """Minimal ASGI scope for a GET that reports as a live, idle client.
+
+    The nested ``receive`` callable must NOT return ``http.disconnect``: doing
+    so makes ``StarletteRequest.is_disconnected()`` true on the first generator
+    iteration and the SSE generator exits before it can ever await
+    ``queue.get()``. That would mean the concurrency test (below) is asserting
+    that *instantly-disconnected* streams hold zero pool connections — trivially
+    true and useless as a regression for issue #356.
+
+    Instead, ``receive`` suspends forever on a never-set ``asyncio.Event``,
+    which matches a real live, idle SSE client that has opened the connection
+    and is simply waiting for server-sent events. The handler then suspends on
+    ``queue.get()`` as intended, and we can meaningfully assert
+    ``pool.checkedout() == 0`` across N concurrent idle streams.
+    """
+    scope = {
+        "type": "http",
+        "method": "GET",
+        "path": f"/api/public/events/{code}/stream",
+        "headers": [],
+        "query_string": b"",
+    }
+
+    never_disconnect = asyncio.Event()
+
+    async def receive():  # pragma: no cover - suspended forever in these tests
+        await never_disconnect.wait()
+        # Unreachable: the event is never set. Return value satisfies type
+        # checkers; runtime suspends indefinitely above.
+        return {"type": "http.disconnect"}
+
+    return StarletteRequest(scope, receive)
+
+
+def test_event_stream_returns_with_pool_checked_in(pooled_engine):
+    """After event_stream() returns, the existence-check connection must be
+    back in the pool (checkedout() == 0)."""
+    from app.api.sse import event_stream
+
+    engine, _ = pooled_engine
+    assert engine.pool.checkedout() == 0
+
+    req = _make_request("POOLJN")
+    asyncio.run(event_stream(code="POOLJN", request=req))
+
+    # EventSourceResponse created, generator not yet iterated.
+    assert engine.pool.checkedout() == 0
+
+
+def test_n_concurrent_idle_streams_hold_zero_pool_connections(pooled_engine):
+    """N concurrent open (idle) SSE streams must hold ~0 pooled connections.
+
+    Open N generators (past pool_size + max_overflow = 15), prime each one
+    tick so the generator body is actively suspended on queue.get(), then
+    assert the pool has 0 checked-out connections. Before the fix this would
+    be N (one pinned per stream) and would TimeoutError past 15.
+    """
+    from app.api.sse import event_stream
+
+    engine, _ = pooled_engine
+    n = 25  # well past pool capacity (15)
+
+    async def drive():
+        generators = []
+        for _ in range(n):
+            req = _make_request("POOLJN")
+            resp = await event_stream(code="POOLJN", request=req)
+            generators.append(resp.body_iterator)
+
+        # Prime each generator one step so it subscribes and suspends on
+        # queue.get(); give the event loop a tick to settle.
+        primer_tasks = [asyncio.ensure_future(g.__anext__()) for g in generators]
+        await asyncio.sleep(0.05)
+
+        # Sanity-check that streams are actually suspended (not instantly
+        # exited). If receive() returns http.disconnect immediately, every
+        # primer would already be done here and the pool-connection assertion
+        # below would pass for the wrong reason.
+        assert any(not t.done() for t in primer_tasks), (
+            "streams did not remain open/idle — receive() must suspend, not "
+            "return http.disconnect immediately"
+        )
+
+        checked_out = engine.pool.checkedout()
+
+        # Cancel the primers, await their cancellation so the generators are
+        # no longer running, then close them to release subscriptions.
+        for t in primer_tasks:
+            t.cancel()
+        for t in primer_tasks:
+            try:
+                await t
+            except (asyncio.CancelledError, BaseException):  # noqa: BLE001
+                pass
+        for g in generators:
+            await g.aclose()
+
+        return checked_out
+
+    checked_out = asyncio.run(drive())
+    assert checked_out == 0, (
+        f"Expected 0 pooled connections held by {n} idle SSE streams, "
+        f"got {checked_out} — the stream is pinning DB connections."
+    )
+
+
+def test_event_stream_preserves_404_for_unknown_event(pooled_engine):
+    """Existence check must still reject unknown codes with 404."""
+    from fastapi import HTTPException
+
+    from app.api.sse import event_stream
+
+    req = _make_request("NOEXIS")
+    with pytest.raises(HTTPException) as exc:
+        asyncio.run(event_stream(code="NOEXIS", request=req))
+    assert exc.value.status_code == 404
diff --git a/server/tests/test_verify_status_endpoint.py b/server/tests/test_verify_status_endpoint.py
index 4799bec6..e915be95 100644
--- a/server/tests/test_verify_status_endpoint.py
+++ b/server/tests/test_verify_status_endpoint.py
@@ -93,15 +93,27 @@ def b64enc(b: bytes) -> str:
     def test_tampered_signature_returns_false(self, client: TestClient, db: Session):
         from fastapi import Response
 
-        from app.services.human_verification import COOKIE_NAME, issue_human_cookie
+        from app.services.human_verification import (
+            COOKIE_NAME,
+            _b64decode,
+            _b64encode,
+            issue_human_cookie,
+        )
 
         guest = _make_guest(db, "tamper")
         helper_resp = Response()
         issue_human_cookie(helper_resp, guest.id)
         raw = helper_resp.headers["set-cookie"]
         cookie_value = raw.split(f"{COOKIE_NAME}=", 1)[1].split(";", 1)[0]
-        # Flip the last char of the signature portion
-        bad = cookie_value[:-1] + ("A" if cookie_value[-1] != "A" else "B")
+        # Tamper at the decoded-bytes level so the mutation is guaranteed to
+        # change sig_bytes. Flipping the last base64url char only touches the
+        # high bits of the trailing byte (low bits are discarded on decode), so
+        # it frequently round-trips to the SAME signature — that was the flaky
+        # tamper vector. Flip a whole byte instead. (Regression for #364.)
+        payload_part, sig_part = cookie_value.rsplit(".", 1)
+        sig = bytearray(_b64decode(sig_part))
+        sig[0] ^= 0xFF
+        bad = f"{payload_part}.{_b64encode(bytes(sig))}"
 
         client.cookies.clear()
         client.cookies.set(COOKIE_NAME, bad)