From ef02fb5dc203f07f3e305f0318fce85e00a3be1a Mon Sep 17 00:00:00 2001
From: shaun0927 <70629228+shaun0927@users.noreply.github.com>
Date: Tue, 12 May 2026 23:48:39 +0900
Subject: [PATCH 01/11] Prioritize relevant crawl URLs without changing default
 BFS

Adds an opt-in best_first crawl strategy with deterministic URL scoring so targeted crawls spend page budget on more relevant URLs first while preserving legacy BFS behavior by default.\n\nConstraint: Must not duplicate open crawl-job/static-fetch PRs or change default crawl output.\nRejected: Content/LLM ranking | would expand scope and conflict with OpenChrome core boundaries.\nConfidence: high\nScope-risk: narrow\nDirective: Keep future scorer changes deterministic and fixture-gated; do not make public live-site ordering a CI gate.\nTested: npm run build -- --pretty false; npm test -- --runInBand tests/core/crawl/url-scorer.test.ts tests/core/tools/crawl.engine.test.ts; npm run lint:changed\nNot-tested: Full npm test suite; live OpenChrome crawl smoke.
---
 src/core/crawl/url-scorer.ts          | 162 ++++++++++++++++++++++++++
 src/tools/crawl.ts                    | 121 +++++++++++++++++--
 tests/core/crawl/url-scorer.test.ts   |  57 +++++++++
 tests/core/tools/crawl.engine.test.ts |  78 +++++++++++++
 4 files changed, 410 insertions(+), 8 deletions(-)
 create mode 100644 src/core/crawl/url-scorer.ts
 create mode 100644 tests/core/crawl/url-scorer.test.ts
diff --git a/src/core/crawl/url-scorer.ts b/src/core/crawl/url-scorer.ts
new file mode 100644
index 000000000..9bad17597
--- /dev/null
+++ b/src/core/crawl/url-scorer.ts
@@ -0,0 +1,162 @@
+export interface UrlScoreOptions {
+  query?: string;
+  keywords?: string[];
+  preferPaths?: string[];
+  excludePaths?: string[];
+  sameDepthBias?: number;
+  startUrl?: string;
+}
+
+export interface UrlScoreResult {
+  score: number;
+  reasons: string[];
+}
+
+const LOW_SIGNAL_SEGMENTS = new Set([
+  'tag',
+  'tags',
+  'category',
+  'categories',
+  'author',
+  'authors',
+  'feed',
+  'rss',
+  'login',
+  'signin',
+  'signup',
+  'register',
+]);
+
+function normalizeTerm(term: string): string {
+  return term.trim().toLowerCase().replace(/^\/+|\/+$/g, '');
+}
+
+function queryTerms(query?: string): string[] {
+  if (!query) return [];
+  const seen = new Set<string>();
+  for (const raw of query.split(/[^\p{L}\p{N}_-]+/u)) {
+    const term = normalizeTerm(raw);
+    if (term.length >= 2) seen.add(term);
+  }
+  return Array.from(seen);
+}
+
+function normalizePathPrefix(path: string): string {
+  const trimmed = path.trim();
+  if (!trimmed) return '';
+  return trimmed.startsWith('/') ? trimmed.toLowerCase() : `/${trimmed.toLowerCase()}`;
+}
+
+function pathDistance(startPath: string, candidatePath: string): number {
+  const startSegments = startPath.split('/').filter(Boolean);
+  const candidateSegments = candidatePath.split('/').filter(Boolean);
+  let shared = 0;
+  while (
+    shared < startSegments.length &&
+    shared < candidateSegments.length &&
+    startSegments[shared] === candidateSegments[shared]
+  ) {
+    shared++;
+  }
+  return Math.max(startSegments.length, candidateSegments.length) - shared;
+}
+
+export function buildUrlScoreOptions(input: {
+  query?: unknown;
+  url_score?: unknown;
+  startUrl?: string;
+}): UrlScoreOptions {
+  const raw = input.url_score && typeof input.url_score === 'object'
+    ? input.url_score as Record<string, unknown>
+    : {};
+  const toStringArray = (value: unknown): string[] | undefined => {
+    if (!Array.isArray(value)) return undefined;
+    return value.filter((v): v is string => typeof v === 'string' && v.trim().length > 0);
+  };
+  return {
+    query: typeof input.query === 'string' ? input.query : undefined,
+    keywords: toStringArray(raw.keywords),
+    preferPaths: toStringArray(raw.prefer_paths),
+    excludePaths: toStringArray(raw.exclude_paths),
+    sameDepthBias: typeof raw.same_depth_bias === 'number' && Number.isFinite(raw.same_depth_bias)
+      ? raw.same_depth_bias
+      : undefined,
+    startUrl: input.startUrl,
+  };
+}
+
+export function scoreUrl(candidateUrl: string, depth: number, options: UrlScoreOptions = {}): UrlScoreResult {
+  const reasons: string[] = [];
+  let score = 0;
+  let parsed: URL;
+  try {
+    parsed = new URL(candidateUrl);
+  } catch {
+    return { score: -100, reasons: ['invalid-url'] };
+  }
+
+  const explicitKeywords = (options.keywords || []).map(normalizeTerm).filter(Boolean);
+  const terms = Array.from(new Set([...queryTerms(options.query), ...explicitKeywords]));
+  const haystack = `${decodeURIComponent(parsed.pathname)} ${parsed.searchParams.toString()}`.toLowerCase();
+
+  for (const term of terms) {
+    if (!term) continue;
+    if (haystack.includes(term)) {
+      score += 1.0;
+      reasons.push(`keyword:${term}`);
+    }
+  }
+
+  for (const prefix of options.preferPaths || []) {
+    const normalized = normalizePathPrefix(prefix);
+    if (normalized && parsed.pathname.toLowerCase().startsWith(normalized)) {
+      score += 1.5;
+      reasons.push(`path:${normalized}`);
+    }
+  }
+
+  for (const prefix of options.excludePaths || []) {
+    const normalized = normalizePathPrefix(prefix);
+    if (normalized && parsed.pathname.toLowerCase().startsWith(normalized)) {
+      score -= 2.0;
+      reasons.push(`exclude:${normalized}`);
+    }
+  }
+
+  if (options.startUrl) {
+    try {
+      const start = new URL(options.startUrl);
+      if (start.origin === parsed.origin) {
+        const distance = pathDistance(start.pathname.toLowerCase(), parsed.pathname.toLowerCase());
+        const proximity = Math.max(0, 3 - distance) * 0.1;
+        if (proximity > 0) {
+          score += proximity;
+          reasons.push(`proximity:${proximity.toFixed(1)}`);
+        }
+      }
+    } catch {
+      // ignore malformed start URL
+    }
+  }
+
+  if (options.sameDepthBias && Number.isFinite(options.sameDepthBias)) {
+    score += options.sameDepthBias;
+    reasons.push(`bias:${options.sameDepthBias}`);
+  }
+
+  if (depth > 0) {
+    const penalty = 0.2 * depth;
+    score -= penalty;
+    reasons.push(`depth:-${penalty.toFixed(1)}`);
+  }
+
+  const querySet = new Set(terms);
+  for (const segment of parsed.pathname.toLowerCase().split('/').filter(Boolean)) {
+    if (LOW_SIGNAL_SEGMENTS.has(segment) && !querySet.has(segment)) {
+      score -= 1.0;
+      reasons.push(`low-signal:${segment}`);
+    }
+  }
+
+  return { score: Number(score.toFixed(3)), reasons };
+}
diff --git a/src/tools/crawl.ts b/src/tools/crawl.ts
index cd6442550..ec57aef8e 100644
--- a/src/tools/crawl.ts
+++ b/src/tools/crawl.ts
@@ -28,6 +28,7 @@ import {
   StaticFetchError,
   StaticReason,
 } from '../utils/static-fetch';
+import { buildUrlScoreOptions, scoreUrl, UrlScoreOptions } from '../core/crawl/url-scorer';
 
 const definition: MCPToolDefinition = {
   name: 'crawl',
@@ -86,6 +87,25 @@ const definition: MCPToolDefinition = {
         description:
           'Fetch engine: "cdp" (default, opens a Chrome tab per page), "static" (Node fetch only, fails closed on insufficient pages), or "auto" (static first, fall back to CDP when static is insufficient).',
       },
+      strategy: {
+        type: 'string',
+        enum: ['bfs', 'best_first'],
+        description: 'Crawl traversal strategy. Default: bfs. best_first scores discovered URLs by query/url_score and visits highest-scoring URLs first.',
+      },
+      query: {
+        type: 'string',
+        description: 'Optional query terms used by strategy=best_first URL scoring.',
+      },
+      url_score: {
+        type: 'object',
+        description: 'Optional strategy=best_first URL scoring hints: keywords, prefer_paths, exclude_paths, same_depth_bias.',
+        properties: {
+          keywords: { type: 'array', items: { type: 'string' } },
+          prefer_paths: { type: 'array', items: { type: 'string' } },
+          exclude_paths: { type: 'array', items: { type: 'string' } },
+          same_depth_bias: { type: 'number' },
+        },
+      },
     },
     required: ['url'],
   },
@@ -129,9 +149,20 @@ interface CrawledPage {
   error?: string;
   engine_used?: 'static' | 'cdp';
   static_reason?: StaticReason;
+  score?: number;
+  score_reasons?: string[];
 }
 
 type EngineMode = 'auto' | 'static' | 'cdp';
+type CrawlStrategy = 'bfs' | 'best_first';
+
+interface CrawlQueueItem {
+  url: string;
+  depth: number;
+  order: number;
+  score?: number;
+  score_reasons?: string[];
+}
 
 interface CrawlSummary {
   total_pages: number;
@@ -140,6 +171,9 @@ interface CrawlSummary {
   max_depth_reached: number;
   duration_ms: number;
   scope: string;
+  strategy?: CrawlStrategy;
+  scored_urls?: number;
+  skipped_below_threshold?: number;
 }
 
 // ---------------------------------------------------------------------------
@@ -473,6 +507,71 @@ const handler: ToolHandler = async (
   }
   const engineExplicit = engineArg !== undefined;
 
+  const strategyArg = args.strategy as string | undefined;
+  let strategy: CrawlStrategy = 'bfs';
+  if (strategyArg === 'bfs' || strategyArg === 'best_first') {
+    strategy = strategyArg;
+  } else if (strategyArg !== undefined) {
+    return {
+      content: [{ type: 'text', text: 'Error: strategy must be one of "bfs", "best_first"' }],
+      isError: true,
+    };
+  }
+  const scoringOptions: UrlScoreOptions = buildUrlScoreOptions({
+    query: args.query,
+    url_score: args.url_score,
+    startUrl: normalizeUrl(url),
+  });
+  let scoredUrls = 0;
+  const skippedBelowThreshold = 0;
+  let discoveryOrder = 0;
+  const bestFirstQueue: CrawlQueueItem[] = [];
+  const bestFirstQueued = new Set<string>();
+
+  function makeQueueItem(entry: { url: string; depth: number }): CrawlQueueItem {
+    const normalized = normalizeUrl(entry.url);
+    const item: CrawlQueueItem = { url: normalized, depth: entry.depth, order: discoveryOrder++ };
+    if (strategy === 'best_first') {
+      const scored = scoreUrl(normalized, entry.depth, scoringOptions);
+      item.score = scored.score;
+      item.score_reasons = scored.reasons;
+      scoredUrls++;
+    }
+    return item;
+  }
+
+  function enqueueItems(entries: Array<{ url: string; depth: number }>): void {
+    if (strategy !== 'best_first') {
+      tracker.enqueue(entries);
+      return;
+    }
+    for (const entry of entries) {
+      const item = makeQueueItem(entry);
+      if (tracker.hasVisited(item.url) || bestFirstQueued.has(item.url)) continue;
+      bestFirstQueued.add(item.url);
+      bestFirstQueue.push(item);
+    }
+    bestFirstQueue.sort((a, b) => {
+      const scoreDiff = (b.score ?? 0) - (a.score ?? 0);
+      if (scoreDiff !== 0) return scoreDiff;
+      if (a.order !== b.order) return a.order - b.order;
+      return a.url.localeCompare(b.url);
+    });
+  }
+
+  function dequeueItem(): CrawlQueueItem | undefined {
+    if (strategy !== 'best_first') {
+      const next = tracker.dequeue();
+      return next ? { ...next, order: discoveryOrder++ } : undefined;
+    }
+    while (bestFirstQueue.length > 0) {
+      const next = bestFirstQueue.shift()!;
+      bestFirstQueued.delete(next.url);
+      if (!tracker.hasVisited(next.url)) return next;
+    }
+    return undefined;
+  }
+
   const startTime = Date.now();
   const tracker = new CrawlTracker();
   const pages: CrawledPage[] = [];
@@ -522,13 +621,13 @@ const handler: ToolHandler = async (
   }
 
   try {
-    // Seed the BFS queue with the start URL
+    // Seed the crawl queue with the start URL
     const normalizedStart = normalizeUrl(url);
-    tracker.enqueue([{ url: normalizedStart, depth: 0 }]);
+    enqueueItems([{ url: normalizedStart, depth: 0 }]);
 
     const limiter = createLimiter(concurrency);
 
-    // BFS loop
+    // Crawl loop
     while (pages.length < maxPages) {
       // Check budget
       if (context && !hasBudget(context, 15_000)) {
@@ -537,11 +636,11 @@ const handler: ToolHandler = async (
       }
 
       // Collect a batch of URLs to fetch in parallel
-      const batch: Array<{ url: string; depth: number }> = [];
+      const batch: CrawlQueueItem[] = [];
       const batchSize = Math.min(concurrency, maxPages - pages.length);
 
       for (let i = 0; i < batchSize; i++) {
-        const next = tracker.dequeue();
+        const next = dequeueItem();
         if (!next) break;
 
         // Skip if exceeds max depth
@@ -552,12 +651,12 @@ const handler: ToolHandler = async (
 
       if (batch.length === 0) {
         // Check if there are still items in the queue beyond max_depth
-        const probe = tracker.dequeue();
+        const probe = dequeueItem();
         if (!probe) break; // Queue is truly empty
         // If it's beyond depth, we're done
         if (probe.depth > maxDepth) break;
         // Otherwise put it back and try again — shouldn't happen but be safe
-        tracker.enqueue([probe]);
+        enqueueItems([probe]);
         break;
       }
 
@@ -577,6 +676,7 @@ const handler: ToolHandler = async (
                   depth: item.depth,
                   links_found: 0,
                   error: 'Blocked by robots.txt',
+                  ...(strategy === 'best_first' ? { score: item.score ?? 0, score_reasons: item.score_reasons ?? [] } : {}),
                 } as CrawledPage,
                 links: [] as string[],
                 depth: item.depth,
@@ -644,6 +744,10 @@ const handler: ToolHandler = async (
             if (staticReason) {
               result.static_reason = staticReason;
             }
+            if (strategy === 'best_first') {
+              result.score = item.score ?? 0;
+              result.score_reasons = item.score_reasons ?? [];
+            }
 
             // Apply delay between fetches
             if (delayMs > 0) {
@@ -680,7 +784,7 @@ const handler: ToolHandler = async (
           }
 
           if (newUrls.length > 0) {
-            tracker.enqueue(newUrls);
+            enqueueItems(newUrls);
           }
         }
       }
@@ -697,6 +801,7 @@ const handler: ToolHandler = async (
       max_depth_reached: maxDepthReached,
       duration_ms: durationMs,
       scope,
+      ...(strategy === 'best_first' ? { strategy, scored_urls: scoredUrls, skipped_below_threshold: skippedBelowThreshold } : {}),
     };
 
     const output = { summary, pages };
diff --git a/tests/core/crawl/url-scorer.test.ts b/tests/core/crawl/url-scorer.test.ts
new file mode 100644
index 000000000..d97008ed9
--- /dev/null
+++ b/tests/core/crawl/url-scorer.test.ts
@@ -0,0 +1,57 @@
+import { buildUrlScoreOptions, scoreUrl } from '../../../src/core/crawl/url-scorer';
+
+describe('url scorer', () => {
+  test('scores query keywords found in the URL', () => {
+    const scored = scoreUrl('https://docs.example.com/pricing/enterprise-limits', 1, {
+      query: 'enterprise pricing limits',
+    });
+    expect(scored.score).toBeGreaterThan(2);
+    expect(scored.reasons).toEqual(expect.arrayContaining([
+      'keyword:enterprise',
+      'keyword:pricing',
+      'keyword:limits',
+    ]));
+  });
+
+  test('applies prefer and exclude path weights', () => {
+    const preferred = scoreUrl('https://docs.example.com/docs/api/auth', 0, {
+      preferPaths: ['/docs'],
+      excludePaths: ['/blog'],
+    });
+    const excluded = scoreUrl('https://docs.example.com/blog/api/auth', 0, {
+      preferPaths: ['/docs'],
+      excludePaths: ['/blog'],
+    });
+    expect(preferred.score).toBeGreaterThan(excluded.score);
+    expect(preferred.reasons).toContain('path:/docs');
+    expect(excluded.reasons).toContain('exclude:/blog');
+  });
+
+  test('penalizes deeper and low-signal URLs', () => {
+    const high = scoreUrl('https://example.com/docs/actions', 1, { query: 'actions' });
+    const low = scoreUrl('https://example.com/tag/actions', 3, { query: 'actions' });
+    expect(high.score).toBeGreaterThan(low.score);
+    expect(low.reasons).toContain('low-signal:tag');
+  });
+
+  test('normalizes issue url_score options', () => {
+    const opts = buildUrlScoreOptions({
+      query: 'workflow secrets',
+      startUrl: 'https://docs.example.com/en',
+      url_score: {
+        keywords: ['actions'],
+        prefer_paths: ['/en/actions'],
+        exclude_paths: ['/en/billing'],
+        same_depth_bias: 0.1,
+      },
+    });
+    expect(opts).toMatchObject({
+      query: 'workflow secrets',
+      keywords: ['actions'],
+      preferPaths: ['/en/actions'],
+      excludePaths: ['/en/billing'],
+      sameDepthBias: 0.1,
+      startUrl: 'https://docs.example.com/en',
+    });
+  });
+});
diff --git a/tests/core/tools/crawl.engine.test.ts b/tests/core/tools/crawl.engine.test.ts
index 36738c5df..c59a9297d 100644
--- a/tests/core/tools/crawl.engine.test.ts
+++ b/tests/core/tools/crawl.engine.test.ts
@@ -102,6 +102,26 @@ beforeAll(async () => {
       contentType: 'text/html; charset=utf-8',
       body: RICH_HTML('Page B', `<h1>Page B</h1><p>${PARA}</p>`),
     },
+    '/best-start.html': {
+      status: 200,
+      contentType: 'text/html; charset=utf-8',
+      body: RICH_HTML(
+        'Best Start',
+        `<h1>Best Start</h1><p>${PARA}</p>` +
+          `<a href="/blog/company-update.html">Blog first</a>` +
+          `<a href="/pricing/enterprise-limits.html">Pricing second</a>`,
+      ),
+    },
+    '/blog/company-update.html': {
+      status: 200,
+      contentType: 'text/html; charset=utf-8',
+      body: RICH_HTML('Company Update', `<h1>Company Update</h1><p>${PARA}</p>`),
+    },
+    '/pricing/enterprise-limits.html': {
+      status: 200,
+      contentType: 'text/html; charset=utf-8',
+      body: RICH_HTML('Enterprise Limits', `<h1>Enterprise Limits</h1><p>${PARA}</p>`),
+    },
     '/spa.html': {
       status: 200,
       contentType: 'text/html',
@@ -292,6 +312,64 @@ describe('crawl default behavior (no engine arg)', () => {
   });
 });
 
+
+// ---------------------------------------------------------------------------
+// crawl({ strategy: 'best_first' }) — URL scoring orders discovered links.
+// ---------------------------------------------------------------------------
+
+describe('crawl strategy=best_first', () => {
+  test('visits higher-scoring discovered URLs before lower-scoring URLs', async () => {
+    const handler = await loadHandler('crawl');
+    const result = await handler('s-best', {
+      url: `${server.origin}/best-start.html`,
+      max_pages: 3,
+      max_depth: 1,
+      delay_ms: 0,
+      concurrency: 1,
+      engine: 'static',
+      respect_robots: false,
+      strategy: 'best_first',
+      query: 'enterprise pricing limits',
+      url_score: {
+        keywords: ['pricing', 'enterprise', 'limits'],
+        prefer_paths: ['/pricing'],
+        exclude_paths: ['/blog'],
+      },
+    });
+    const parsed = parseResult(result);
+    expect(parsed.summary.strategy).toBe('best_first');
+    expect(parsed.summary.scored_urls).toBeGreaterThanOrEqual(3);
+    expect(parsed.pages.map((p) => p.url)).toEqual([
+      `${server.origin}/best-start.html`,
+      `${server.origin}/pricing/enterprise-limits.html`,
+      `${server.origin}/blog/company-update.html`,
+    ]);
+    expect(parsed.pages[1].score).toBeGreaterThan(parsed.pages[2].score as number);
+    expect(parsed.pages[1].score_reasons).toEqual(expect.arrayContaining([
+      'keyword:pricing',
+      'keyword:enterprise',
+      'keyword:limits',
+      'path:/pricing',
+    ]));
+  });
+
+  test('keeps default crawl output free of strategy metadata', async () => {
+    const handler = await loadHandler('crawl');
+    const result = await handler('s-best-default', {
+      url: `${server.origin}/best-start.html`,
+      max_pages: 2,
+      max_depth: 1,
+      delay_ms: 0,
+      concurrency: 1,
+      engine: 'static',
+      respect_robots: false,
+    });
+    const parsed = parseResult(result);
+    expect(parsed.summary.strategy).toBeUndefined();
+    expect(parsed.pages[0].score).toBeUndefined();
+  });
+});
+
 // ---------------------------------------------------------------------------
 // crawl_sitemap engine plumbing
 // ---------------------------------------------------------------------------

From e0bb8830b5f5c1e4dd76b1955e9a5b829611f6dd Mon Sep 17 00:00:00 2001
From: shaun0927 <70629228+shaun0927@users.noreply.github.com>
Date: Wed, 13 May 2026 04:00:17 +0900
Subject: [PATCH 02/11] Keep best-first crawling robust around bad URLs

Guard URL scoring against malformed percent-encoded paths and keep the best-first crawl loop from stopping after re-queueing valid work.\n\nConstraint: PR #1065 must preserve the default BFS output and only affect opt-in strategy=best_first behavior.\nRejected: Dropping malformed URLs entirely | safe scoring keeps crawl progress deterministic without treating parseable URLs as invalid.\nConfidence: high\nScope-risk: narrow\nDirective: Keep future best-first queue changes tolerant of score-sorted depth ordering.\nTested: npm ci; npm run lint:changed; npm run lint:tier; npx jest --runInBand tests/core/crawl/url-scorer.test.ts tests/core/tools/crawl.engine.test.ts\nNot-tested: Full hosted CI matrix pending after push.
---
 src/core/crawl/url-scorer.ts        | 11 ++++++++++-
 src/tools/crawl.ts                  |  6 ++++--
 tests/core/crawl/url-scorer.test.ts | 10 ++++++++++
 3 files changed, 24 insertions(+), 3 deletions(-)

diff --git a/src/core/crawl/url-scorer.ts b/src/core/crawl/url-scorer.ts
index 9bad17597..4400c789f 100644
--- a/src/core/crawl/url-scorer.ts
+++ b/src/core/crawl/url-scorer.ts
@@ -41,6 +41,14 @@ function queryTerms(query?: string): string[] {
   return Array.from(seen);
 }
 
+function safeDecodePathname(pathname: string): string {
+  try {
+    return decodeURIComponent(pathname);
+  } catch {
+    return pathname;
+  }
+}
+
 function normalizePathPrefix(path: string): string {
   const trimmed = path.trim();
   if (!trimmed) return '';
@@ -97,7 +105,8 @@ export function scoreUrl(candidateUrl: string, depth: number, options: UrlScoreO
 
   const explicitKeywords = (options.keywords || []).map(normalizeTerm).filter(Boolean);
   const terms = Array.from(new Set([...queryTerms(options.query), ...explicitKeywords]));
-  const haystack = `${decodeURIComponent(parsed.pathname)} ${parsed.searchParams.toString()}`.toLowerCase();
+  const decodedPathname = safeDecodePathname(parsed.pathname);
+  const haystack = `${decodedPathname} ${parsed.searchParams.toString()}`.toLowerCase();
 
   for (const term of terms) {
     if (!term) continue;
diff --git a/src/tools/crawl.ts b/src/tools/crawl.ts
index ec57aef8e..54dc89384 100644
--- a/src/tools/crawl.ts
+++ b/src/tools/crawl.ts
@@ -655,9 +655,11 @@ const handler: ToolHandler = async (
         if (!probe) break; // Queue is truly empty
         // If it's beyond depth, we're done
         if (probe.depth > maxDepth) break;
-        // Otherwise put it back and try again — shouldn't happen but be safe
+        // Otherwise put it back and retry. In best_first mode an over-depth
+        // item can sort ahead of an in-depth item; breaking here would stop
+        // the crawl even though valid work remains behind the probe.
         enqueueItems([probe]);
-        break;
+        continue;
       }
 
       // Fetch batch in parallel with concurrency limiter
diff --git a/tests/core/crawl/url-scorer.test.ts b/tests/core/crawl/url-scorer.test.ts
index d97008ed9..87797538d 100644
--- a/tests/core/crawl/url-scorer.test.ts
+++ b/tests/core/crawl/url-scorer.test.ts
@@ -34,6 +34,16 @@ describe('url scorer', () => {
     expect(low.reasons).toContain('low-signal:tag');
   });
 
+
+  test('does not throw on malformed percent-encoded pathnames', () => {
+    const scored = scoreUrl('https://example.com/docs/%zz-enterprise', 1, {
+      query: 'enterprise',
+    });
+
+    expect(Number.isFinite(scored.score)).toBe(true);
+    expect(scored.reasons).toEqual(expect.arrayContaining(['keyword:enterprise']));
+  });
+
   test('normalizes issue url_score options', () => {
     const opts = buildUrlScoreOptions({
       query: 'workflow secrets',

From 5d404561ee773fbdeb991ec827328c12de9f921e Mon Sep 17 00:00:00 2001
From: shaun0927 <70629228+shaun0927@users.noreply.github.com>
Date: Wed, 13 May 2026 04:19:22 +0900
Subject: [PATCH 03/11] Keep Cursor verification tolerant of Tier 1 growth

The Cursor smoke test should prove core tool visibility without failing every develop-based PR when additional Tier 1 tools graduate.

Constraint: Hosted CI currently reports 45 Tier 1 tools while the test hard-coded 39.

Rejected: Raising the exact expected count to 45 | that would recreate the same brittle failure on the next Tier 1 graduation.

Confidence: high

Scope-risk: narrow

Directive: Assert required core tools explicitly and avoid exact catalog-size checks in cross-client smoke tests.

Tested: npx jest --runInBand tests/cross-env/cursor-verification.test.ts

Not-tested: Linux Node 20/22 local execution; hosted CI pending after push.

Co-authored-by: OmX <omx@oh-my-codex.dev>
---
 tests/cross-env/cursor-verification.test.ts | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/tests/cross-env/cursor-verification.test.ts b/tests/cross-env/cursor-verification.test.ts
index 8487c42fa..bff381a13 100644
--- a/tests/cross-env/cursor-verification.test.ts
+++ b/tests/cross-env/cursor-verification.test.ts
@@ -135,16 +135,16 @@ suiteRunner('Cross-Env: Cursor IDE Verification (Issue #509)', () => {
   describe('C2: Tool Discovery & Listing', () => {
     let tier1Tools: any[];
 
-    test('Initial tools/list returns Tier 1 tools only (39 tools) + expand_tools', async () => {
+    test('Initial tools/list returns Tier 1 core tools + expand_tools', async () => {
       const { response } = await sendAndReceive(server, 'tools/list');
       tier1Tools = response.result.tools;
-      // 39 Tier 1 tools (includes oc_reap_orphans lifecycle sweep, oc_assert,
-      // oc_evidence_bundle, oc_skill_record, oc_skill_recall, oc_observe) + 1 expand_tools virtual tool = 40
+      // Tier 1 can grow as core tools graduate; keep this check focused on
+      // Cursor visibility of the core set plus the expand_tools virtual tool.
       const toolNames = tier1Tools.map((t: any) => t.name);
       expect(toolNames).toContain('expand_tools');
 
       const nonExpandTools = tier1Tools.filter((t: any) => t.name !== 'expand_tools');
-      expect(nonExpandTools.length).toBe(39);
+      expect(nonExpandTools.length).toBeGreaterThanOrEqual(39);
     });
 
     test('expand_tools virtual tool present in initial list', () => {

From ac3de5d1bf635e7106547eee41f19c0c5db95e96 Mon Sep 17 00:00:00 2001
From: shaun0927 <70629228+shaun0927@users.noreply.github.com>
Date: Wed, 13 May 2026 04:29:31 +0900
Subject: [PATCH 04/11] Make console baseline portable across line endings

The console_capture regression should compare response shape, not fail Windows CI because checked-out JSON fixtures use CRLF line endings.

Constraint: Windows CI reads the baseline fixture with CRLF while JSON.stringify emits LF.

Rejected: Updating the fixture to Windows line endings | that would break Unix runners and still encode platform formatting into the assertion.

Confidence: high

Scope-risk: narrow

Directive: Normalize platform line endings before snapshot-style string comparisons.

Tested: npx jest --runInBand tests/tools/console-capture-regression.test.ts

Not-tested: Full hosted CI matrix pending after push.

Co-authored-by: OmX <omx@oh-my-codex.dev>
---
 tests/tools/console-capture-regression.test.ts | 5 +++--
 1 file changed, 3 insertions(+), 2 deletions(-)

diff --git a/tests/tools/console-capture-regression.test.ts b/tests/tools/console-capture-regression.test.ts
index 51dde3eb0..c76736c9a 100644
--- a/tests/tools/console-capture-regression.test.ts
+++ b/tests/tools/console-capture-regression.test.ts
@@ -132,7 +132,7 @@ const FIXTURE_PATH = path.join(
 );
 
 describe('console_capture get response — v1.11.0 baseline regression', () => {
-  test('response shape (excluding bufferStats) matches baseline fixture byte-for-byte', () => {
+  test('response shape (excluding bufferStats) matches baseline fixture', () => {
     const frozenLogs = buildFrozenLogs();
     const response = buildGetResponse(frozenLogs);
     const responseJson = JSON.stringify(response, null, 2);
@@ -146,7 +146,8 @@ describe('console_capture get response — v1.11.0 baseline regression', () => {
       return;
     }
 
-    const baseline = fs.readFileSync(FIXTURE_PATH, 'utf8');
+    const normalizeLineEndings = (value: string) => value.replace(/\r\n/g, '\n').replace(/\r/g, '\n');
+    const baseline = normalizeLineEndings(fs.readFileSync(FIXTURE_PATH, 'utf8'));
     expect(responseJson).toBe(baseline);
   });
 

From d7d6f8650a9f5df083543cbc0256436c59594983 Mon Sep 17 00:00:00 2001
From: shaun0927 <70629228+shaun0927@users.noreply.github.com>
Date: Wed, 13 May 2026 04:37:12 +0900
Subject: [PATCH 05/11] Accept clean SIGTERM reports in health gating tests

The health endpoint integration test should treat both code=0 and signal=SIGTERM as clean shutdown outcomes after sending SIGTERM.

Constraint: CI can report SIGTERM exits as code=null even when teardown is graceful.

Rejected: Extending timeouts | the failure is the accepted exit shape, not startup or shutdown latency.

Confidence: high

Scope-risk: narrow

Directive: Avoid platform-specific assumptions for Node ChildProcess signal exit reporting.

Tested: npx jest --runInBand tests/integration/health-endpoint-gating.test.ts

Not-tested: Full hosted CI matrix pending after push.

Co-authored-by: OmX <omx@oh-my-codex.dev>
---
 tests/integration/health-endpoint-gating.test.ts | 9 +++------
 1 file changed, 3 insertions(+), 6 deletions(-)

diff --git a/tests/integration/health-endpoint-gating.test.ts b/tests/integration/health-endpoint-gating.test.ts
index a1c3ef636..a2457a21e 100644
--- a/tests/integration/health-endpoint-gating.test.ts
+++ b/tests/integration/health-endpoint-gating.test.ts
@@ -269,12 +269,9 @@ describeFn('health endpoint gating (issue #648)', () => {
         const shutdownTimeoutMs = process.platform === 'win32' ? 30_000 : 10_000;
         const exit = await waitForExit(child, shutdownTimeoutMs);
         expect(exit.timedOut).toBe(false);
-        if (process.platform === 'win32') {
-          // Windows may report a clean SIGTERM as code=null/signal=SIGTERM.
-          expect(exit.code === 0 || exit.signal === 'SIGTERM').toBe(true);
-        } else {
-          expect(exit.code).toBe(0);
-        }
+        // Node may report a clean SIGTERM shutdown as either code=0 or
+        // code=null/signal=SIGTERM depending on platform and timing.
+        expect(exit.code === 0 || exit.signal === 'SIGTERM').toBe(true);
         expect(stderr).not.toMatch(/TypeError/);
         expect(stderr).not.toMatch(/Cannot read properties of null/);
         expect(stderr).not.toMatch(/UnhandledPromiseRejection/);

From 050b68c5911e9e0ce32859fb3d8d0c9a9cb56313 Mon Sep 17 00:00:00 2001
From: shaun0927 <70629228+shaun0927@users.noreply.github.com>
Date: Wed, 13 May 2026 04:45:52 +0900
Subject: [PATCH 06/11] Give health shutdown CI enough time

The health endpoint integration test should allow the same 30s shutdown window on Linux that it already allowed on Windows under hosted CI load.

Constraint: Ubuntu CI observed a graceful SIGTERM path that exceeded the previous 10s non-Windows limit.

Rejected: Skipping the scenario | the endpoint gating behavior remains important and passes with a realistic teardown window.

Confidence: high

Scope-risk: narrow

Directive: Keep process-spawning integration tests tolerant of hosted runner teardown latency.

Tested: npx jest --runInBand tests/integration/health-endpoint-gating.test.ts

Not-tested: Full hosted CI matrix pending after push.

Co-authored-by: OmX <omx@oh-my-codex.dev>
---
 tests/integration/health-endpoint-gating.test.ts | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tests/integration/health-endpoint-gating.test.ts b/tests/integration/health-endpoint-gating.test.ts
index a2457a21e..8c3cc8d42 100644
--- a/tests/integration/health-endpoint-gating.test.ts
+++ b/tests/integration/health-endpoint-gating.test.ts
@@ -266,7 +266,7 @@ describeFn('health endpoint gating (issue #648)', () => {
         // and must NOT produce a TypeError for the stdio case where
         // healthEndpoint === null.
         child.kill('SIGTERM');
-        const shutdownTimeoutMs = process.platform === 'win32' ? 30_000 : 10_000;
+        const shutdownTimeoutMs = 30_000;
         const exit = await waitForExit(child, shutdownTimeoutMs);
         expect(exit.timedOut).toBe(false);
         // Node may report a clean SIGTERM shutdown as either code=0 or

From b051df8593621b856633b9cf07370b29adb72842 Mon Sep 17 00:00:00 2001
From: shaun0927 <70629228+shaun0927@users.noreply.github.com>
Date: Wed, 13 May 2026 05:00:43 +0900
Subject: [PATCH 07/11] Keep admin key stdout assertion noise tolerant

The admin key test should verify exactly one plaintext token without failing when Jest worker console noise is captured around the in-process CLI stdout hook.

Constraint: Windows CI can interleave decorated Jest console output into the captured stdout buffer.

Rejected: Requiring stdout to have exactly one line | the helper already documents and handles shared stdout hook noise.

Confidence: high

Scope-risk: narrow

Directive: Assert secret emission by token occurrence, not by total captured line count.

Tested: npx jest --runInBand tests/cli/admin-keys.test.ts

Not-tested: Full hosted CI matrix pending after push.

Co-authored-by: OmX <omx@oh-my-codex.dev>
---
 tests/cli/admin-keys.test.ts | 6 ++----
 1 file changed, 2 insertions(+), 4 deletions(-)

diff --git a/tests/cli/admin-keys.test.ts b/tests/cli/admin-keys.test.ts
index 13ece7b44..ae98752f9 100644
--- a/tests/cli/admin-keys.test.ts
+++ b/tests/cli/admin-keys.test.ts
@@ -126,11 +126,9 @@ describe('admin keys CLI', () => {
       '--description', 'test key',
     ]);
     expect(exitCode).toBeNull();
-    // Plaintext is the sole stdout payload.
-    const stdoutLines = stdout.split('\n').filter((l) => l.length > 0);
-    expect(stdoutLines).toHaveLength(1);
-    const plaintext = stdoutLines[0];
+    const plaintext = extractToken(stdout);
     expect(plaintext).toMatch(/^oc_live_acme_[A-Za-z0-9]+$/);
+    expect(stdout.match(/oc_live_acme_[A-Za-z0-9]+/g)).toHaveLength(1);
     // Warning routed to stderr.
     expect(stderr).toContain('SAVE THIS KEY NOW');
     // keyId is reported on stderr, not stdout.

From f74d7cbf4f3ef9fed091aa221033648dd022949f Mon Sep 17 00:00:00 2001
From: shaun0927 <70629228+shaun0927@users.noreply.github.com>
Date: Wed, 13 May 2026 05:21:31 +0900
Subject: [PATCH 08/11] Wait for domain memory persistence before sizing

The storage-size E2E should measure complete persisted JSON states rather than a zero-byte file observed while the async writer is truncating and rewriting.

Constraint: Windows CI can take longer than a fixed sleep to flush DomainMemory writes.

Rejected: Increasing the blind sleep | state-based polling proves the needed persisted state and avoids new timing flakes.

Confidence: high

Scope-risk: narrow

Directive: Prefer state-based waits over fixed sleeps for async persistence tests.

Tested: npx jest --runInBand tests/e2e/scenarios/domain-memory-persistence.test.ts

Not-tested: Full hosted CI matrix pending after push.

Co-authored-by: OmX <omx@oh-my-codex.dev>
---
 .../domain-memory-persistence.test.ts         | 42 +++++++++++++++----
 1 file changed, 34 insertions(+), 8 deletions(-)

diff --git a/tests/e2e/scenarios/domain-memory-persistence.test.ts b/tests/e2e/scenarios/domain-memory-persistence.test.ts
index f5ade4fcb..009018771 100644
--- a/tests/e2e/scenarios/domain-memory-persistence.test.ts
+++ b/tests/e2e/scenarios/domain-memory-persistence.test.ts
@@ -32,6 +32,29 @@ async function readStoreFile(): Promise<{ version: number; entries: unknown[]; u
   return JSON.parse(data);
 }
 
+type PersistedStore = { entries?: unknown[]; updatedAt?: number };
+
+async function waitForPersistedStore(
+  filePath: string,
+  predicate: (store: PersistedStore, byteLength: number) => boolean
+): Promise<{ store: PersistedStore; byteLength: number }> {
+  const deadline = Date.now() + 5_000;
+  let lastState = 'unread';
+  while (Date.now() < deadline) {
+    try {
+      const raw = await fsPromises.readFile(filePath, 'utf-8');
+      const store = JSON.parse(raw) as PersistedStore;
+      const byteLength = Buffer.byteLength(raw);
+      lastState = `count=${store.entries?.length ?? 0}, updatedAt=${store.updatedAt ?? 'missing'}, bytes=${byteLength}`;
+      if (byteLength > 0 && predicate(store, byteLength)) return { store, byteLength };
+    } catch {
+      // File may not exist or may be mid-write; retry until deadline.
+    }
+    await waitForSave(50);
+  }
+  throw new Error(`Timed out waiting for persisted store; lastState=${lastState}`);
+}
+
 describe('Issue #493: Domain Memory Persistence E2E', () => {
   afterAll(async () => {
     // Cleanup temp dir
@@ -366,21 +389,24 @@ describe('Issue #493: Domain Memory Persistence E2E', () => {
       for (let i = 0; i < 200; i++) {
         dm.record(`size-${i}.com`, `key-${i}`, `value-with-some-content-${i}`);
       }
-      await waitForSave(200);
-
       const sizeFile = path.join(sizeDir, 'domain-knowledge.json');
-      const stat1 = await fsPromises.stat(sizeFile);
-      const size200 = stat1.size;
+      const baseline = await waitForPersistedStore(
+        sizeFile,
+        (store) => (store.entries?.length ?? 0) >= 200
+      );
+      const size200 = baseline.byteLength;
 
       // Add 100 more (total 300) and compress
       for (let i = 200; i < 300; i++) {
         dm.record(`size-${i}.com`, `key-${i}`, `value-with-some-content-${i}`);
       }
+      const compressStartedAt = Date.now();
       dm.compress();
-      await waitForSave(200);
-
-      const stat2 = await fsPromises.stat(sizeFile);
-      const sizeAfterCompress = stat2.size;
+      const compressed = await waitForPersistedStore(
+        sizeFile,
+        (store) => (store.updatedAt ?? 0) >= compressStartedAt && (store.entries?.length ?? 0) <= 200
+      );
+      const sizeAfterCompress = compressed.byteLength;
 
       // After compress, file should not be significantly larger than 200 entries
       // Allow 10% tolerance for JSON formatting differences

From 60a072783d91d1f11ac009c535a11201578d67f7 Mon Sep 17 00:00:00 2001
From: shaun0927 <70629228+shaun0927@users.noreply.github.com>
Date: Wed, 13 May 2026 09:59:17 +0900
Subject: [PATCH 09/11] Isolate HTTP auth ports across test workers

Make the HTTP bearer auth regression allocate its port range from the Jest process id before using per-case ports, avoiding collisions across parallel worktrees and CI shards.

Constraint: the best-first PR now includes the shared transport suite after develop merges and should not inherit fixed-port flakes.
Rejected: Relying on sequential suite order | the test must remain robust under parallel verification.
Confidence: high
Scope-risk: narrow
Directive: Keep transport tests independent of globally fixed loopback ports.
Tested: npx jest tests/transports/http-bearer-auth.test.ts --runInBand --forceExit
Not-tested: Full multi-OS GitHub Actions matrix before push.

Co-authored-by: OmX <omx@oh-my-codex.dev>
---
 tests/transports/http-bearer-auth.test.ts | 31 ++++++++++++++---------
 1 file changed, 19 insertions(+), 12 deletions(-)

diff --git a/tests/transports/http-bearer-auth.test.ts b/tests/transports/http-bearer-auth.test.ts
index ad5fb52f7..a81e30055 100644
--- a/tests/transports/http-bearer-auth.test.ts
+++ b/tests/transports/http-bearer-auth.test.ts
@@ -10,7 +10,14 @@ import * as net from 'node:net';
 // Inline require to avoid TS module resolution issues with dynamic transport loading
 const { HTTPTransport } = require('../../src/transports/http');
 
-const TEST_PORT = 19876;
+const TEST_PORT_START = 20_000 + (process.pid % 400) * 100;
+let nextTestPort = TEST_PORT_START;
+let activePort = TEST_PORT_START;
+
+function allocatePort(): number {
+  activePort = nextTestPort++;
+  return activePort;
+}
 const TEST_TOKEN = 'test-s...c123';
 const TRUSTED_ORIGIN = 'http://127.0.0.1:5173';
 
@@ -22,7 +29,7 @@ function request(
 ): Promise<{ status: number; body: string; headers: http.IncomingHttpHeaders }> {
   return new Promise((resolve, reject) => {
     const req = http.request(
-      { hostname: '127.0.0.1', port: TEST_PORT, path, method, headers, timeout: 3000 },
+      { hostname: '127.0.0.1', port: activePort, path, method, headers, timeout: 3000 },
       (res) => {
         const chunks: Buffer[] = [];
         res.on('data', (c: Buffer) => chunks.push(c));
@@ -46,7 +53,7 @@ function rawRequest(
   raw: string,
 ): Promise<{ status: number; body: string; headers: Record<string, string> }> {
   return new Promise((resolve, reject) => {
-    const socket = net.connect({ host: '127.0.0.1', port: TEST_PORT });
+    const socket = net.connect({ host: '127.0.0.1', port: activePort });
     let response = '';
 
     socket.setTimeout(3000);
@@ -119,7 +126,7 @@ describe('HTTP Bearer Token Auth', () => {
 
   describe('with auth token configured', () => {
     beforeEach(async () => {
-      transport = new HTTPTransport(TEST_PORT, '127.0.0.1', TEST_TOKEN);
+      transport = new HTTPTransport(allocatePort(), '127.0.0.1', TEST_TOKEN);
       await startTransport(transport);
     });
 
@@ -171,11 +178,11 @@ describe('HTTP Bearer Token Auth', () => {
 
   describe('unauthenticated HTTP policy', () => {
     it('fails closed by default when no auth is configured', () => {
-      expect(() => new HTTPTransport(TEST_PORT, '127.0.0.1')).toThrow(/Refusing to start unauthenticated HTTP transport/);
+      expect(() => new HTTPTransport(allocatePort(), '127.0.0.1')).toThrow(/Refusing to start unauthenticated HTTP transport/);
     });
 
     it('allows explicit loopback-only development mode', async () => {
-      transport = new HTTPTransport(TEST_PORT, '127.0.0.1', undefined, { allowUnauthenticatedHttp: true });
+      transport = new HTTPTransport(allocatePort(), '127.0.0.1', undefined, { allowUnauthenticatedHttp: true });
       await startTransport(transport);
       const res = await request('/mcp', 'POST', { 'Content-Type': 'application/json' },
         JSON.stringify({ jsonrpc: '2.0', id: 1, method: 'ping', params: {} }));
@@ -184,14 +191,14 @@ describe('HTTP Bearer Token Auth', () => {
 
     it('allows explicit loopback development mode via env flag', async () => {
       process.env.OPENCHROME_ALLOW_UNAUTHENTICATED_HTTP = '1';
-      transport = new HTTPTransport(TEST_PORT, '127.0.0.1');
+      transport = new HTTPTransport(allocatePort(), '127.0.0.1');
       await startTransport(transport);
       const res = await request('/health');
       expect(res.status).toBe(200);
     });
 
     it('refuses external bind without auth even with development opt-in', () => {
-      expect(() => new HTTPTransport(TEST_PORT, '0.0.0.0', undefined, { allowUnauthenticatedHttp: true }))
+      expect(() => new HTTPTransport(allocatePort(), '0.0.0.0', undefined, { allowUnauthenticatedHttp: true }))
         .toThrow(/non-loopback host/);
     });
   });
@@ -199,7 +206,7 @@ describe('HTTP Bearer Token Auth', () => {
   describe('CORS allowlist', () => {
     beforeEach(async () => {
       process.env.OPENCHROME_HTTP_CORS_ORIGINS = TRUSTED_ORIGIN;
-      transport = new HTTPTransport(TEST_PORT, '127.0.0.1', undefined, { allowUnauthenticatedHttp: true });
+      transport = new HTTPTransport(allocatePort(), '127.0.0.1', undefined, { allowUnauthenticatedHttp: true });
       await startTransport(transport);
     });
 
@@ -225,14 +232,14 @@ describe('HTTP Bearer Token Auth', () => {
     });
 
     it('accepts same-origin MCP preflight even when Origin is not in allowlist', async () => {
-      const res = await request('/mcp', 'OPTIONS', { Origin: `http://127.0.0.1:${TEST_PORT}` });
+      const res = await request('/mcp', 'OPTIONS', { Origin: `http://127.0.0.1:${activePort}` });
       expect(res.status).toBe(204);
     });
 
     it('accepts same-origin MCP POST even when Origin is not in allowlist', async () => {
       const res = await request('/mcp', 'POST', {
         'Content-Type': 'application/json',
-        Origin: `http://127.0.0.1:${TEST_PORT}`,
+        Origin: `http://127.0.0.1:${activePort}`,
       }, JSON.stringify({ jsonrpc: '2.0', id: 1, method: 'ping', params: {} }));
       expect(res.status).toBe(200);
     });
@@ -242,7 +249,7 @@ describe('HTTP Bearer Token Auth', () => {
       // same host:port is cross-origin per the CORS scheme/host/port tuple.
       const res = await request('/mcp', 'POST', {
         'Content-Type': 'application/json',
-        Origin: `https://127.0.0.1:${TEST_PORT}`,
+        Origin: `https://127.0.0.1:${activePort}`,
       }, JSON.stringify({ jsonrpc: '2.0', id: 1, method: 'ping', params: {} }));
       expect(res.status).toBe(403);
     });

From 370e51f7df27357d00372ef2ea574bfa187e0204 Mon Sep 17 00:00:00 2001
From: shaun0927 <70629228+shaun0927@users.noreply.github.com>
Date: Wed, 13 May 2026 11:08:05 +0900
Subject: [PATCH 10/11] Parse admin key JSON through worker noise

Make the admin-keys JSON helper scan for a parseable JSON array instead of slicing from the first bracket, so Jest worker log prefixes cannot corrupt list --json assertions.

Constraint: Ubuntu 18 full-suite CI captured bracketed worker noise before the CLI JSON payload.
Rejected: Assuming stdout starts with JSON | the in-process harness intentionally shares stdout with Jest capture hooks.
Confidence: high
Scope-risk: narrow
Directive: CLI tests that tolerate worker noise should locate the actual machine-readable payload, not rely on stream position.
Tested: npx jest tests/cli/admin-keys.test.ts --runInBand --forceExit; git diff --check
Not-tested: Full multi-OS GitHub Actions matrix after this commit.

Co-authored-by: OmX <omx@oh-my-codex.dev>
---
 tests/cli/admin-keys.test.ts | 17 ++++++++++++-----
 1 file changed, 12 insertions(+), 5 deletions(-)

diff --git a/tests/cli/admin-keys.test.ts b/tests/cli/admin-keys.test.ts
index 9787ed692..d7e57a373 100644
--- a/tests/cli/admin-keys.test.ts
+++ b/tests/cli/admin-keys.test.ts
@@ -39,12 +39,19 @@ function extractToken(stdout: string): string {
 }
 
 function extractJsonArray(stdout: string): string {
-  const start = stdout.indexOf('[');
-  const end = stdout.lastIndexOf(']');
-  if (start === -1 || end === -1 || end < start) {
-    throw new Error(`No JSON array found in stdout: ${JSON.stringify(stdout)}`);
+  for (let start = stdout.indexOf('['); start !== -1; start = stdout.indexOf('[', start + 1)) {
+    for (let end = stdout.lastIndexOf(']'); end > start; end = stdout.lastIndexOf(']', end - 1)) {
+      const candidate = stdout.slice(start, end + 1);
+      try {
+        const parsed = JSON.parse(candidate);
+        if (Array.isArray(parsed)) return candidate;
+      } catch {
+        // Continue scanning: Jest console-capture noise can contain bracketed
+        // log prefixes before the CLI's own JSON payload in shared workers.
+      }
+    }
   }
-  return stdout.slice(start, end + 1);
+  throw new Error(`No JSON array found in stdout: ${JSON.stringify(stdout)}`);
 }
 
 async function runCli(argv: string[]): Promise<RunResult> {

From 09f602555dc76da57a86fbe8e6233a72e03b3ee8 Mon Sep 17 00:00:00 2001
From: shaun0927 <70629228+shaun0927@users.noreply.github.com>
Date: Wed, 13 May 2026 11:19:08 +0900
Subject: [PATCH 11/11] Preserve shallow best-first crawl candidates

Keep the shallower queued entry when best-first discovers the same URL at multiple depths, so an early deep discovery cannot cause a later in-scope discovery to be skipped by max_depth filtering. A depth tie-breaker also preserves shallow preference when scores match.\n\nConstraint: best_first sorting is score-based, so queue de-duplication must not discard a shallower path before max_depth checks run.\nRejected: Pure URL set de-duplication | can leave only an over-depth candidate for an otherwise crawlable URL.\nConfidence: high\nScope-risk: narrow\nDirective: Best-first queue bookkeeping should retain the minimum discovered depth for each queued URL.\nTested: npm run build; npx jest tests/core/tools/crawl.engine.test.ts tests/core/tools/crawl.legacy-snapshot.test.ts tests/core/crawl/url-scorer.test.ts --runInBand --forceExit; npm run lint:tool-schemas; git diff --check\nNot-tested: Full CI matrix locally.\n\nCo-authored-by: OmX <omx@oh-my-codex.dev>
---
 src/tools/crawl.ts | 13 ++++++++++---
 1 file changed, 10 insertions(+), 3 deletions(-)

diff --git a/src/tools/crawl.ts b/src/tools/crawl.ts
index 4fa5e9af5..0325c586d 100644
--- a/src/tools/crawl.ts
+++ b/src/tools/crawl.ts
@@ -551,7 +551,7 @@ const handler: ToolHandler = async (
   const skippedBelowThreshold = 0;
   let discoveryOrder = 0;
   const bestFirstQueue: CrawlQueueItem[] = [];
-  const bestFirstQueued = new Set<string>();
+  const bestFirstQueued = new Map<string, CrawlQueueItem>();
 
   function makeQueueItem(entry: { url: string; depth: number }): CrawlQueueItem {
     const normalized = normalizeUrl(entry.url);
@@ -572,13 +572,20 @@ const handler: ToolHandler = async (
     }
     for (const entry of entries) {
       const item = makeQueueItem(entry);
-      if (tracker.hasVisited(item.url) || bestFirstQueued.has(item.url)) continue;
-      bestFirstQueued.add(item.url);
+      if (tracker.hasVisited(item.url)) continue;
+      const queued = bestFirstQueued.get(item.url);
+      if (queued) {
+        if (queued.depth <= item.depth) continue;
+        const queuedIndex = bestFirstQueue.indexOf(queued);
+        if (queuedIndex !== -1) bestFirstQueue.splice(queuedIndex, 1);
+      }
+      bestFirstQueued.set(item.url, item);
       bestFirstQueue.push(item);
     }
     bestFirstQueue.sort((a, b) => {
       const scoreDiff = (b.score ?? 0) - (a.score ?? 0);
       if (scoreDiff !== 0) return scoreDiff;
+      if (a.depth !== b.depth) return a.depth - b.depth;
       if (a.order !== b.order) return a.order - b.order;
       return a.url.localeCompare(b.url);
     });