shaun0927 · shaun0927 · May 13, 2026 · May 12, 2026 · May 12, 2026 · May 12, 2026
diff --git a/src/tools/_shared/state-header.ts b/src/tools/_shared/state-header.ts
@@ -0,0 +1,64 @@
+/**
+ * State Header — unified page-state envelope for tool responses.
+ *
+ * Prepends a 4-line header to text-mode tool responses so agents can
+ * determine which page a snapshot came from without parsing the payload.
+ * JSON-mode responses instead carry the header object under a `state` key.
+ * Opt-out: set OPENCHROME_STATE_HEADER=off (case-insensitive) to restore
+ * v1.11.0 byte-identical output.
+ */
+
+export interface PageStateHeader {
+  url: string; // printed as "Page URL" in the text header (CR/LF replaced by spaces)
+  title: string; // printed as "Page Title" in the text header (CR/LF replaced by spaces)
+  mode: 'ax' | 'dom' | 'css' | 'html' | 'inspect' | 'validate'; // printed verbatim as "Page Mode"
+  capturedAt: number; // Unix ms — server wall-clock at response assembly
+  tabId: string; // not printed by formatHeaderText; only visible in the JSON `state` object
+}
+
+/**
+ * Returns true when the state header should be included in responses.
+ * Enabled unless OPENCHROME_STATE_HEADER equals "off" in any letter case (the value is not trimmed).
+ */
+export function isStateHeaderEnabled(): boolean {
+  const val = process.env.OPENCHROME_STATE_HEADER; // read on every call, not cached
+  return val === undefined || val.toLowerCase() !== 'off'; // unset, empty, or any other value → enabled
+}
+
+/**
+ * Formats the 4-line header text: page URL, page title, page mode, and capture time (`tabId` is not emitted).
+ * The returned string ends with a trailing newline, so `formatHeaderText(h) + existingPayload`
+ * needs no extra newline; callers that want a blank separator line should append '\n' first.
+ * NOTE(review): `toISOString()` throws a RangeError if `capturedAt` is not a valid time value.
+ */
+export function formatHeaderText(h: PageStateHeader): string {
+  const capturedAtIso = new Date(h.capturedAt).toISOString(); // ISO 8601 string in UTC
+  // Replace CR/LF with spaces so a crafted title/url cannot split the fixed 4-line header into
+  // extra lines and spoof later fields. NOTE(review): U+2028/U+2029 are not covered by this regex.
+  const safeUrl = h.url.replace(/[\r\n]/g, ' ');
+  const safeTitle = h.title.replace(/[\r\n]/g, ' ');
+  return (
+    `- Page URL: ${safeUrl}\n` +
+    `- Page Title: ${safeTitle}\n` +
+    `- Page Mode: ${h.mode}\n` +
+    `- Captured At: ${capturedAtIso}\n`
+  );
+}
+
+/**
+ * Prepends the state header, followed by one blank line, to a text payload.
+ * Returns the payload unchanged when the header is disabled.
+ */
+export function prependHeaderText(h: PageStateHeader, payload: string): string {
+  if (!isStateHeaderEnabled()) return payload;
+  return formatHeaderText(h) + '\n' + payload; // header already ends in '\n'; this extra '\n' is the blank line
+}
+
+/**
+ * Adds the state header to a JSON-mode response object as a leading `state` property (nested, not flattened).
+ * Returns the same object, unchanged, when the header is disabled.
+ */
+export function mergeHeaderJson<T extends object>(h: PageStateHeader, obj: T): T & { state: PageStateHeader } | T {
+  if (!isStateHeaderEnabled()) return obj;
+  return { state: h, ...obj }; // NOTE(review): spread comes last, so a `state` key already on obj replaces the header
+}
diff --git a/src/tools/inspect.ts b/src/tools/inspect.ts
@@ -14,6 +14,7 @@ import { TOOL_ANNOTATIONS } from '../types/tool-annotations';
 import { getSessionManager } from '../session-manager';
 import { withTimeout } from '../utils/with-timeout';
 import { getAllShadowRoots, querySelectorInShadowRoots } from '../utils/shadow-dom';
+import { prependHeaderText } from './_shared/state-header';
 import {
   formatNodeRefToken,
   getCurrentLoaderId,
@@ -578,8 +579,9 @@ const handler: ToolHandler = async (
     // Footer with page context (always included)
     lines.push(`[Page] ${inspectResult.url} | "${inspectResult.title}"`);
 
+    const inspectPayload = lines.join('\n');
     return {
-      content: [{ type: 'text', text: lines.join('\n') }],
+      content: [{ type: 'text', text: prependHeaderText({ url: inspectResult.url, title: inspectResult.title, mode: 'inspect', capturedAt: Date.now(), tabId }, inspectPayload) }],
     };
   } catch (error) {
     return {

diff --git a/src/tools/page-content.ts b/src/tools/page-content.ts
@@ -1,148 +1,155 @@
-/**
- * Page Content Tool - Get HTML content from page
- */
-
-import { MCPServer } from '../mcp-server';
-import { MCPToolDefinition, MCPResult, ToolHandler } from '../types/mcp';
+/**
+ * Page Content Tool - Get HTML content from page
+ */
+
+import { MCPServer } from '../mcp-server';
+import { MCPToolDefinition, MCPResult, ToolHandler } from '../types/mcp';
 import { TOOL_ANNOTATIONS } from '../types/tool-annotations';
-import { getSessionManager } from '../session-manager';
-import { MAX_OUTPUT_CHARS, DEFAULT_NAVIGATION_TIMEOUT_MS } from '../config/defaults';
-import { withTimeout } from '../utils/with-timeout';
-
-const definition: MCPToolDefinition = {
-  name: 'page_content',
-  description: 'Get HTML content from page or element.',
-  inputSchema: {
-    type: 'object',
-    properties: {
-      tabId: {
-        type: 'string',
-        description: 'Tab ID to get content from',
-      },
-      selector: {
-        type: 'string',
-        description: 'CSS selector. Omit for full page',
-      },
-      outerHTML: {
-        type: 'boolean',
-        description: 'Return outerHTML vs innerHTML. Default: true',
-      },
-    },
-    required: ['tabId'],
-  },
+import { getSessionManager } from '../session-manager';
+import { MAX_OUTPUT_CHARS, DEFAULT_NAVIGATION_TIMEOUT_MS } from '../config/defaults';
+import { withTimeout } from '../utils/with-timeout';
+import { mergeHeaderJson, isStateHeaderEnabled } from './_shared/state-header';
+
+const definition: MCPToolDefinition = {
+  name: 'page_content',
+  description: 'Get HTML content from page or element.',
+  inputSchema: {
+    type: 'object',
+    properties: {
+      tabId: {
+        type: 'string',
+        description: 'Tab ID to get content from',
+      },
+      selector: {
+        type: 'string',
+        description: 'CSS selector. Omit for full page',
+      },
+      outerHTML: {
+        type: 'boolean',
+        description: 'Return outerHTML vs innerHTML. Default: true',
+      },
+    },
+    required: ['tabId'],
+  },
   annotations: TOOL_ANNOTATIONS.page_content,
-};
-
-const handler: ToolHandler = async (
-  sessionId: string,
-  args: Record<string, unknown>
-): Promise<MCPResult> => {
-  const tabId = args.tabId as string;
-  const selector = args.selector as string | undefined;
-  const outerHTML = (args.outerHTML as boolean) ?? true;
-
-  const sessionManager = getSessionManager();
-
-  if (!tabId) {
-    return {
-      content: [{ type: 'text', text: 'Error: tabId is required' }],
-      isError: true,
-    };
-  }
-
-  try {
-    const page = await sessionManager.getPage(sessionId, tabId, undefined, 'page_content');
-    if (!page) {
-      return {
-        content: [{ type: 'text', text: `Error: Tab ${tabId} not found` }],
-        isError: true,
-      };
-    }
-
-    if (selector) {
-      // Get content from specific element
-      const element = await page.$(selector);
-
-      if (!element) {
-        return {
-          content: [
-            {
-              type: 'text',
-              text: JSON.stringify({
-                action: 'page_content',
-                selector,
-                content: null,
-                message: `No element found matching "${selector}"`,
-              }),
-            },
-          ],
-          isError: true,
-        };
-      }
-
-      let html = await withTimeout(page.evaluate(
-        (el: Element, getOuter: boolean) => {
-          return getOuter ? el.outerHTML : el.innerHTML;
-        },
-        element,
-        outerHTML
-      ), 15000, 'page_content');
-
-      const originalLength = html.length;
-      if (html.length > MAX_OUTPUT_CHARS) {
-        html = html.substring(0, MAX_OUTPUT_CHARS) + `\n\n[Truncated: ${originalLength} chars total, showing first ${MAX_OUTPUT_CHARS}]`;
-      }
-
-      return {
-        content: [
-          {
-            type: 'text',
-            text: JSON.stringify({
-              action: 'page_content',
-              selector,
-              outerHTML,
-              contentLength: originalLength,
-              content: html,
-            }),
-          },
-        ],
-      };
-    } else {
-      // Get full page content
-      let html = await withTimeout(page.content(), DEFAULT_NAVIGATION_TIMEOUT_MS, 'page.content()');
-
-      const originalLength = html.length;
-      if (html.length > MAX_OUTPUT_CHARS) {
-        html = html.substring(0, MAX_OUTPUT_CHARS) + `\n\n[Truncated: ${originalLength} chars total, showing first ${MAX_OUTPUT_CHARS}]`;
-      }
-
-      return {
-        content: [
-          {
-            type: 'text',
-            text: JSON.stringify({
-              action: 'page_content',
-              selector: null,
-              contentLength: originalLength,
-              content: html,
-            }),
-          },
-        ],
-      };
-    }
-  } catch (error) {
-    return {
-      content: [
-        {
-          type: 'text',
-          text: `Page content error: ${error instanceof Error ? error.message : String(error)}`,
-        },
-      ],
-      isError: true,
-    };
-  }
-};
-
-export function registerPageContentTool(server: MCPServer): void {
-  server.registerTool('page_content', handler, definition);
-}
+};
+
+const handler: ToolHandler = async (
+  sessionId: string,
+  args: Record<string, unknown>
+): Promise<MCPResult> => { // page_content tool: returns page or element HTML as JSON text; failures set isError
+  const tabId = args.tabId as string; // cast only — not validated beyond the emptiness check below
+  const selector = args.selector as string | undefined;
+  const outerHTML = (args.outerHTML as boolean) ?? true; // null/undefined → true
+
+  const sessionManager = getSessionManager();
+
+  if (!tabId) {
+    return {
+      content: [{ type: 'text', text: 'Error: tabId is required' }],
+      isError: true,
+    };
+  }
+
+  try {
+    const page = await sessionManager.getPage(sessionId, tabId, undefined, 'page_content');
+    if (!page) {
+      return {
+        content: [{ type: 'text', text: `Error: Tab ${tabId} not found` }],
+        isError: true,
+      };
+    }
+
+    if (selector) { // an empty-string selector is falsy and takes the full-page branch
+      // Element mode: resolve the first match for the selector and return its HTML
+      const element = await page.$(selector);
+
+      if (!element) {
+        const missingBody = {
+          action: 'page_content',
+          selector,
+          content: null,
+          message: `No element found matching "${selector}"`,
+        };
+        const missingWithState = isStateHeaderEnabled() // checked here so page.title() is not awaited when the header is off
+          ? mergeHeaderJson( // NOTE(review): page.title() has no withTimeout; a rejection lands in the catch below
+              { url: page.url(), title: await page.title(), mode: 'html' as const, capturedAt: Date.now(), tabId },
+              missingBody,
+            )
+          : missingBody;
+        return {
+          content: [{ type: 'text', text: JSON.stringify(missingWithState) }],
+          isError: true,
+        };
+      }
+
+      let html = await withTimeout(page.evaluate(
+        (el: Element, getOuter: boolean) => {
+          return getOuter ? el.outerHTML : el.innerHTML;
+        },
+        element,
+        outerHTML
+      ), 15000, 'page_content'); // presumably a 15 s limit — confirm withTimeout's unit
+
+      const originalLength = html.length; // length before truncation; reported as contentLength
+      if (html.length > MAX_OUTPUT_CHARS) { // the notice is appended after the cut, so content can exceed MAX_OUTPUT_CHARS
+        html = html.substring(0, MAX_OUTPUT_CHARS) + `\n\n[Truncated: ${originalLength} chars total, showing first ${MAX_OUTPUT_CHARS}]`;
+      }
+
+      const elementBody = {
+        action: 'page_content',
+        selector,
+        outerHTML,
+        contentLength: originalLength,
+        content: html,
+      };
+      const elementWithState = isStateHeaderEnabled() // NOTE(review): url/title are read after the HTML was captured
+        ? mergeHeaderJson(
+            { url: page.url(), title: await page.title(), mode: 'html' as const, capturedAt: Date.now(), tabId },
+            elementBody,
+          )
+        : elementBody;
+      return {
+        content: [{ type: 'text', text: JSON.stringify(elementWithState) }],
+      };
+    } else {
+      // Full-page mode: serialize the whole document via page.content()
+      let html = await withTimeout(page.content(), DEFAULT_NAVIGATION_TIMEOUT_MS, 'page.content()');
+
+      const originalLength = html.length; // length before truncation; reported as contentLength
+      if (html.length > MAX_OUTPUT_CHARS) { // the notice is appended after the cut, so content can exceed MAX_OUTPUT_CHARS
+        html = html.substring(0, MAX_OUTPUT_CHARS) + `\n\n[Truncated: ${originalLength} chars total, showing first ${MAX_OUTPUT_CHARS}]`;
+      }
+
+      const fullPageBody = {
+        action: 'page_content',
+        selector: null,
+        contentLength: originalLength,
+        content: html,
+      };
+      const fullPageWithState = isStateHeaderEnabled() // NOTE(review): url/title are read after the HTML was captured
+        ? mergeHeaderJson(
+            { url: page.url(), title: await page.title(), mode: 'html' as const, capturedAt: Date.now(), tabId },
+            fullPageBody,
+          )
+        : fullPageBody;
+      return {
+        content: [{ type: 'text', text: JSON.stringify(fullPageWithState) }],
+      };
+    }
+  } catch (error) { // anything thrown inside the try becomes a plain-text error result (no state header)
+    return {
+      content: [
+        {
+          type: 'text',
+          text: `Page content error: ${error instanceof Error ? error.message : String(error)}`,
+        },
+      ],
+      isError: true,
+    };
+  }
+};
+
+export function registerPageContentTool(server: MCPServer): void {
+  server.registerTool('page_content', handler, definition); // binds this file's handler and definition to the 'page_content' name
+}