timescale · jgpruitt · May 1, 2026 · Apr 30, 2026 · May 1, 2026 · May 1, 2026
@@ -243,6 +243,12 @@ Skipped memories do not contribute to the exit code; only parse and engine error
 
 `--dry-run` validates parsing only; it does not predict id collisions with already-imported memories. Run with `--verbose` after a real import to see the skipped ids.
 
+### Chunking and partial failures
+
+Large imports are sliced into multiple `batchCreate` requests under the hood to fit under the server's request-body limit. Each chunk is sent sequentially. If a chunk fails (network error, server error), siblings are not affected -- the successful chunks still land. The failed chunk's items are reported as `failed`, and the chunk-level error message appears in the `errors` array (sourced as `chunk N (K items)`).
+
+This means partial failures are now possible: `imported > 0` and `failed > 0` can both be true in the same run. Re-running the import with the same input will pick up where the previous run left off (already-inserted ids are skipped via `ON CONFLICT DO NOTHING`, missing ids are inserted).
+
 ---
 
 ## me memory export

@@ -88,6 +88,15 @@ JSON mode (`--format json`) returns:
 | `skippedIdempotent` | Skipped because already present at this version. |
 | `skippedConflict` | Skipped because the id is held by something not from this pack/version. |
 | `skippedConflictIds` | Array of conflicting ids (only present when `skippedConflict > 0`). |
+| `failed` | Memories in chunks whose `batchCreate` request failed (network or server error). |
+| `failedIds` | Array of ids in failed chunks (only present when `failed > 0`). |
+| `errors` | Per-chunk error detail: `{ chunkIndex, itemCount, ids, error }` (only present when `failed > 0`). |
+
+### Chunking and partial failures
+
+Large packs are sliced into multiple `batchCreate` requests under the hood to fit under the server's request-body limit. Chunks are sent sequentially. If a chunk fails (network error, server error), siblings are not affected -- the successful chunks still land. The failed memories are reported under `failed` / `failedIds` / `errors`.
+
+A partial install is crash-safe: re-running `me pack install` with the same pack file picks up where the previous run left off. The step-3 search finds the inserted memories as already-at-this-version (idempotent), and the missing ids are filled in. The text output adds a `└ N failed (chunk error — re-run to retry)` line and a `clack.log.error` block with per-chunk error detail when this happens.
 
 ### Example
 

@@ -28,25 +28,35 @@ See [File Formats](../formats.md) for full schema documentation, examples, and f
 {
   "imported": 2,
   "skipped": 1,
+  "failed": 0,
   "ids": [
     "0194a000-0001-7000-8000-000000000001",
     "0194a000-0002-7000-8000-000000000002"
   ],
   "skippedIds": [
     "0194a000-0003-7000-8000-000000000003"
-  ]
+  ],
+  "errors": []
 }
 ```
 
 | Field | Type | Description |
 |-------|------|-------------|
 | `imported` | `number` | Number of memories successfully imported on this call. |
 | `skipped` | `number` | Number of memories whose explicit `id` already existed in the engine. Always present (may be `0`). |
+| `failed` | `number` | Number of memories in chunks whose `batchCreate` request failed (network or server error). Always present (may be `0`). |
 | `ids` | `string[]` | UUIDs of the memories actually inserted on this call. |
 | `skippedIds` | `string[]` | The explicit ids that were skipped because they already existed. Always present (may be empty). Inspect any of these with `me_memory_get` to see what's there. |
+| `errors` | `Array<{ chunkIndex, itemCount, ids, error }>` | One entry per failed chunk. Always present (may be empty). |
 
 The tool is idempotent for memories with explicit ids: re-calling with the same arguments leaves the engine in the same state, with all previously-imported ids appearing in `skippedIds` instead of `ids`. Memories submitted without an explicit `id` get a server-generated UUIDv7 and never collide.
 
+### Chunking and partial failures
+
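+Large imports are sliced into multiple `batchCreate` requests under the hood to fit under the server's request-body limit. Chunks are sent sequentially. If a chunk fails, siblings are not affected -- the successful chunks still land. The failed chunk's items are reported under `failed`/`errors`, and re-calling with the same arguments will pick up where the previous call left off for memories with explicit ids (already-inserted ids are skipped, missing ids are inserted). Memories submitted without an explicit `id` never collide, so any that landed in a successful chunk will be inserted again on a retry; resubmit only the failed items in that case.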
+
+The tool throws only when **every** chunk fails (total failure). For mixed outcomes it returns the partial-success detail above so the caller can decide how to react.
+
 ## Examples
 
 ### Import from file (preferred)

@@ -0,0 +1,215 @@
+/**
+ * Tests for the byte-aware chunker in `chunk.ts`.
+ */
+import { describe, expect, test } from "bun:test";
+import type { MemoryCreateParams } from "@memory.build/protocol/engine";
+import {
+  approxMemoryBytes,
+  type BatchCreateClient,
+  batchCreateChunked,
+  chunkByBytes,
+} from "./chunk.ts";
+
+describe("chunkByBytes", () => {
+  // Size function used throughout: one character counts as one byte.
+  const byLength = (item: string): number => item.length;
+
+  // Run the chunker over `items` with the given limits and materialize
+  // every yielded chunk into a plain array for comparison.
+  const chunksOf = (items: string[], maxBytes: number, maxCount: number) =>
+    Array.from(chunkByBytes(items, maxBytes, maxCount, byLength));
+
+  test("returns a single chunk when everything fits the budget", () => {
+    const expected = [["aa", "bb", "cc"]];
+    expect(chunksOf(["aa", "bb", "cc"], 100, 1000)).toEqual(expected);
+  });
+
+  test("cuts a new chunk when adding the next item would overflow the byte budget", () => {
+    // The budget is 6 and every item is 4 bytes, so any pair (8 bytes)
+    // overflows: each item ends up in a chunk of its own.
+    const expected = [["aaaa"], ["bbbb"], ["cccc"]];
+    expect(chunksOf(["aaaa", "bbbb", "cccc"], 6, 1000)).toEqual(expected);
+  });
+
+  test("packs as many items as fit before cutting", () => {
+    // Two 2-byte items total 4 (within the budget of 5); a third would
+    // make 6, so the chunk closes after 'bb' and a new one opens at 'cc'.
+    const expected = [
+      ["aa", "bb"],
+      ["cc", "dd"],
+    ];
+    expect(chunksOf(["aa", "bb", "cc", "dd"], 5, 1000)).toEqual(expected);
+  });
+
+  test("cuts a new chunk when count cap is hit before byte budget", () => {
+    // The byte budget (999) is never reached here; the count cap of 2 is
+    // what forces each cut.
+    const expected = [["a", "b"], ["c", "d"], ["e"]];
+    expect(chunksOf(["a", "b", "c", "d", "e"], 999, 2)).toEqual(expected);
+  });
+
+  test("yields an oversized item alone instead of dropping it", () => {
+    const oversized = "x".repeat(100);
+    // 'aa' fits; the 100-byte item cannot join it, so it is emitted in a
+    // chunk of its own even though it exceeds the budget by itself; 'bb'
+    // then starts a fresh chunk.
+    const expected = [["aa"], [oversized], ["bb"]];
+    expect(chunksOf(["aa", oversized, "bb"], 10, 1000)).toEqual(expected);
+  });
+
+  test("returns no chunks for empty input", () => {
+    expect(chunksOf([], 100, 1000)).toEqual([]);
+  });
+});
+
+describe("approxMemoryBytes", () => {
+  test("scales with content length", () => {
+    const baseline = approxMemoryBytes({ content: "hi", tree: "t" });
+    const inflated = approxMemoryBytes({
+      content: "x".repeat(10_000),
+      tree: "t",
+    });
+    // Roughly 10k extra content characters must register as more than 9k
+    // extra estimated bytes.
+    const floor = baseline + 9_000;
+    expect(inflated).toBeGreaterThan(floor);
+  });
+
+  test("includes meta and id contribution", () => {
+    const bare = approxMemoryBytes({ content: "x", tree: "t" });
+    const withIdAndMeta = approxMemoryBytes({
+      id: "00000000-0000-7000-8000-000000000001",
+      content: "x",
+      tree: "t",
+      meta: { source_session_id: "abc", source_message_id: "def" },
+    });
+    expect(withIdAndMeta).toBeGreaterThan(bare);
+  });
+
+  test("counts UTF-8 bytes, not UTF-16 code units, for non-ASCII content", () => {
+    // Both strings have a JS .length of 3, yet "日本語" encodes to 9 UTF-8
+    // bytes (3 per character) against 3 for "abc". An estimator built on
+    // String.length would score the two identically, under-counting about
+    // 6 bytes of wire weight per such memory and quietly eroding the
+    // headroom under the 1 MiB cap.
+    const asciiSize = approxMemoryBytes({ content: "abc", tree: "t" });
+    const cjkSize = approxMemoryBytes({ content: "日本語", tree: "t" });
+    const floor = asciiSize + 5;
+    expect(cjkSize).toBeGreaterThan(floor);
+  });
+});
+
+describe("batchCreateChunked", () => {
+  /**
+   * Build a memory with the given `id`, tree "t", and `contentBytes`
+   * characters of ASCII "x" as content. The byte budget is not
+   * overridable from these tests, so the ones that need more than one
+   * chunk pass 700_000 here: two such memories cannot fit together under
+   * the 768 KiB default budget, so each is sent in its own chunk.
+   */
+  const mem = (id: string, contentBytes = 1): MemoryCreateParams => ({
+    id,
+    content: "x".repeat(contentBytes),
+    tree: "t",
+  });
+
+  /** Minimal stub client; the test supplies the per-call behavior. */
+  const stubClient = (
+    handler: (memories: MemoryCreateParams[]) => Promise<{ ids: string[] }>,
+  ): BatchCreateClient => ({
+    memory: { batchCreate: ({ memories }) => handler(memories) },
+  });
+
+  test("single chunk, all succeed", async () => {
+    const calls: number[] = [];
+    const client = stubClient(async (memories) => {
+      calls.push(memories.length);
+      return { ids: memories.map((m) => m.id ?? "auto") };
+    });
+    const result = await batchCreateChunked(client, [mem("a"), mem("b")]);
+    expect(result.insertedIds).toEqual(["a", "b"]);
+    expect(result.failedIds).toEqual([]);
+    expect(result.errors).toEqual([]);
+    expect(calls).toEqual([2]); // single batchCreate call
+  });
+
+  test("two chunks succeed, insertedIds accumulate across chunks", async () => {
+    // Two 700_000-byte memories together far exceed the 768 KiB default
+    // budget, so each must travel in its own chunk. (A big + tiny pair
+    // would fit in a single request and never exercise accumulation.)
+    const calls: number[] = [];
+    const client = stubClient(async (memories) => {
+      calls.push(memories.length);
+      return { ids: memories.map((m) => m.id ?? "auto") };
+    });
+    const result = await batchCreateChunked(client, [
+      mem("first", 700_000),
+      mem("second", 700_000),
+    ]);
+    // Prove the input really was split: one batchCreate call per chunk.
+    expect(calls).toEqual([1, 1]);
+    // Sort a copy so the assertion never mutates the returned array.
+    expect([...result.insertedIds].sort()).toEqual(["first", "second"]);
+    expect(result.failedIds).toEqual([]);
+    expect(result.errors).toEqual([]);
+  });
+
+  test("second chunk fails: insertedIds from first only, failedIds from second", async () => {
+    const big1 = mem("a", 700_000);
+    const big2 = mem("b", 700_000);
+    let call = 0;
+    const client = stubClient(async (memories) => {
+      call++;
+      if (call === 2) throw new Error("server boom");
+      return { ids: memories.map((m) => m.id ?? "auto") };
+    });
+    const result = await batchCreateChunked(client, [big1, big2]);
+    expect(result.insertedIds).toEqual(["a"]);
+    expect(result.failedIds).toEqual(["b"]);
+    expect(result.errors).toHaveLength(1);
+    expect(result.errors[0]).toMatchObject({
+      chunkIndex: 1,
+      itemCount: 1,
+      ids: ["b"],
+      error: "server boom",
+    });
+  });
+
+  test("all chunks fail: insertedIds empty, failedIds covers all explicit ids", async () => {
+    const big1 = mem("a", 700_000);
+    const big2 = mem("b", 700_000);
+    const client = stubClient(async () => {
+      throw new Error("network down");
+    });
+    const result = await batchCreateChunked(client, [big1, big2]);
+    expect(result.insertedIds).toEqual([]);
+    // Sort a copy so the assertion never mutates the returned array.
+    expect([...result.failedIds].sort()).toEqual(["a", "b"]);
+    expect(result.errors).toHaveLength(2);
+    expect(result.errors[0]?.chunkIndex).toBe(0);
+    expect(result.errors[1]?.chunkIndex).toBe(1);
+  });
+
+  test("server returns shorter ids than requested (simulating ON CONFLICT)", async () => {
+    // Mimics post-#64 server behavior: caller submits 3 memories, server
+    // inserts 2 (one was a duplicate id, dropped by ON CONFLICT). The
+    // helper should faithfully report the 2 inserted; classifying the
+    // missing one as "skipped" is the caller's job.
+    const client = stubClient(async (memories) => ({
+      ids: memories.map((m) => m.id ?? "auto").filter((id) => id !== "dup"), // server "drops" the dup id
+    }));
+    const result = await batchCreateChunked(client, [
+      mem("a"),
+      mem("dup"),
+      mem("b"),
+    ]);
+    expect(result.insertedIds).toEqual(["a", "b"]);
+    expect(result.failedIds).toEqual([]); // no chunk failed
+    expect(result.errors).toEqual([]);
+  });
+
+  test("empty input never calls the server", async () => {
+    let calls = 0;
+    const client = stubClient(async () => {
+      calls++;
+      return { ids: [] };
+    });
+    const result = await batchCreateChunked(client, []);
+    expect(result.insertedIds).toEqual([]);
+    expect(result.failedIds).toEqual([]);
+    expect(result.errors).toEqual([]);
+    expect(calls).toBe(0);
+  });
+});