2026-06-07 09:16:27 +00:00
11 changed files with 363 additions and 1 deletions
@@ -0,0 +1,18 @@
+---
+"@united-workforce/util-agent": minor
+"@united-workforce/agent-mock": patch
+"@united-workforce/agent-builtin": patch
+"@united-workforce/agent-hermes": patch
+"@united-workforce/agent-claude-code": patch
+---
+
+feat(util-agent): extend AgentOptions with `fork` / `cleanup` and add ask-session cache
+
+Phase 2a infrastructure for `step ask`. Extends `AgentOptions` with
+`fork: AgentForkFn | null` and `cleanup: AgentCleanupFn | null` fields, exporting
+the new `AgentForkFn` and `AgentCleanupFn` type aliases. Adds `getAskSessionId` /
+`setAskSessionId` to the per-agent session cache, using `<stepHash>:ask` keys
+that share the cache file with exec sessions (`<threadId>:<role>` keys) without
+collision. All four adapters (mock, builtin, hermes, claude-code) now pass
+`fork: null, cleanup: null` — real implementations land in Phase 2b. Resolves
+issue #145.
@@ -167,5 +167,7 @@ export function createBuiltinAgent(): () => Promise<void> {
    name: "builtin",
    run: runBuiltin,
    continue: continueBuiltin,
+    fork: null,
+    cleanup: null,
  });
 }
@@ -253,5 +253,7 @@ export function createClaudeCodeAgent(model: string | null): () => Promise<void>
    name: "claude-code",
    run: (ctx) => runClaudeCode(ctx, model),
    continue: (sessionId, message, store) => continueClaudeCode(sessionId, message, store, model),
+    fork: null,
+    cleanup: null,
  });
 }
@@ -246,6 +246,8 @@ export function createHermesAgent(resumeDisabled: boolean): () => Promise<void>
    name: "hermes",
    run: runHermes,
    continue: continueHermes,
+    fork: null,
+    cleanup: null,
  });

  // Wrap to ensure ACP client is closed after agent completes,
@@ -125,5 +125,7 @@ export function createMockAgent(mockDataPath: string): () => Promise<void> {
    name: "mock",
    run,
    continue: continueRun,
+    fork: null,
+    cleanup: null,
  });
 }
@@ -0,0 +1,60 @@
+import { readFile } from "node:fs/promises";
+import { join } from "node:path";
+import { describe, expect, test } from "vitest";
+
+/**
+ * Source-level verification that each adapter's `createAgent({...})` call
+ * includes the new `fork: null` and `cleanup: null` fields.
+ *
+ * Adapters are CLI binaries that spawn external processes — runtime testing
+ * requires real LLM environments — so we use static source inspection here.
+ * Type-level correctness is enforced separately by `tsc --build`.
+ */
+
+const REPO_ROOT = join(__dirname, "..", "..", "..");
+
+const ADAPTERS: Array<{ name: string; path: string }> = [
+  { name: "agent-mock", path: "packages/agent-mock/src/mock-agent.ts" },
+  { name: "agent-builtin", path: "packages/agent-builtin/src/agent.ts" },
+  { name: "agent-hermes", path: "packages/agent-hermes/src/hermes.ts" },
+  { name: "agent-claude-code", path: "packages/agent-claude-code/src/claude-code.ts" },
+];
+
+/** Find the matching `}` for the `{` at `openIdx` in `source`. */
+function findMatchingBrace(source: string, openIdx: number): number {
+  let depth = 0;
+  for (let i = openIdx; i < source.length; i++) {
+    const ch = source[i];
+    if (ch === "{") {
+      depth++;
+    } else if (ch === "}") {
+      depth--;
+      if (depth === 0) {
+        return i;
+      }
+    }
+  }
+  return -1;
+}
+
+/** Extract the `createAgent({...})` block from adapter source. */
+function extractCreateAgentBlock(source: string): string {
+  const startIdx = source.indexOf("createAgent({");
+  expect(startIdx).toBeGreaterThanOrEqual(0);
+  const openIdx = source.indexOf("{", startIdx);
+  const endIdx = findMatchingBrace(source, openIdx);
+  expect(endIdx).toBeGreaterThan(openIdx);
+  return source.slice(openIdx, endIdx + 1);
+}
+
+describe("adapter createAgent calls include fork: null and cleanup: null", () => {
+  for (const adapter of ADAPTERS) {
+    test(`${adapter.name} createAgent call includes fork: null and cleanup: null`, async () => {
+      const source = await readFile(join(REPO_ROOT, adapter.path), "utf8");
+      expect(source).toMatch(/createAgent\s*\(\s*\{/);
+      const block = extractCreateAgentBlock(source);
+      expect(block).toMatch(/fork:\s*null/);
+      expect(block).toMatch(/cleanup:\s*null/);
+    });
+  }
+});
@@ -0,0 +1,78 @@
+import type { Store } from "@ocas/core";
+import { describe, expect, test } from "vitest";
+
+import type {
+  AgentCleanupFn,
+  AgentContext,
+  AgentContinueFn,
+  AgentForkFn,
+  AgentOptions,
+  AgentRunFn,
+} from "../src/types.js";
+
+const makeRun: AgentRunFn = async (_ctx: AgentContext) => ({
+  output: "",
+  detailHash: "",
+  sessionId: "",
+  assembledPrompt: "",
+  usage: null,
+});
+
+const makeContinue: AgentContinueFn = async (_sessionId, _message, _store) => ({
+  output: "",
+  detailHash: "",
+  sessionId: "",
+  assembledPrompt: "",
+  usage: null,
+});
+
+describe("AgentOptions fork/cleanup", () => {
+  test("AgentOptions accepts fork and cleanup as null", () => {
+    const opts: AgentOptions = {
+      name: "test",
+      run: makeRun,
+      continue: makeContinue,
+      fork: null,
+      cleanup: null,
+    };
+    expect(opts.name).toBe("test");
+    expect(opts.run).toBe(makeRun);
+    expect(opts.continue).toBe(makeContinue);
+    expect(opts.fork).toBeNull();
+    expect(opts.cleanup).toBeNull();
+  });
+
+  test("AgentOptions accepts real fork and cleanup functions", () => {
+    const fork: AgentForkFn = async (sessionId, _store) => `${sessionId}-forked`;
+    const cleanup: AgentCleanupFn = async () => {
+      /* no-op */
+    };
+    const opts: AgentOptions = {
+      name: "test",
+      run: makeRun,
+      continue: makeContinue,
+      fork,
+      cleanup,
+    };
+    expect(typeof opts.fork).toBe("function");
+    expect(typeof opts.cleanup).toBe("function");
+  });
+
+  test("AgentForkFn signature accepts (sessionId: string, store: Store) and returns Promise<string>", async () => {
+    const fork: AgentForkFn = async (sessionId, _store) => `${sessionId}-child`;
+    // Cast a placeholder Store — only the signature shape matters for this test.
+    const fakeStore = {} as Store;
+    const result = await fork("session-abc", fakeStore);
+    expect(result).toBe("session-abc-child");
+  });
+
+  test("AgentCleanupFn signature accepts no args and returns Promise<void>", async () => {
+    let called = false;
+    const cleanup: AgentCleanupFn = async () => {
+      called = true;
+    };
+    const result = await cleanup();
+    expect(result).toBeUndefined();
+    expect(called).toBe(true);
+  });
+});
@@ -0,0 +1,131 @@
+import { mkdir, readFile, rm, writeFile } from "node:fs/promises";
+import { dirname, join } from "node:path";
+import type { ThreadId } from "@united-workforce/protocol";
+import { afterEach, beforeEach, describe, expect, test } from "vitest";
+
+import {
+  getAskSessionId,
+  getCachedSessionId,
+  getCachePath,
+  setAskSessionId,
+  setCachedSessionId,
+} from "../src/session-cache.js";
+import { getDefaultStorageRoot } from "../src/storage.js";
+
+describe("session-cache ask sessions", () => {
+  let testStorageRoot: string;
+
+  beforeEach(async () => {
+    testStorageRoot = join(
+      getDefaultStorageRoot(),
+      "test-cache",
+      `ask-${Date.now()}-${Math.random()}`,
+    );
+    await mkdir(testStorageRoot, { recursive: true });
+  });
+
+  afterEach(async () => {
+    await rm(testStorageRoot, { recursive: true, force: true });
+  });
+
+  const stepHash = "ABCDEFG1234567";
+
+  test("getAskSessionId returns null when no ask session cached", async () => {
+    const session = await getAskSessionId("claude-code", stepHash, testStorageRoot);
+    expect(session).toBeNull();
+  });
+
+  test("setAskSessionId + getAskSessionId round-trip", async () => {
+    await setAskSessionId("claude-code", stepHash, "ask-session-123", testStorageRoot);
+    const session = await getAskSessionId("claude-code", stepHash, testStorageRoot);
+    expect(session).toBe("ask-session-123");
+  });
+
+  test("ask cache keys use stepHash:ask format", async () => {
+    await setAskSessionId("claude-code", stepHash, "ask-session-456", testStorageRoot);
+
+    const cachePath = getCachePath("claude-code", testStorageRoot);
+    const content = JSON.parse(await readFile(cachePath, "utf8")) as Record<string, string>;
+
+    expect(content).toHaveProperty(`${stepHash}:ask`, "ask-session-456");
+  });
+
+  test("exec cache and ask cache coexist in same file", async () => {
+    const threadId = "01234567890123456789012345" as ThreadId;
+    const role = "developer";
+
+    await setCachedSessionId("claude-code", threadId, role, "exec-session", testStorageRoot);
+    await setAskSessionId("claude-code", stepHash, "ask-session", testStorageRoot);
+
+    const cachePath = getCachePath("claude-code", testStorageRoot);
+    const content = JSON.parse(await readFile(cachePath, "utf8")) as Record<string, string>;
+
+    expect(content).toHaveProperty(`${threadId}:${role}`, "exec-session");
+    expect(content).toHaveProperty(`${stepHash}:ask`, "ask-session");
+
+    expect(await getCachedSessionId("claude-code", threadId, role, testStorageRoot)).toBe(
+      "exec-session",
+    );
+    expect(await getAskSessionId("claude-code", stepHash, testStorageRoot)).toBe("ask-session");
+  });
+
+  test("updating ask session does not affect exec session", async () => {
+    const threadId = "01234567890123456789012345" as ThreadId;
+    const role = "developer";
+
+    await setCachedSessionId("claude-code", threadId, role, "exec-original", testStorageRoot);
+    await setAskSessionId("claude-code", stepHash, "ask-original", testStorageRoot);
+
+    await setAskSessionId("claude-code", stepHash, "ask-updated", testStorageRoot);
+
+    expect(await getCachedSessionId("claude-code", threadId, role, testStorageRoot)).toBe(
+      "exec-original",
+    );
+    expect(await getAskSessionId("claude-code", stepHash, testStorageRoot)).toBe("ask-updated");
+  });
+
+  test("updating exec session does not affect ask session", async () => {
+    const threadId = "01234567890123456789012345" as ThreadId;
+    const role = "developer";
+
+    await setAskSessionId("claude-code", stepHash, "ask-original", testStorageRoot);
+    await setCachedSessionId("claude-code", threadId, role, "exec-original", testStorageRoot);
+
+    await setCachedSessionId("claude-code", threadId, role, "exec-updated", testStorageRoot);
+
+    expect(await getAskSessionId("claude-code", stepHash, testStorageRoot)).toBe("ask-original");
+    expect(await getCachedSessionId("claude-code", threadId, role, testStorageRoot)).toBe(
+      "exec-updated",
+    );
+  });
+
+  test("different stepHashes have independent ask sessions", async () => {
+    const stepHashA = "AAAAAAA1234567";
+    const stepHashB = "BBBBBBB1234567";
+
+    await setAskSessionId("claude-code", stepHashA, "session-A", testStorageRoot);
+    await setAskSessionId("claude-code", stepHashB, "session-B", testStorageRoot);
+
+    expect(await getAskSessionId("claude-code", stepHashA, testStorageRoot)).toBe("session-A");
+    expect(await getAskSessionId("claude-code", stepHashB, testStorageRoot)).toBe("session-B");
+  });
+
+  test("ask session for one agent does not leak to another", async () => {
+    await setAskSessionId("claude-code", stepHash, "cc-ask-session", testStorageRoot);
+
+    const ccSession = await getAskSessionId("claude-code", stepHash, testStorageRoot);
+    const hermesSession = await getAskSessionId("hermes", stepHash, testStorageRoot);
+
+    expect(ccSession).toBe("cc-ask-session");
+    expect(hermesSession).toBeNull();
+  });
+
+  test("empty string ask session treated as missing", async () => {
+    const cachePath = getCachePath("claude-code", testStorageRoot);
+    await mkdir(dirname(cachePath), { recursive: true });
+    await writeFile(cachePath, JSON.stringify({ [`${stepHash}:ask`]: "" }), "utf8");
+
+    const session = await getAskSessionId("claude-code", stepHash, testStorageRoot);
+    expect(session).toBeNull();
+  });
+});
@@ -14,12 +14,20 @@ export type { FrontmatterFastPathResult } from "./frontmatter.js";
 export { tryFrontmatterFastPath } from "./frontmatter.js";
 export { buildFrontmatterRetryPrompt } from "./frontmatter-retry-prompt.js";
 export { createAgent, parseArgv } from "./run.js";
-export { getCachedSessionId, getCachePath, setCachedSessionId } from "./session-cache.js";
+export {
+  getAskSessionId,
+  getCachedSessionId,
+  getCachePath,
+  setAskSessionId,
+  setCachedSessionId,
+} from "./session-cache.js";
 export { getConfigPath, getEnvPath, loadWorkflowConfig, resolveStorageRoot } from "./storage.js";
 export type {
  AdapterOutput,
+  AgentCleanupFn,
  AgentContext,
  AgentContinueFn,
+  AgentForkFn,
  AgentOptions,
  AgentRunFn,
  AgentRunResult,
@@ -14,6 +14,10 @@ function cacheKey(threadId: ThreadId, role: string): string {
  return `${threadId}:${role}`;
 }

+function askCacheKey(stepHash: string): string {
+  return `${stepHash}:ask`;
+}
+
 function isRecord(value: unknown): value is Record<string, unknown> {
  return typeof value === "object" && value !== null && !Array.isArray(value);
 }
@@ -86,3 +90,33 @@ export async function setCachedSessionId(
  cache[cacheKey(threadId, role)] = sessionId;
  await writeCache(agentName, storageRoot, cache);
 }
+
+/**
+ * Read the cached ask-session ID for a stepHash.
+ *
+ * Ask sessions are forked side conversations spawned by `step ask` from a
+ * specific completed step. They share the per-agent cache file with exec
+ * sessions but use the `<stepHash>:ask` key shape so the two namespaces
+ * never collide.
+ */
+export async function getAskSessionId(
+  agentName: string,
+  stepHash: string,
+  storageRoot: string,
+): Promise<string | null> {
+  const cache = await readCache(agentName, storageRoot);
+  const sessionId = cache[askCacheKey(stepHash)];
+  return sessionId ?? null;
+}
+
+/** Write the ask-session ID for a stepHash into the cache. */
+export async function setAskSessionId(
+  agentName: string,
+  stepHash: string,
+  sessionId: string,
+  storageRoot: string,
+): Promise<void> {
+  const cache = await readCache(agentName, storageRoot);
+  cache[askCacheKey(stepHash)] = sessionId;
+  await writeCache(agentName, storageRoot, cache);
+}
@@ -50,6 +50,21 @@ export type AgentContinueFn = (

 export type AgentRunFn = (ctx: AgentContext) => Promise<AgentRunResult>;

+/**
+ * Fork an existing agent session, returning a new session ID that branches
+ * from the source session's state. Used by `step ask` (Phase 2a infrastructure)
+ * to spawn a side conversation from a completed step's session without
+ * polluting the original session's history.
+ */
+export type AgentForkFn = (sessionId: string, store: AgentContext["store"]) => Promise<string>;
+
+/**
+ * Clean up adapter-level resources (e.g. close ACP client, kill subprocesses).
+ * Invoked by the agent CLI factory after the run completes — regardless of
+ * success or failure — so adapters can release I/O handles deterministically.
+ */
+export type AgentCleanupFn = () => Promise<void>;
+
 export type AdapterOutput = {
  stepHash: string;
  detailHash: string;
@@ -65,4 +80,14 @@ export type AgentOptions = {
  name: string;
  run: AgentRunFn;
  continue: AgentContinueFn;
+  /**
+   * Optional session-fork hook. null means the adapter does not yet support
+   * `step ask` (Phase 2a placeholder — wired up in Phase 2b).
+   */
+  fork: AgentForkFn | null;
+  /**
+   * Optional cleanup hook invoked after the agent CLI completes. null means
+   * the adapter has no resources to release.
+   */
+  cleanup: AgentCleanupFn | null;
 };