feat: @uncaged/workflow-role-llm — role factory + zod@4 schema

Migrated from nerve/workflow-utils: - createRole with zod@4 schema → typed meta + JSON Schema - createLlmAdapter — LLM provider abstraction - llmExtract/llmExtractWithRetry — structured output extraction - decorateRole/withDryRun/onFail — role decorators - buildDescriptorFromRoles — auto-generate descriptor from zod schemas - Zero nerve-core dependencies - 83 tests pass, biome clean Closes #9 小橘 <xiaoju@shazhou.work>
2026-05-06 06:50:19 +00:00
parent 3467b772e6
commit c2a8f2d81b
16 changed files with 1311 additions and 1 deletions
@@ -0,0 +1,74 @@
 import { describe, expect, test } from "bun:test";
 import { validateWorkflowDescriptor } from "@uncaged/workflow";
 import * as z from "zod/v4";
 import { buildDescriptorFromRoles } from "../src/build-descriptor.js";
 // Suite for buildDescriptorFromRoles: checks the emitted descriptor validates, that a null
 // role description becomes "", and that a key/name mismatch is rejected.
 describe("buildDescriptorFromRoles", () => {
  test("produces a descriptor that validates and includes JSON schemas per role", () => {
    const analystSchema = z.object({
      title: z.string(),
      count: z.number(),
    });
    const built = buildDescriptorFromRoles({
      description: "Demo workflow",
      roles: {
        analyst: { name: "analyst", schema: analystSchema, description: "Analyzes input" },
      },
    });
    const outcome = validateWorkflowDescriptor(built);
    expect(outcome.ok).toBe(true);
    if (!outcome.ok) {
      return;
    }
    expect(outcome.value.description).toBe("Demo workflow");
    const analystRole = outcome.value.roles.analyst;
    expect(analystRole.description).toBe("Analyzes input");
    expect(analystRole.schema.type).toBe("object");
    const properties = analystRole.schema.properties as Record<string, unknown>;
    expect(properties.title).toMatchObject({ type: "string" });
    expect(properties.count).toMatchObject({ type: "number" });
  });
  test("uses empty description when spec.description is null", () => {
    const built = buildDescriptorFromRoles({
      description: "W",
      roles: {
        x: { name: "x", schema: z.object({ n: z.number() }), description: null },
      },
    });
    const outcome = validateWorkflowDescriptor(built);
    expect(outcome.ok).toBe(true);
    if (!outcome.ok) {
      return;
    }
    expect(outcome.value.roles.x.description).toBe("");
  });
  test("throws when role key and spec.name diverge", () => {
    // Key "a" deliberately disagrees with name "b".
    const buildMismatched = () =>
      buildDescriptorFromRoles({
        description: "W",
        roles: {
          a: { name: "b", schema: z.object({ n: z.number() }), description: null },
        },
      });
    expect(buildMismatched).toThrow(/must match spec.name/);
  });
 });
@@ -0,0 +1,64 @@
 import { describe, expect, test } from "bun:test";
 import { START, type ThreadContext } from "@uncaged/workflow";
 import { createLlmAdapter } from "../src/create-llm-adapter.js";
 /** Builds a step-less thread context whose start frame carries `userContent`. */
 function makeCtx(userContent: string): ThreadContext {
  const start: ThreadContext["start"] = {
    role: START,
    content: userContent,
    meta: { maxRounds: 10 },
    timestamp: 1,
  };
  return { start, steps: [] };
 }
 // Suite for createLlmAdapter. Every test replaces globalThis.fetch with a stub and restores
 // the real implementation in `finally`, so a throwing adapter call cannot leak the stub into
 // later tests.
 describe("createLlmAdapter", () => {
  const originalFetch = globalThis.fetch;
  const provider = { baseUrl: "https://api.example/v1", apiKey: "k", model: "m" };
  test("posts system + user (start.content) and returns assistant text", async () => {
    // Collected in an array (not a reassigned `let`) so the type checker keeps the element type.
    const sentBodies: string[] = [];
    globalThis.fetch = (_input: RequestInfo | URL, init?: RequestInit) => {
      sentBodies.push(String(init?.body));
      return Promise.resolve(
        new Response(JSON.stringify({ choices: [{ message: { content: "model reply" } }] }), {
          status: 200,
          headers: { "Content-Type": "application/json" },
        }),
      );
    };
    try {
      const adapter = createLlmAdapter(provider);
      const out = await adapter(makeCtx("trigger text"), "system instructions");
      expect(out).toBe("model reply");
    } finally {
      globalThis.fetch = originalFetch;
    }
    // Verify what the test name promises: system prompt first, then the start frame content.
    expect(sentBodies).toHaveLength(1);
    const sent = JSON.parse(sentBodies[0] ?? "") as { model: string; messages: unknown };
    expect(sent.model).toBe("m");
    expect(sent.messages).toEqual([
      { role: "system", content: "system instructions" },
      { role: "user", content: "trigger text" },
    ]);
  });
  test("throws on non-ok fetch response", async () => {
    globalThis.fetch = () =>
      Promise.resolve(
        new Response("Internal Server Error", {
          status: 500,
          headers: { "Content-Type": "text/plain" },
        }),
      );
    try {
      const adapter = createLlmAdapter(provider);
      await expect(adapter(makeCtx("hi"), "sys")).rejects.toThrow("llm:");
    } finally {
      globalThis.fetch = originalFetch;
    }
  });
  test("throws on fetch network failure", async () => {
    globalThis.fetch = () => Promise.reject(new Error("ECONNREFUSED"));
    try {
      const adapter = createLlmAdapter(provider);
      await expect(adapter(makeCtx("hi"), "sys")).rejects.toThrow();
    } finally {
      globalThis.fetch = originalFetch;
    }
  });
 });
@@ -0,0 +1,156 @@
 import { afterEach, describe, expect, mock, spyOn, test } from "bun:test";
 import type { AgentFn, ThreadContext } from "@uncaged/workflow";
 import { START } from "@uncaged/workflow";
 import * as z from "zod/v4";
 import { createRole } from "../src/create-role.js";
 import * as llmExtract from "../src/llm-extract.js";
 const provider = {
  baseUrl: "https://example.com/v1",
  apiKey: "k",
  model: "m",
 };
 /**
 * Builds a 200 JSON response shaped like a chat completion whose first choice carries a
 * single `extract` tool call with `argsJson` as its raw arguments string.
 */
 function toolCallResponse(argsJson: string): Response {
  const toolCall = { function: { name: "extract", arguments: argsJson } };
  const payload = { choices: [{ message: { tool_calls: [toolCall] } }] };
  return new Response(JSON.stringify(payload), {
    status: 200,
    headers: { "Content-Type": "application/json" },
  });
 }
 /** Builds an empty thread context: blank start content, no steps, timestamp taken at call time. */
 function makeCtx(): ThreadContext {
  const start: ThreadContext["start"] = {
    role: START,
    content: "",
    meta: { maxRounds: 10 },
    timestamp: Date.now(),
  };
  return { start, steps: [] };
 }
 // Suite for createRole: prompt resolution, agent invocation, and how the extract dry-run flag
 // is forwarded. fetch and spies are reset after every test.
 describe("createRole", () => {
  const realFetch = globalThis.fetch;
  /** Makes every fetch resolve with a fresh tool-call response carrying `meta` as arguments. */
  const stubToolCall = (meta: Record<string, unknown>): void => {
    globalThis.fetch = () => Promise.resolve(toolCallResponse(JSON.stringify(meta)));
  };
  afterEach(() => {
    globalThis.fetch = realFetch;
    mock.restore();
  });
  test("runs AgentFn then structured extract", async () => {
    stubToolCall({ n: 3 });
    // The agent echoes its prompt, so content should equal the system prompt.
    const echoPrompt: AgentFn = async (_ctx, prompt) => prompt;
    const role = createRole({
      name: "test",
      schema: z.object({ n: z.number() }),
      systemPrompt: "hello",
      agent: echoPrompt,
      extract: { provider, dryRun: null },
    });
    const { content, meta } = await role(makeCtx());
    expect(content).toBe("hello");
    expect(meta).toEqual({ n: 3 });
  });
  test("passes ThreadContext to AgentFn", async () => {
    stubToolCall({ n: 0 });
    const received: ThreadContext[] = [];
    const recordingAgent: AgentFn = async (ctx, _prompt) => {
      received.push(ctx);
      return "x";
    };
    const role = createRole({
      name: "test",
      schema: z.object({ n: z.number() }),
      systemPrompt: "p",
      agent: recordingAgent,
      extract: { provider, dryRun: null },
    });
    await role(makeCtx());
    expect(received).toHaveLength(1);
    expect(received[0].steps).toEqual([]);
  });
  test("resolves dynamic systemPrompt functions before AgentFn", async () => {
    stubToolCall({ n: 99 });
    const echoPrompt: AgentFn = async (_ctx, prompt) => prompt;
    const role = createRole({
      name: "test",
      schema: z.object({ n: z.number() }),
      systemPrompt: async (ctx) => `rounds=${ctx.steps.length}`,
      agent: echoPrompt,
      extract: { provider, dryRun: null },
    });
    const threadCtx = makeCtx();
    const { content, meta } = await role(threadCtx);
    expect(content).toBe("rounds=0");
    expect(meta).toEqual({ n: 99 });
  });
  test("extract dryRun null runs live extract path", async () => {
    const extractSpy = spyOn(llmExtract, "extractMetaOrThrow").mockResolvedValue({ n: 0 });
    const rawAgent: AgentFn = async () => "raw";
    const role = createRole({
      name: "r1",
      schema: z.object({ n: z.number() }),
      systemPrompt: "p",
      agent: rawAgent,
      extract: { provider, dryRun: null },
    });
    await role(makeCtx());
    // null is normalised to dryRun: false before reaching the extractor.
    expect(extractSpy).toHaveBeenCalledWith(
      "r1",
      "raw",
      expect.anything(),
      expect.objectContaining({ provider, dryRun: false }),
    );
  });
  test("extract.dryRun true uses structured extract dry-run", async () => {
    const extractSpy = spyOn(llmExtract, "extractMetaOrThrow").mockResolvedValue({ n: 0 });
    const rawAgent: AgentFn = async () => "raw";
    const role = createRole({
      name: "r2",
      schema: z.object({ n: z.number() }),
      systemPrompt: "p",
      agent: rawAgent,
      extract: { provider, dryRun: true },
    });
    await role(makeCtx());
    expect(extractSpy).toHaveBeenCalledWith(
      "r2",
      "raw",
      expect.anything(),
      expect.objectContaining({ dryRun: true }),
    );
  });
 });
@@ -0,0 +1,100 @@
 import { describe, expect, test } from "bun:test";
 import type { Role, ThreadContext } from "@uncaged/workflow";
 import { START } from "@uncaged/workflow";
 import { decorateRole, onFail, withDryRun } from "../src/decorators.js";
 /** Meta shape used by the decorator tests: an open record that always carries an `ok` flag. */
 type TestMeta = Record<string, unknown> & { ok: boolean };
 /** Builds an empty thread context (blank start content, no steps) for invoking roles under test. */
 function fakeCtx(): ThreadContext {
  const start: ThreadContext["start"] = {
    role: START,
    content: "",
    meta: { maxRounds: 10 },
    timestamp: Date.now(),
  };
  return { start, steps: [] };
 }
 /** Role fixture that always resolves with content "done" and `ok: true`. */
 const successRole: Role<TestMeta> = async () => {
  return { content: "done", meta: { ok: true } };
 };
 /** Role fixture that always rejects with an `Error("boom")`. */
 const failRole: Role<TestMeta> = async () => {
  const failure = new Error("boom");
  throw failure;
 };
 /** Role fixture that rejects with a bare string, to exercise non-Error handling. */
 const failNonErrorRole: Role<TestMeta> = async () => {
  const failure = "string error";
  throw failure;
 };
 // Suite for withDryRun: the wrapped role is skipped when dryRun is true and invoked otherwise.
 describe("withDryRun", () => {
  test("short-circuits on dry-run", async () => {
    const role = withDryRun<TestMeta>({ label: "test", meta: { ok: true }, dryRun: true })(
      successRole,
    );
    const { content, meta } = await role(fakeCtx());
    expect(content).toBe("[dry-run] test skipped");
    expect(meta).toEqual({ ok: true });
  });
  test("delegates when not dry-run", async () => {
    const role = withDryRun<TestMeta>({ label: "test", meta: { ok: true }, dryRun: false })(
      successRole,
    );
    const { content, meta } = await role(fakeCtx());
    expect(content).toBe("done");
    expect(meta).toEqual({ ok: true });
  });
 });
 // Suite for onFail: successes pass through untouched; any thrown value becomes a structured
 // "<label> failed: <message>" result with the configured fallback meta.
 describe("onFail", () => {
  const guard = () => onFail<TestMeta>({ label: "test", meta: { ok: false } });
  test("passes through on success", async () => {
    const { content, meta } = await guard()(successRole)(fakeCtx());
    expect(content).toBe("done");
    expect(meta).toEqual({ ok: true });
  });
  test("catches Error and returns structured failure", async () => {
    const { content, meta } = await guard()(failRole)(fakeCtx());
    expect(content).toBe("test failed: boom");
    expect(meta).toEqual({ ok: false });
  });
  test("catches non-Error throws", async () => {
    const { content, meta } = await guard()(failNonErrorRole)(fakeCtx());
    expect(content).toBe("test failed: string error");
    expect(meta).toEqual({ ok: false });
  });
 });
 // Suite for decorateRole: composes withDryRun and onFail around a failing role and checks
 // which decorator determines the final result.
 describe("decorateRole", () => {
  /** Wraps failRole with [withDryRun(dryRun), onFail], both labelled "x". */
  const composed = (dryRun: boolean) =>
    decorateRole(failRole, [
      withDryRun<TestMeta>({ label: "x", meta: { ok: true }, dryRun }),
      onFail<TestMeta>({ label: "x", meta: { ok: false } }),
    ]);
  test("applies decorators left-to-right", async () => {
    const { content, meta } = await composed(false)(fakeCtx());
    expect(content).toBe("x failed: boom");
    expect(meta).toEqual({ ok: false });
  });
  test("dry-run short-circuits before onFail", async () => {
    const { content, meta } = await composed(true)(fakeCtx());
    expect(content).toBe("[dry-run] x skipped");
    expect(meta).toEqual({ ok: true });
  });
 });
@@ -0,0 +1,143 @@
 import { describe, expect, test } from "bun:test";
 import * as z from "zod/v4";
 import { llmExtract } from "../src/llm-extract.js";
 // Suite for llmExtract. Every test replaces globalThis.fetch with a stub and restores the real
 // implementation in `finally`, so a throwing call cannot leak the stub into later tests.
 describe("llmExtract", () => {
  const originalFetch = globalThis.fetch;
  test("parses tool call arguments and validates with the zod schema", async () => {
    const schema = z
      .object({
        name: z.string(),
        description: z.string(),
      })
      .describe("Extract sense metadata from plan");
    // Requests are pushed into an array rather than assigned to `let` variables: a `let`
    // initialised to null and only reassigned inside a closure is narrowed to `null` by the
    // type checker at the assertion site.
    const captured: { url: string; init: RequestInit | null }[] = [];
    globalThis.fetch = (input: RequestInfo | URL, init?: RequestInit) => {
      captured.push({
        url: typeof input === "string" ? input : input.toString(),
        init: init ?? null,
      });
      return Promise.resolve(
        new Response(
          JSON.stringify({
            choices: [
              {
                message: {
                  tool_calls: [
                    {
                      function: {
                        name: "extract",
                        arguments: JSON.stringify({
                          name: "cpu-usage",
                          description: "CPU load",
                        }),
                      },
                    },
                  ],
                },
              },
            ],
          }),
          { status: 200, headers: { "Content-Type": "application/json" } },
        ),
      );
    };
    let result: Awaited<ReturnType<typeof llmExtract<z.infer<typeof schema>>>>;
    try {
      result = await llmExtract({
        text: "some plan",
        schema,
        provider: {
          baseUrl: "https://example.com/v1",
          apiKey: "k",
          model: "m",
        },
        dryRun: false,
      });
    } finally {
      globalThis.fetch = originalFetch;
    }
    expect(result.ok).toBe(true);
    if (!result.ok) {
      return;
    }
    expect(result.value).toEqual({ name: "cpu-usage", description: "CPU load" });
    // A single extract attempt issues exactly one request.
    expect(captured).toHaveLength(1);
    const request = captured[0];
    expect(request?.url).toBe("https://example.com/v1/chat/completions");
    expect(request?.init?.method).toBe("POST");
    expect(request?.init?.headers).toMatchObject({
      Authorization: "Bearer k",
      "Content-Type": "application/json",
    });
    const body = JSON.parse(request?.init?.body as string) as {
      model: string;
      tool_choice: { function: { name: string } };
    };
    expect(body.model).toBe("m");
    expect(body.tool_choice.function.name).toBeDefined();
  });
  test("returns schema_validation_failed when arguments do not match the schema", async () => {
    const schema = z.object({ n: z.number() });
    globalThis.fetch = () =>
      Promise.resolve(
        new Response(
          JSON.stringify({
            choices: [
              {
                message: {
                  tool_calls: [
                    { function: { name: "extract", arguments: JSON.stringify({ n: "oops" }) } },
                  ],
                },
              },
            ],
          }),
          { status: 200, headers: { "Content-Type": "application/json" } },
        ),
      );
    let result: Awaited<ReturnType<typeof llmExtract<{ n: number }>>>;
    try {
      result = await llmExtract({
        text: "x",
        schema,
        provider: { baseUrl: "https://example.com", apiKey: "k", model: "m" },
        dryRun: false,
      });
    } finally {
      globalThis.fetch = originalFetch;
    }
    expect(result.ok).toBe(false);
    if (result.ok) {
      return;
    }
    expect(result.error.kind).toBe("schema_validation_failed");
  });
  test("dryRun skips fetch and returns schema-shaped stub values", async () => {
    let calls = 0;
    globalThis.fetch = () => {
      calls += 1;
      return Promise.resolve(new Response("{}", { status: 200 }));
    };
    const schema = z.object({ n: z.number() });
    let result: Awaited<ReturnType<typeof llmExtract<{ n: number }>>>;
    try {
      result = await llmExtract({
        text: "ignored",
        schema,
        provider: { baseUrl: "https://example.com", apiKey: "k", model: "m" },
        dryRun: true,
      });
    } finally {
      globalThis.fetch = originalFetch;
    }
    expect(calls).toBe(0);
    expect(result.ok).toBe(true);
    if (!result.ok) {
      return;
    }
    expect(result.value).toEqual({ n: 0 });
  });
 });
@@ -0,0 +1,15 @@
 {
  "name": "@uncaged/workflow-role-llm",
  "version": "0.1.0",
  "type": "module",
  "main": "src/index.ts",
  "types": "src/index.ts",
  "scripts": {
    "build": "echo 'TODO'",
    "test": "bun test"
  },
  "dependencies": {
    "@uncaged/workflow": "workspace:*",
    "zod": "^4.0.0"
  }
 }
@@ -0,0 +1,38 @@
 import type { WorkflowDescriptor, WorkflowRoleSchema } from "@uncaged/workflow";
 import * as z from "zod/v4";
 /** Per-role input to `buildDescriptorFromRoles`: the role's name, its Zod meta schema and an optional description. */
 export type RoleDescriptorInput<M extends Record<string, unknown> = Record<string, unknown>> = {
  name: string;
  schema: z.ZodType<M>;
  /** Human-readable role description; pass `null` when unknown (emitted as an empty string). */
  description: string | null;
 };
 /** Returns a shallow copy of `json` without its top-level `$schema` key. */
 function stripJsonSchemaMeta(json: Record<string, unknown>): WorkflowRoleSchema {
  const withoutMeta: Record<string, unknown> = { ...json };
  delete withoutMeta.$schema;
  return withoutMeta as WorkflowRoleSchema;
 }
 /**
 * Assembles a {@link WorkflowDescriptor} from a map of role specs. Each role's Zod schema is
 * converted with `z.toJSONSchema` and stored without its `$schema` key; a `null` description
 * is emitted as an empty string.
 *
 * @throws Error when a map key differs from the `name` of the spec stored under it.
 */
 export function buildDescriptorFromRoles(args: {
  description: string;
  roles: Record<string, RoleDescriptorInput>;
 }): WorkflowDescriptor {
  const described: WorkflowDescriptor["roles"] = {};
  Object.entries(args.roles).forEach(([roleKey, roleSpec]) => {
    if (roleKey !== roleSpec.name) {
      throw new Error(
        `buildDescriptorFromRoles: role key "${roleKey}" must match spec.name "${roleSpec.name}"`,
      );
    }
    const jsonSchema = z.toJSONSchema(roleSpec.schema) as Record<string, unknown>;
    const description = roleSpec.description === null ? "" : roleSpec.description;
    described[roleKey] = { description, schema: stripJsonSchemaMeta(jsonSchema) };
  });
  return { description: args.description, roles: described };
 }
@@ -0,0 +1,107 @@
 import { type AgentFn, err, ok, type Result, type ThreadContext } from "@uncaged/workflow";
 import type { LlmMessage, LlmProvider } from "./types.js";
 /**
 * Failure modes of the plain-text chat completion helpers in this module, discriminated by
 * `kind`: transport failure, non-2xx status, unparsable or non-object JSON, a missing/empty
 * `choices` array, or a first choice without string `message.content`.
 */
 export type LlmChatError =
  | { kind: "http_error"; status: number; body: string }
  | { kind: "invalid_response_json"; message: string }
  | { kind: "network_error"; message: string }
  | { kind: "empty_choices" }
  | { kind: "no_assistant_text" };
 /** Appends `/chat/completions` to `baseUrl` after removing any trailing slashes. */
 function chatUrl(baseUrl: string): string {
  const withoutTrailingSlashes = baseUrl.replace(/\/+$/, "");
  return [withoutTrailingSlashes, "chat/completions"].join("/");
 }
 /** Type guard: true for non-null, non-array objects. */
 function isRecord(value: unknown): value is Record<string, unknown> {
  if (value === null || Array.isArray(value)) {
    return false;
  }
  return typeof value === "object";
 }
 /** Serialises a chat error to its JSON text for inclusion in thrown error messages. */
 function formatLlmChatError(e: LlmChatError): string {
  const serialized = JSON.stringify(e);
  return serialized;
 }
 /**
 * POSTs `body` as JSON to the provider's chat-completions endpoint and returns the parsed
 * response JSON.
 *
 * Failures are reported through the result rather than thrown:
 * - `network_error` when `fetch` rejects or the response body cannot be read,
 * - `http_error` for a non-2xx status (body truncated to 4000 characters),
 * - `invalid_response_json` when the body is not valid JSON.
 */
 async function fetchChatJson(
  provider: LlmProvider,
  body: Record<string, unknown>,
 ): Promise<Result<unknown, LlmChatError>> {
  let response: Response;
  let responseText: string;
  try {
    response = await fetch(chatUrl(provider.baseUrl), {
      method: "POST",
      headers: {
        Authorization: `Bearer ${provider.apiKey}`,
        "Content-Type": "application/json",
      },
      body: JSON.stringify(body),
    });
    // Reading the body can also fail (e.g. the connection drops mid-stream); keep it inside
    // the try so that case becomes a network_error result instead of an unhandled throw.
    responseText = await response.text();
  } catch (cause) {
    const message = cause instanceof Error ? cause.message : String(cause);
    return err({ kind: "network_error", message });
  }
  if (!response.ok) {
    return err({ kind: "http_error", status: response.status, body: responseText.slice(0, 4000) });
  }
  let parsed: unknown;
  try {
    parsed = JSON.parse(responseText) as unknown;
  } catch (cause) {
    const message = cause instanceof Error ? cause.message : String(cause);
    return err({ kind: "invalid_response_json", message });
  }
  return ok(parsed);
 }
 /**
 * Pulls `choices[0].message.content` out of a parsed chat-completion payload.
 *
 * Returns `invalid_response_json` for a non-object payload, `empty_choices` when `choices` is
 * missing/empty or its first entry is not an object, and `no_assistant_text` when the message
 * is missing or its content is not a string.
 */
 function parseAssistantText(parsed: unknown): Result<string, LlmChatError> {
  if (!isRecord(parsed)) {
    return err({ kind: "invalid_response_json", message: "Not an object" });
  }
  const { choices } = parsed;
  const hasChoices = Array.isArray(choices) && choices.length > 0;
  const firstChoice: unknown = hasChoices ? choices[0] : undefined;
  if (!isRecord(firstChoice)) {
    return err({ kind: "empty_choices" });
  }
  const assistantMessage = firstChoice.message;
  const text: unknown = isRecord(assistantMessage) ? assistantMessage.content : undefined;
  if (typeof text !== "string") {
    return err({ kind: "no_assistant_text" });
  }
  return ok(text);
 }
 /**
 * Sends `messages` to the provider's model and returns the assistant's text reply, or the
 * first error encountered while fetching or parsing the response.
 */
 export async function chatCompletionText(options: {
  provider: LlmProvider;
  messages: LlmMessage[];
 }): Promise<Result<string, LlmChatError>> {
  const requestBody = { model: options.provider.model, messages: options.messages };
  const fetched = await fetchChatJson(options.provider, requestBody);
  if (fetched.ok) {
    return parseAssistantText(fetched.value);
  }
  return fetched;
 }
 /**
 * Creates a single-turn chat {@link AgentFn}: the prompt it receives is sent as the system
 * message and the thread's start-frame content as the user message. Later steps in the
 * context are not sent.
 *
 * @throws Error prefixed with `llm: ` (followed by the JSON-encoded error) when the chat call fails.
 */
 export function createLlmAdapter(provider: LlmProvider): AgentFn {
  const adapter: AgentFn = async (ctx: ThreadContext, systemPrompt: string) => {
    const messages: LlmMessage[] = [
      { role: "system", content: systemPrompt },
      { role: "user", content: ctx.start.content },
    ];
    const reply = await chatCompletionText({ provider, messages });
    if (reply.ok) {
      return reply.value;
    }
    throw new Error(`llm: ${formatLlmChatError(reply.error)}`);
  };
  return adapter;
 }
@@ -0,0 +1,35 @@
 import type { AgentFn, Role, ThreadContext } from "@uncaged/workflow";
 import type * as z from "zod/v4";
 import { extractMetaOrThrow } from "./llm-extract.js";
 import type { LlmProvider } from "./types.js";
 /** Arguments for `createRole`: role name, meta schema, prompt (static or computed per call), agent, and extract wiring. */
 export type CreateRoleArgs<M extends Record<string, unknown>> = {
  name: string;
  schema: z.ZodType<M>;
  systemPrompt: string | ((ctx: ThreadContext) => Promise<string>);
  agent: AgentFn;
  extract: {
    provider: LlmProvider;
    /** When `true`, structured extract returns schema-shaped defaults. When `false` or `null`, live API extract. */
    dryRun: boolean | null;
  };
 };
 /** Normalises the tri-state extract flag: only an explicit `true` enables dry-run. */
 function resolveExtractDryRun(extractDryRun: boolean | null): boolean {
  const runsLive = extractDryRun !== true;
  return !runsLive;
 }
 /**
 * Creates a {@link Role} that resolves the system prompt (calling it with the context when it
 * is a function), runs the {@link AgentFn} with that prompt, then extracts typed meta from
 * the agent's raw output using the Zod schema. The role returns the raw output as `content`.
 */
 export function createRole<M extends Record<string, unknown>>(args: CreateRoleArgs<M>): Role<M> {
  const role: Role<M> = async (ctx: ThreadContext) => {
    let promptText: string;
    if (typeof args.systemPrompt === "string") {
      promptText = args.systemPrompt;
    } else {
      promptText = await args.systemPrompt(ctx);
    }
    const raw = await args.agent(ctx, promptText);
    const extractOptions = {
      provider: args.extract.provider,
      dryRun: resolveExtractDryRun(args.extract.dryRun),
    };
    const meta = await extractMetaOrThrow(args.name, raw, args.schema, extractOptions);
    return { content: raw, meta };
  };
  return role;
 }
@@ -0,0 +1,63 @@
 import type { Role, ThreadContext } from "@uncaged/workflow";
 /** A role decorator: takes a role and returns an enhanced role with the same meta type `M`. */
 export type RoleDecorator<M extends Record<string, unknown>> = (role: Role<M>) => Role<M>;
 /**
 * Wraps `role` with each decorator in list order: the first decorator wraps the original role
 * (innermost) and the last one ends up outermost. An empty list returns `role` unchanged.
 */
 export function decorateRole<M extends Record<string, unknown>>(
  role: Role<M>,
  decorators: RoleDecorator<M>[],
 ): Role<M> {
  let wrapped = role;
  decorators.forEach((decorate) => {
    wrapped = decorate(wrapped);
  });
  return wrapped;
 }
 /** Options for `withDryRun`. */
 export type WithDryRunOptions<M extends Record<string, unknown>> = {
  /** Used in skip message (e.g. "committer", "publish"). */
  label: string;
  /** Meta returned when dry-run skips execution. */
  meta: M;
  /** Adapter-level dry-run flag (e.g. from extract / wiring config). */
  dryRun: boolean;
 };
 /**
 * Decorator that skips the wrapped role when `opts.dryRun` is true, returning
 * `[dry-run] <label> skipped` with `opts.meta`; otherwise it delegates to the role. The flag
 * is read on every invocation.
 */
 export function withDryRun<M extends Record<string, unknown>>(
  opts: WithDryRunOptions<M>,
 ): RoleDecorator<M> {
  return (role) => async (ctx: ThreadContext) => {
    if (!opts.dryRun) {
      return role(ctx);
    }
    const content = `[dry-run] ${opts.label} skipped`;
    return { content, meta: opts.meta };
  };
 }
 /** Options for `onFail`. */
 export type OnFailOptions<M extends Record<string, unknown>> = {
  /** Used in failure message (e.g. "committer", "publish"). */
  label: string;
  /** Meta returned when the inner role throws. */
  meta: M;
 };
 /**
 * Decorator that turns anything thrown by the wrapped role into a normal result:
 * `<label> failed: <message>` as content (the `Error` message, or `String(value)` for
 * non-Error throws) together with `opts.meta`. Successful results pass through unchanged.
 */
 export function onFail<M extends Record<string, unknown>>(
  opts: OnFailOptions<M>,
 ): RoleDecorator<M> {
  return (role) => async (ctx: ThreadContext) => {
    let thrown: unknown;
    try {
      return await role(ctx);
    } catch (caught) {
      thrown = caught;
    }
    const reason = thrown instanceof Error ? thrown.message : String(thrown);
    return { content: `${opts.label} failed: ${reason}`, meta: opts.meta };
  };
 }
@@ -0,0 +1,22 @@
 // Package entry point: re-exports the descriptor builder, chat adapter, role factory,
 // role decorators, structured-extract helpers, schema defaults and shared types.
 export { buildDescriptorFromRoles, type RoleDescriptorInput } from "./build-descriptor.js";
 export { chatCompletionText, createLlmAdapter, type LlmChatError } from "./create-llm-adapter.js";
 export { type CreateRoleArgs, createRole } from "./create-role.js";
 export {
  decorateRole,
  type OnFailOptions,
  onFail,
  type RoleDecorator,
  type WithDryRunOptions,
  withDryRun,
 } from "./decorators.js";
 export {
  extractMetaOrThrow,
  type LlmError,
  type LlmExtractArgs,
  type LlmProvider,
  llmErrorToCause,
  llmExtract,
  llmExtractWithRetry,
 } from "./llm-extract.js";
 export { schemaDefaults } from "./schema-defaults.js";
 export type { LlmMessage, MetaExtractConfig } from "./types.js";
@@ -0,0 +1,274 @@
 import { err, ok, type Result } from "@uncaged/workflow";
 import * as z from "zod/v4";
 import { schemaDefaults } from "./schema-defaults.js";
 import type { LlmProvider } from "./types.js";
 export type { LlmProvider } from "./types.js";
 /**
 * Arguments for a structured extract call: the source text, the Zod schema the result must
 * satisfy, the provider to call, and a dry-run flag that skips the network call.
 */
 export type LlmExtractArgs<T> = {
  text: string;
  schema: z.ZodType<T>;
  provider: LlmProvider;
  dryRun: boolean;
 };
 /**
 * Failure modes of structured extraction, discriminated by `kind`: transport failure, non-2xx
 * status, unparsable response JSON, a response without a usable tool call, tool arguments that
 * are not valid JSON, or arguments that fail schema validation.
 */
 export type LlmError =
  | { kind: "http_error"; status: number; body: string }
  | { kind: "invalid_response_json"; message: string }
  | { kind: "no_tool_call"; preview: string }
  | { kind: "tool_arguments_invalid_json"; message: string }
  | { kind: "schema_validation_failed"; message: string }
  | { kind: "network_error"; message: string };
 /** Builds the chat-completions endpoint URL, ignoring any trailing slashes on `baseUrl`. */
 function chatCompletionsUrl(baseUrl: string): string {
  const root = baseUrl.replace(/\/+$/, "");
  return root + "/chat/completions";
 }
 /** Type guard for plain-object-like values: rejects primitives, `null` and arrays. */
 function isRecord(value: unknown): value is Record<string, unknown> {
  const isObjectLike = typeof value === "object" && value !== null;
  return isObjectLike && !Array.isArray(value);
 }
 /** Returns a shallow copy of `json` with the top-level `$schema` key removed. */
 function stripJsonSchemaMeta(json: Record<string, unknown>): Record<string, unknown> {
  const copy: Record<string, unknown> = { ...json };
  delete copy.$schema;
  return copy;
 }
 /**
 * Derives the tool (function) name from the schema's `title`, falling back to `"extract"`.
 *
 * OpenAI-compatible APIs only accept function names made of letters, digits, `_` and `-`, at
 * most 64 characters long. A trimmed title that already satisfies this is returned unchanged;
 * otherwise runs of disallowed characters become `_`, leading/trailing `_` are dropped and the
 * result is cut to 64 characters. A missing, non-string, or unusable title yields `"extract"`.
 */
 function readToolName(parametersSchema: Record<string, unknown>): string {
  const fallback = "extract";
  const title = parametersSchema.title;
  if (typeof title !== "string") {
    return fallback;
  }
  const trimmed = title.trim();
  if (/^[a-zA-Z0-9_-]{1,64}$/.test(trimmed)) {
    return trimmed;
  }
  const sanitized = trimmed
    .replace(/[^a-zA-Z0-9_-]+/g, "_")
    .replace(/^_+|_+$/g, "")
    .slice(0, 64);
  return sanitized.length > 0 ? sanitized : fallback;
 }
 /** Uses the schema's trimmed `description` as the tool description, or a generic default when it is absent or blank. */
 function readToolDescription(parametersSchema: Record<string, unknown>): string {
  const { description } = parametersSchema;
  const trimmed = typeof description === "string" ? description.trim() : "";
  if (trimmed.length === 0) {
    return "Extract structured data from the input text.";
  }
  return trimmed;
 }
 /**
 * Walks `choices[0].message.tool_calls[0].function.arguments` in a parsed chat-completion
 * payload and returns the raw arguments string.
 *
 * A non-object payload yields `invalid_response_json`; any missing or mistyped link in the
 * chain yields `no_tool_call` with the first 500 characters of `previewSource` as a preview.
 */
 function readToolArgumentsJson(parsed: unknown, previewSource: string): Result<string, LlmError> {
  if (!isRecord(parsed)) {
    return err({ kind: "invalid_response_json", message: "Top-level JSON is not an object" });
  }
  // Every structural miss below reports the same error; the preview is only sliced on failure.
  const noToolCall = (): Result<string, LlmError> =>
    err({ kind: "no_tool_call", preview: previewSource.slice(0, 500) });

  const choiceList = parsed.choices;
  if (!Array.isArray(choiceList) || choiceList.length === 0) {
    return noToolCall();
  }
  const firstChoice: unknown = choiceList[0];
  if (!isRecord(firstChoice)) {
    return noToolCall();
  }
  const assistantMessage = firstChoice.message;
  if (!isRecord(assistantMessage)) {
    return noToolCall();
  }
  const callList = assistantMessage.tool_calls;
  if (!Array.isArray(callList) || callList.length === 0) {
    return noToolCall();
  }
  const firstCall: unknown = callList[0];
  if (!isRecord(firstCall)) {
    return noToolCall();
  }
  const calledFunction = firstCall.function;
  if (!isRecord(calledFunction)) {
    return noToolCall();
  }
  const rawArguments = calledFunction.arguments;
  return typeof rawArguments === "string" ? ok(rawArguments) : noToolCall();
 }
 /** True for errors the model can plausibly fix on a second attempt: bad tool-argument JSON or a schema mismatch. */
 function isRetryableExtractError(error: LlmError): boolean {
  switch (error.kind) {
    case "schema_validation_failed":
    case "tool_arguments_invalid_json":
      return true;
    default:
      return false;
  }
 }
 /** Renders the error as a one-line hint for the retry prompt; kinds without a tailored message are JSON-encoded. */
 function describeRetryHint(error: LlmError): string {
  switch (error.kind) {
    case "schema_validation_failed":
      return `Schema validation failed: ${error.message}`;
    case "tool_arguments_invalid_json":
      return `Tool arguments were not valid JSON: ${error.message}`;
    default:
      return JSON.stringify(error);
  }
 }
 /**
 * Converts an {@link LlmError} into an `Error`. HTTP errors become `HTTP <status>: <body>`
 * (body cut to 500 characters), missing tool calls become `No tool call in response: <preview>`,
 * and every other kind uses its own `message`.
 */
 export function llmErrorToCause(error: LlmError): Error {
  switch (error.kind) {
    case "http_error":
      return new Error(`HTTP ${error.status}: ${error.body.slice(0, 500)}`);
    case "no_tool_call":
      return new Error(`No tool call in response: ${error.preview}`);
    // The remaining kinds all carry a ready-made message.
    case "invalid_response_json":
    case "tool_arguments_invalid_json":
    case "schema_validation_failed":
    case "network_error":
      return new Error(error.message);
  }
 }
 /**
 * Performs one structured-extract attempt against an OpenAI-compatible chat-completions
 * endpoint, forcing a single tool call whose parameters are the JSON Schema of `options.schema`.
 *
 * `options.userContent` is sent as the user message (it may differ from `options.text` on a
 * retry). When `options.dryRun` is true no request is made and schema-shaped defaults are
 * returned instead.
 *
 * Failures are reported through the result rather than thrown:
 * - `network_error` when `fetch` rejects or the response body cannot be read,
 * - `http_error` for a non-2xx status (body truncated to 4000 characters),
 * - `invalid_response_json` / `no_tool_call` for malformed payloads,
 * - `tool_arguments_invalid_json` when the tool arguments are not valid JSON,
 * - `schema_validation_failed` when the arguments do not satisfy the schema.
 */
 async function performLlmExtract<T>(
  options: LlmExtractArgs<T> & { userContent: string },
 ): Promise<Result<T, LlmError>> {
  if (options.dryRun) {
    return ok(schemaDefaults(options.schema) as T);
  }
  const rawJsonSchema = z.toJSONSchema(options.schema) as Record<string, unknown>;
  const parameters = stripJsonSchemaMeta(rawJsonSchema);
  const toolName = readToolName(parameters);
  const toolDescription = readToolDescription(parameters);
  const body = {
    model: options.provider.model,
    messages: [
      {
        role: "system" as const,
        content: "Extract the requested information from the provided text. Be precise.",
      },
      { role: "user" as const, content: options.userContent },
    ],
    tools: [
      {
        type: "function" as const,
        function: {
          name: toolName,
          description: toolDescription,
          parameters,
        },
      },
    ],
    // Force the model to answer through the extract tool instead of free text.
    tool_choice: { type: "function" as const, function: { name: toolName } },
  };
  let response: Response;
  let responseText: string;
  try {
    response = await fetch(chatCompletionsUrl(options.provider.baseUrl), {
      method: "POST",
      headers: {
        Authorization: `Bearer ${options.provider.apiKey}`,
        "Content-Type": "application/json",
      },
      body: JSON.stringify(body),
    });
    // Reading the body can also fail (e.g. the connection drops mid-stream); keep it inside
    // the try so that case becomes a network_error result instead of an unhandled throw.
    responseText = await response.text();
  } catch (cause) {
    const message = cause instanceof Error ? cause.message : String(cause);
    return err({ kind: "network_error", message });
  }
  if (!response.ok) {
    return err({ kind: "http_error", status: response.status, body: responseText.slice(0, 4000) });
  }
  let parsed: unknown;
  try {
    parsed = JSON.parse(responseText) as unknown;
  } catch (cause) {
    const message = cause instanceof Error ? cause.message : String(cause);
    return err({ kind: "invalid_response_json", message });
  }
  const argsJson = readToolArgumentsJson(parsed, responseText);
  if (!argsJson.ok) {
    return argsJson;
  }
  // Tool arguments arrive as a JSON-encoded string and need their own parse step.
  let argsParsed: unknown;
  try {
    argsParsed = JSON.parse(argsJson.value) as unknown;
  } catch (cause) {
    const message = cause instanceof Error ? cause.message : String(cause);
    return err({ kind: "tool_arguments_invalid_json", message });
  }
  const validated = options.schema.safeParse(argsParsed);
  if (!validated.success) {
    return err({
      kind: "schema_validation_failed",
      message: validated.error.message,
    });
  }
  return ok(validated.data);
 }
 /**
 * Makes one extract attempt (no retry) over OpenAI-compatible chat completions with a forced
 * tool call, sending `options.text` as the user message.
 */
 export async function llmExtract<T>(options: LlmExtractArgs<T>): Promise<Result<T, LlmError>> {
  const { text } = options;
  return performLlmExtract({ ...options, userContent: text });
 }
 /**
 * Runs extract up to two times: on the first schema/tool-args parse failure, resends the agent
 * output plus the error so the model can correct the tool call.
 *
 * A successful first attempt, or a first failure that is not retryable (see
 * `isRetryableExtractError`), is returned as-is. The result of the second attempt is returned
 * unchanged, whether it succeeded or failed.
 */
 export async function llmExtractWithRetry<T>(
  options: LlmExtractArgs<T>,
 ): Promise<Result<T, LlmError>> {
  const first = await performLlmExtract({
    ...options,
    userContent: options.text,
  });
  if (first.ok) {
    return first;
  }
  // Only schema and tool-argument JSON failures are worth a second attempt.
  if (!isRetryableExtractError(first.error)) {
    return first;
  }
  const hint = describeRetryHint(first.error);
  const correction = `The previous extraction attempt failed.
 ${hint}
 Respond again with a single tool call whose \`arguments\` JSON strictly matches the schema.`;
  // Second user message: the original text, a separator line, then the correction request.
  const secondContent = `${options.text}
 ---
 ${correction}`;
  return performLlmExtract({
    ...options,
    userContent: secondContent,
  });
 }
 /**
 * Extracts typed meta from `raw` via {@link llmExtractWithRetry} and returns it.
 *
 * @throws Error naming the role and embedding the JSON-encoded extract error when extraction fails.
 */
 export async function extractMetaOrThrow<T extends Record<string, unknown>>(
  roleName: string,
  raw: string,
  schema: z.ZodType<T>,
  options: { provider: LlmProvider; dryRun: boolean },
 ): Promise<T> {
  const extracted = await llmExtractWithRetry({
    text: raw,
    schema,
    provider: options.provider,
    dryRun: options.dryRun,
  });
  if (extracted.ok) {
    return extracted.value;
  }
  const detail = JSON.stringify(extracted.error);
  throw new Error(`Role "${roleName}": structured extraction failed after retry: ${detail}`);
 }
@@ -0,0 +1,190 @@
 import type * as z from "zod/v4";
 /** Local alias for the zod/v4 base schema type. */
 type ZodTypeAny = z.ZodType;
 /** Shape assumed for a schema's `def` object: arbitrary keys plus a string `type` tag. */
 type Def = Record<string, unknown> & { type: string };
 /** Builds a placeholder value for a schema, given the schema itself and its `def`. */
 type TypeHandler = (schema: ZodTypeAny, def: Def) => unknown;
 /** Type guard: accepts any non-null, non-array value whose `typeof` is "object". */
 function isPlainObject(value: unknown): value is Record<string, unknown> {
  if (value === null || Array.isArray(value)) {
    return false;
  }
  return typeof value === "object";
 }
 /** Reports whether the schema instance's constructor is named "ZodExactOptional". */
 function isZodExactOptional(s: ZodTypeAny): boolean {
  const constructorName = s.constructor.name;
  return constructorName === "ZodExactOptional";
 }
 /** Returns `defaultValue` itself, or the result of calling it when it is a function. */
 function resolveDefaultValue(defaultValue: unknown | (() => unknown)): unknown {
  return typeof defaultValue === "function" ? (defaultValue as () => unknown)() : defaultValue;
 }
 /**
 * Combines the placeholders of an intersection's two sides. When both are plain objects the
 * result is a shallow merge in which `right` wins on key conflicts; otherwise `right` is
 * returned unchanged.
 */
 function mergeIntersection(left: unknown, right: unknown): unknown {
  if (!isPlainObject(left) || !isPlainObject(right)) {
    return right;
  }
  return { ...left, ...right };
 }
 /**
 * Builds a placeholder object from `def.shape`, one entry per shape key. Fields whose def
 * type is "optional" are set to `undefined`, except exact-optional fields, which are left
 * out entirely. Every other field gets the placeholder of its own schema. A missing shape
 * yields an empty object.
 */
 function defaultsForObject(_schema: ZodTypeAny, def: Def): unknown {
  const shape = def.shape as Record<string, ZodTypeAny> | undefined;
  const result: Record<string, unknown> = {};
  if (shape === undefined) {
    return result;
  }
  for (const key of Object.keys(shape)) {
    const field = shape[key];
    const fieldType = (field.def as { type: string }).type;
    if (fieldType !== "optional") {
      result[key] = schemaDefaultsInner(field);
      continue;
    }
    // Exact-optional keys are omitted rather than being present with an `undefined` value.
    if (!isZodExactOptional(field)) {
      result[key] = undefined;
    }
  }
  return result;
 }
 /** Placeholder for a union: the placeholder of `def.options[0]`, or `null` when there are no options. */
 function firstUnionOption(_schema: ZodTypeAny, def: Def): unknown {
  const candidates = def.options as readonly ZodTypeAny[] | undefined;
  return candidates !== undefined && candidates.length !== 0
    ? schemaDefaultsInner(candidates[0])
    : null;
 }
 /** Placeholder for a nullable schema: always `null`; the wrapped schema is not inspected. */
 function defaultsFromNullable(_schema: ZodTypeAny, _def: Def): unknown {
  return null;
 }
 /** Delegates to the schema stored in `def.innerType`; yields `null` when there is none. */
 function defaultsFromInner(_schema: ZodTypeAny, def: Def): unknown {
  const wrapped = def.innerType as ZodTypeAny | undefined;
  return wrapped === undefined ? null : schemaDefaultsInner(wrapped);
 }
 /** Placeholder for a pipe: the placeholder of its `def.out` schema, or `null` when absent. */
 function defaultsForPipe(_schema: ZodTypeAny, def: Def): unknown {
  const outputSchema = def.out as ZodTypeAny | undefined;
  if (outputSchema !== undefined) {
    return schemaDefaultsInner(outputSchema);
  }
  return null;
 }
 /**
 * Placeholder for an intersection: computes the placeholders of `def.left` and `def.right`
 * (in that order) and combines them with `mergeIntersection`. Yields `null` when either
 * side is missing.
 */
 function defaultsForIntersection(_schema: ZodTypeAny, def: Def): unknown {
  const lhs = def.left as ZodTypeAny | undefined;
  const rhs = def.right as ZodTypeAny | undefined;
  if (lhs !== undefined && rhs !== undefined) {
    const leftDefaults = schemaDefaultsInner(lhs);
    const rightDefaults = schemaDefaultsInner(rhs);
    return mergeIntersection(leftDefaults, rightDefaults);
  }
  return null;
 }
 /** Placeholder for a tuple: one placeholder per entry of `def.items`, or `[]` when absent. */
 function defaultsForTuple(_schema: ZodTypeAny, def: Def): unknown {
  const members = def.items as readonly ZodTypeAny[] | undefined;
  return members === undefined ? [] : members.map((member) => schemaDefaultsInner(member));
 }
 /**
 * Placeholder for a lazy schema. Uses `schema._zod.innerType` when it is present; otherwise
 * calls `def.getter` (if any) to obtain the target schema. Yields `null` when neither
 * produces a schema.
 */
 function defaultsForLazy(schema: ZodTypeAny, def: Def): unknown {
  const fromInternals = (schema as { _zod?: { innerType?: ZodTypeAny } })._zod?.innerType;
  // The getter is only invoked when the internals did not already supply a schema.
  const target = fromInternals ?? (def.getter as (() => ZodTypeAny) | undefined)?.();
  return target === undefined ? null : schemaDefaultsInner(target);
 }
 /**
 * Placeholder for a promise schema: a promise resolved with the placeholder of
 * `def.innerType`, or resolved with `null` when there is no inner schema.
 */
 function defaultsForPromise(_schema: ZodTypeAny, def: Def): unknown {
  const wrapped = def.innerType as ZodTypeAny | undefined;
  const settled = wrapped === undefined ? null : schemaDefaultsInner(wrapped);
  return Promise.resolve(settled);
 }
 /**
 * Placeholder for an enum: the first value of `def.entries` in `Object.values` order.
 * Yields `null` when `entries` is missing or has no values.
 */
 function firstEnumValue(_schema: ZodTypeAny, def: Def): unknown {
  const entries = def.entries as Record<string, string | number> | undefined;
  if (entries === undefined) {
    return null;
  }
  const [head] = Object.values(entries);
  return head ?? null;
 }
 /** Placeholder for a literal: the first entry of `def.values`, or `null` when missing or empty. */
 function firstLiteralValue(_schema: ZodTypeAny, def: Def): unknown {
  const literals = def.values as unknown[] | undefined;
  const hasLiteral = literals !== undefined && literals.length !== 0;
  return hasLiteral ? (literals as unknown[])[0] : null;
 }
 /**
 * Lookup table from a schema def's `type` tag to the handler that builds its placeholder.
 * Entries are grouped by the kind of placeholder they produce; handlers are selected by key.
 */
 const TYPE_HANDLERS: Record<string, TypeHandler> = {
  // Fixed scalar placeholders.
  string: () => "",
  template_literal: () => "",
  number: () => 0,
  nan: () => Number.NaN,
  bigint: () => 0n,
  boolean: () => false,
  success: () => false,
  date: () => new Date(0),
  symbol: () => Symbol(),
  file: () => new File([], ""),
  // Placeholder is `undefined`.
  undefined: () => undefined,
  void: () => undefined,
  never: () => undefined,
  optional: () => undefined,
  // Placeholder is `null`.
  null: () => null,
  any: () => null,
  unknown: () => null,
  transform: () => null,
  function: () => null,
  custom: () => null,
  nullable: defaultsFromNullable,
  // Empty containers.
  array: () => [],
  record: () => ({}),
  map: () => new Map(),
  set: () => new Set(),
  // Structured types that recurse into their members.
  object: defaultsForObject,
  tuple: defaultsForTuple,
  union: firstUnionOption,
  xor: firstUnionOption,
  intersection: defaultsForIntersection,
  // First declared value.
  enum: firstEnumValue,
  literal: firstLiteralValue,
  // Declared default value (called first when it is a function).
  default: (_schema, def) => resolveDefaultValue(def.defaultValue as unknown | (() => unknown)),
  prefault: (_schema, def) => resolveDefaultValue(def.defaultValue as unknown | (() => unknown)),
  // Wrappers that defer to the schema they wrap.
  nonoptional: defaultsFromInner,
  catch: defaultsFromInner,
  readonly: defaultsFromInner,
  pipe: defaultsForPipe,
  lazy: defaultsForLazy,
  promise: defaultsForPromise,
 };
 /**
 * Builds a structurally valid placeholder value for a Zod schema, mirroring its
 * primitive/array/object shape. Intended for `llmExtract` dry runs, so that downstream code
 * does not throw on `undefined` fields.
 *
 * @param schema - The schema to derive a placeholder for.
 * @returns The placeholder produced by the handler for the schema's def type.
 */
 export function schemaDefaults(schema: z.ZodType): unknown {
  const root: ZodTypeAny = schema;
  return schemaDefaultsInner(root);
 }
 /**
 * Dispatches on `schema.def.type`: runs the handler registered in `TYPE_HANDLERS` for that
 * type and returns its placeholder value.
 *
 * @param schema - The schema to derive a placeholder for.
 * @returns The handler's result, or `null` when no handler is registered for the type.
 */
 function schemaDefaultsInner(schema: ZodTypeAny): unknown {
  const def = schema.def as Def;
  // Own-property check: a bare bracket lookup also resolves inherited Object.prototype
  // members (e.g. "constructor", "toString"), which would then be invoked as if they were
  // handlers instead of falling through to the `null` fallback.
  const run = Object.prototype.hasOwnProperty.call(TYPE_HANDLERS, def.type)
    ? TYPE_HANDLERS[def.type]
    : undefined;
  if (run === undefined) {
    return null;
  }
  return run(schema, def);
 }
@@ -0,0 +1,15 @@
 import type * as z from "zod/v4";
 /**
 * Settings identifying an LLM provider: a base URL, an API key, and a model name.
 * NOTE(review): presumably `baseUrl` is the root of an OpenAI-compatible API — confirm
 * against the code that builds the request.
 */
 export type LlmProvider = {
  baseUrl: string;
  apiKey: string;
  model: string;
 };
 /** A single chat message: the speaker's role plus its text content. */
 export type LlmMessage = { role: "system" | "user" | "assistant"; content: string };
 /** Pairs an OpenAI-compatible provider with the Zod meta schema used for structured extraction. */
 export type MetaExtractConfig<T> = {
  provider: LlmProvider;
  schema: z.ZodType<T>;
 };
@@ -0,0 +1,10 @@
 {
  "extends": "../../tsconfig.json",
  "compilerOptions": {
    "rootDir": "src",
    "outDir": "dist",
    "composite": true
  },
  "include": ["src/**/*.ts"],
  "references": [{ "path": "../workflow" }]
 }
@@ -15,5 +15,9 @@
    "composite": true,
    "outDir": "dist"
  },
-  "references": [{ "path": "packages/workflow" }, { "path": "packages/cli-workflow" }]
+  "references": [
    { "path": "packages/workflow" },
    { "path": "packages/workflow-role-llm" },
    { "path": "packages/cli-workflow" }
  ]
 }