// === src/agents/chunker.ts ===
import { estimateTokens } from "../utils/llm.js";

const MAX_CHUNK_TOKENS = 80_000; // Leave room for system prompt + output
const OVERLAP_CHARS = 500; // Overlap between chunks to preserve context at boundaries

// One slice of a large input, plus its position in the chunk sequence.
export interface Chunk {
  index: number; // 0-based position of this chunk
  total: number; // total number of chunks produced
  text: string;
  tokenEstimate: number;
}

/**
 * Split text into chunks that fit within LLM context limits.
 * Splits on paragraph boundaries when possible, with overlap.
 */
export function chunkInput(text: string): Chunk[] {
  const totalTokens = estimateTokens(text);
  // Fast path: input already fits in a single chunk.
  if (totalTokens <= MAX_CHUNK_TOKENS) {
    return [{ index: 0, total: 1, text, tokenEstimate: totalTokens }];
  }

  // NOTE(review): assumes estimateTokens uses ~4 chars/token — confirm against utils/llm.
  const maxCharsPerChunk = MAX_CHUNK_TOKENS * 4; // reverse of token estimate
  const chunks: Chunk[] = [];
  let offset = 0;

  while (offset < text.length) {
    let end = Math.min(offset + maxCharsPerChunk, text.length);

    // Try to split on a paragraph boundary (search only the last 2000 chars
    // of the tentative chunk so we never shrink it by much).
    if (end < text.length) {
      const searchRegion = text.slice(Math.max(end - 2000, offset), end);
      const lastParagraph = searchRegion.lastIndexOf("\n\n");
      // `> 0` (not >= 0): a boundary at position 0 would yield no progress.
      if (lastParagraph > 0) {
        end = Math.max(end - 2000, offset) + lastParagraph + 2;
      } else {
        // Fall back to line boundary
        const lastLine = searchRegion.lastIndexOf("\n");
        if (lastLine > 0) {
          end = Math.max(end - 2000, offset) + lastLine + 1;
        }
      }
    }

    const chunkText = text.slice(offset, end);
    chunks.push({
      index: chunks.length,
      total: 0, // filled in below
      text: chunkText,
      tokenEstimate: estimateTokens(chunkText),
    });

    // Advance with overlap (no overlap after the final chunk).
    offset = end - (end < text.length ?
OVERLAP_CHARS : 0);
  }

  // Set total count
  for (const chunk of chunks) {
    chunk.total = chunks.length;
  }
  return chunks;
}

// === src/agents/extraction.ts ===
import { callAgentJSON, checkInputSize } from "../utils/llm.js";
import type { PipelineInput } from "../pipeline/index.js";
import { chunkInput } from "./chunker.js";
import { getPromptForSourceType } from "./prompts.js";
import { validateExtraction } from "../schema/extraction.js";

/** Raw, pre-structuring world-model extraction as returned by the LLM. */
export interface RawExtraction {
  entities: Array<{
    name: string;
    type: string;
    description: string;
    // FIX: bare `Record` (no type arguments) does not compile — restored them.
    properties?: Record<string, unknown>;
    tags?: string[];
  }>;
  relations: Array<{
    source: string;
    target: string;
    type: string;
    label: string;
    bidirectional?: boolean;
  }>;
  processes: Array<{
    name: string;
    description: string;
    trigger?: string;
    steps: Array<{
      order: number;
      action: string;
      actor?: string;
      inputs?: string[];
      outputs?: string[];
    }>;
    participants: string[];
    outcomes: string[];
  }>;
  constraints: Array<{
    name: string;
    type: string;
    description: string;
    scope: string[];
    severity: "hard" | "soft";
  }>;
  model_name: string;
  model_description: string;
  source_summary: string;
  confidence: number;
  extraction_notes: string[];
}

const SYSTEM_PROMPT = `You are a world-model extraction agent. Your job is to analyze ANY input — text, code, conversation, documentation, descriptions — and extract a complete structured world model from it. You must extract: 1. **Entities** — every distinct thing, actor, system, concept, resource, location, event, or group mentioned or implied. For each: - name: clear identifier - type: one of [actor, object, system, concept, location, event, group, resource] - description: what it is and why it matters in context - properties: any measurable/specific attributes - tags: categorization labels 2. **Relations** — every connection between entities. 
For each: - source: name of source entity (must match an entity name exactly) - target: name of target entity (must match an entity name exactly) - type: one of [has, is_a, part_of, depends_on, produces, consumes, controls, communicates_with, located_in, triggers, inherits, contains, uses, flows_to, opposes, enables, transforms] - label: human-readable description - bidirectional: true if the relation goes both ways 3. **Processes** — every dynamic sequence, workflow, or series of events. For each: - name, description, trigger - steps: ordered list with action, actor (entity name), inputs (entity names), outputs (entity names) - participants: all entity names involved - outcomes: what the process produces or changes 4. **Constraints** — every rule, invariant, limitation, boundary, or requirement. For each: - name, description - type: one of [invariant, rule, boundary, dependency, capacity, temporal, authorization] - scope: entity names this applies to - severity: hard (violation = error) or soft (violation = warning) 5. **Metadata**: - model_name: a concise name for the world being modeled - model_description: what domain/system this represents - source_summary: brief description of the input - confidence: 0-1 overall extraction confidence - extraction_notes: ambiguities, gaps, assumptions you made RULES: - Extract EVERYTHING — be thorough, not selective - Infer implicit entities and relations (e.g., if "users log in", there's a User actor, an Authentication system, and a Login process) - Entity names in relations/processes MUST exactly match entity names - Output ONLY valid JSON matching the schema — no commentary outside the JSON - If the input is code, model the architecture (modules, data flows, APIs, etc.) 
- If the input is a conversation, model the topics, participants, decisions, and action items - If the input is vague, extract what you can and note gaps in extraction_notes`;

// NOTE(review): CHUNK_SYSTEM_PROMPT is never used — extractionAgent rebuilds an
// equivalent suffix inline (chunkSuffix). Kept for now; consider deleting or
// reusing it there so the two copies cannot drift.
const CHUNK_SYSTEM_PROMPT = `${SYSTEM_PROMPT} IMPORTANT: You are processing chunk {chunkIndex} of {chunkTotal} from a larger input. - Extract everything from THIS chunk - Use consistent entity names (the chunks will be merged later) - Note in extraction_notes that this is a partial extraction from chunk {chunkIndex}/{chunkTotal}`;

/**
 * Merge per-chunk extractions into one RawExtraction.
 * Entities dedup by lowercased name (longer description wins, properties and
 * tags are unioned); relations by (source, type, target); processes and
 * constraints by lowercased name. Confidence is the mean of non-zero values.
 */
function mergeRawExtractions(extractions: RawExtraction[]): RawExtraction {
  const merged: RawExtraction = {
    entities: [],
    relations: [],
    processes: [],
    constraints: [],
    model_name: extractions[0]?.model_name ?? "Untitled",
    model_description: extractions[0]?.model_description ?? "",
    source_summary: extractions
      .map((e) => e.source_summary)
      .filter(Boolean)
      .join("; "),
    confidence: 0,
    extraction_notes: [],
  };

  // Deduplicate entities by normalized name
  // FIX: restored the stripped Map type arguments (bare `new Map()` loses typing).
  const entityMap = new Map<string, RawExtraction["entities"][number]>();
  for (const ext of extractions) {
    for (const e of ext.entities) {
      const key = e.name.toLowerCase().trim();
      if (!entityMap.has(key)) {
        entityMap.set(key, e);
      } else {
        const existing = entityMap.get(key)!;
        // Keep longer description, merge props/tags
        if (e.description.length > existing.description.length) {
          existing.description = e.description;
        }
        if (e.properties) {
          existing.properties = { ...existing.properties, ...e.properties };
        }
        if (e.tags) {
          existing.tags = [...new Set([...(existing.tags ?? []), ...e.tags])];
        }
      }
    }
  }
  merged.entities = [...entityMap.values()];

  // Deduplicate relations by (source, target, type)
  // FIX: restored the stripped Set type arguments (here and below).
  const relSet = new Set<string>();
  for (const ext of extractions) {
    for (const r of ext.relations) {
      const key = `${r.source.toLowerCase()}::${r.type}::${r.target.toLowerCase()}`;
      if (!relSet.has(key)) {
        relSet.add(key);
        merged.relations.push(r);
      }
    }
  }

  // Deduplicate processes by name
  const procSet = new Set<string>();
  for (const ext of extractions) {
    for (const p of ext.processes) {
      const key = p.name.toLowerCase().trim();
      if (!procSet.has(key)) {
        procSet.add(key);
        merged.processes.push(p);
      }
    }
  }

  // Deduplicate constraints by name
  const cstrSet = new Set<string>();
  for (const ext of extractions) {
    for (const c of ext.constraints) {
      const key = c.name.toLowerCase().trim();
      if (!cstrSet.has(key)) {
        cstrSet.add(key);
        merged.constraints.push(c);
      }
    }
  }

  // Average confidence (zeros excluded; default 0.5 when nothing reported)
  const confidences = extractions.map((e) => e.confidence).filter((c) => c > 0);
  merged.confidence = confidences.length
    ? confidences.reduce((a, b) => a + b, 0) / confidences.length
    : 0.5;

  // Collect all notes
  merged.extraction_notes = extractions.flatMap(
    (e) => e.extraction_notes ??
[],
  );
  if (extractions.length > 1) {
    merged.extraction_notes.push(
      `Merged from ${extractions.length} chunks (${merged.entities.length} unique entities after dedup)`,
    );
  }
  return merged;
}

/**
 * Validate an unknown LLM JSON payload and coerce it to RawExtraction.
 * Validation issues are logged to stderr but do not abort the pipeline.
 */
function validateAndCoerce(raw: unknown): RawExtraction {
  const { extraction, issues } = validateExtraction(raw);
  if (issues.length > 0) {
    process.stderr.write(` [validation] ${issues.join("; ")}\n`);
  }
  // Cast validated extraction to RawExtraction (shapes are compatible)
  return extraction as unknown as RawExtraction;
}

/**
 * Stage 1: run LLM extraction over the raw input.
 * A single chunk gets one direct call; larger inputs are chunked, extracted
 * per chunk, then merged with mergeRawExtractions.
 * @throws Error when the input is empty or whitespace-only.
 */
export async function extractionAgent(
  input: PipelineInput,
): Promise<{ input: PipelineInput; extraction: RawExtraction }> {
  if (!input.raw || !input.raw.trim()) {
    throw new Error("Cannot extract from empty input");
  }
  const sizeCheck = checkInputSize(input.raw);
  if (sizeCheck.warning) {
    process.stderr.write(` [warn] ${sizeCheck.warning}\n`);
  }
  const chunks = chunkInput(input.raw);
  const sourcePrompt = getPromptForSourceType(input.sourceType);

  if (chunks.length === 1) {
    // Single chunk — direct extraction with source-specific prompt
    const userMessage = `Analyze the following ${input.sourceType} input and extract a complete world model.\n\n---\n\n${input.raw}`;
    const rawResult = await callAgentJSON(sourcePrompt, userMessage, {
      maxTokens: 16384,
    });
    return { input, extraction: validateAndCoerce(rawResult) };
  }

  // Multi-chunk — extract per chunk with source-specific prompt, then merge
  const chunkSuffix = `\n\nIMPORTANT: You are processing chunk {chunkIndex} of {chunkTotal} from a larger input.\n- Extract everything from THIS chunk\n- Use consistent entity names (chunks will be merged later)\n- Note in extraction_notes that this is a partial extraction from chunk {chunkIndex}/{chunkTotal}`;
  const extractions: RawExtraction[] = [];
  // NOTE(review): chunks are processed sequentially — presumably for rate
  // limits / ordering; confirm before parallelizing with Promise.all.
  for (const chunk of chunks) {
    const prompt = (sourcePrompt + chunkSuffix)
      .replace(/\{chunkIndex\}/g, String(chunk.index + 1))
      .replace(/\{chunkTotal\}/g, String(chunk.total));
    const userMessage = `Analyze chunk ${chunk.index + 1}/${chunk.total} of a ${input.sourceType} input and extract all world model elements.\n\n---\n\n${chunk.text}`;
    const rawResult = await callAgentJSON(prompt, userMessage, {
      maxTokens: 16384,
    });
    extractions.push(validateAndCoerce(rawResult));
  }
  return { input, extraction: mergeRawExtractions(extractions) };
}

// === src/agents/index.ts ===
export { extractionAgent } from "./extraction.js";
export { structuringAgent } from "./structuring.js";
export { validationAgent } from "./validation.js";
export { refineWorldModel } from "./refinement.js";
export { chunkInput } from "./chunker.js";
export { getPromptForSourceType } from "./prompts.js";
export { secondPassAgent } from "./second-pass.js";

// === src/agents/prompts.ts ===
// Shared JSON-schema tail appended to every source-specific prompt below.
const BASE_SCHEMA = `You must output ONLY valid JSON with this structure: { "entities": [{ "name", "type" (actor|object|system|concept|location|event|group|resource), "description", "properties"?, "tags"? }], "relations": [{ "source" (entity name), "target" (entity name), "type" (has|is_a|part_of|depends_on|produces|consumes|controls|communicates_with|located_in|triggers|inherits|contains|uses|flows_to|opposes|enables|transforms), "label", "bidirectional"? }], "processes": [{ "name", "description", "trigger"?, "steps": [{ "order", "action", "actor"?, "inputs"?, "outputs"? }], "participants" (entity names), "outcomes" }], "constraints": [{ "name", "type" (invariant|rule|boundary|dependency|capacity|temporal|authorization), "description", "scope" (entity names), "severity" (hard|soft) }], "model_name", "model_description", "source_summary", "confidence" (0-1), "extraction_notes": [] } RULES: - Entity names in relations/processes MUST exactly match entity names - Extract EVERYTHING — be thorough, not selective - Infer implicit entities and relations - Output ONLY valid JSON — no commentary outside the JSON`;

// FIX: bare `Record` (no type arguments) does not compile — restored <string, string>.
export const PROMPTS: Record<string, string> = {
  text: `You are a world-model extraction agent. 
Analyze the given text and extract a complete structured world model. Focus on: - Named entities (people, organizations, places, things, concepts) - Relationships between them (ownership, hierarchy, dependency, flow) - Any described processes, workflows, or sequences of events - Rules, constraints, limitations mentioned or implied - Implicit entities that must exist for described behaviors to work ${BASE_SCHEMA}`,
  code: `You are a world-model extraction agent specialized in SOURCE CODE analysis. Analyze the code and extract its architectural world model. Focus on: - Modules, classes, functions, and services as entities - Import/export dependencies as relations - Data flow between components (who produces what, who consumes what) - API endpoints, routes, handlers as processes with steps - Type definitions and interfaces as concept entities - Database models and schemas as resource entities - Configuration and environment variables as constraints - Error handling patterns as boundary constraints - Authentication/authorization as authorization constraints - External service integrations as system entities Infer the ARCHITECTURE, not just list files. Model how data flows through the system. ${BASE_SCHEMA}`,
  conversation: `You are a world-model extraction agent specialized in CONVERSATION analysis. Analyze the conversation and extract a structured world model of its content. Focus on: - Participants as actor entities - Topics discussed as concept entities - Systems/products/tools mentioned as system/object entities - Decisions made as event entities with relations to what they affect - Action items as process entities with steps and assigned actors - Agreements and disagreements as relations (enables/opposes) - Deadlines and commitments as temporal constraints - Open questions as extraction_notes Model the SUBSTANCE of the conversation, not the conversation itself. ${BASE_SCHEMA}`,
  document: `You are a world-model extraction agent specialized in DOCUMENT analysis. 
Analyze the document and extract a complete structured world model. Focus on: - All named entities (organizations, roles, systems, concepts, regulations) - Hierarchical relationships (org charts, system architectures, taxonomies) - Described workflows and procedures as processes - Requirements, policies, and rules as constraints - Defined terms as concept entities - Dependencies between components or teams - Temporal sequences (phases, milestones, deadlines) Treat the document as a specification of a world — extract that world completely. ${BASE_SCHEMA}`,
  url: `You are a world-model extraction agent. The input is content fetched from a URL. Analyze it and extract a complete structured world model. Focus on: - The domain/topic the page covers - All entities, services, products, or concepts described - Relationships between them - Any processes, workflows, or user journeys described - Pricing, limitations, or constraints mentioned - Technical specifications as properties on entities ${BASE_SCHEMA}`,
  mixed: `You are a world-model extraction agent. The input contains MIXED content types (possibly text, code, data, and structured content together). Focus on: - Identify what each section represents (narrative, code, data, config) - Extract entities from ALL sections — they may reference each other - Cross-reference: code entities may implement concepts described in text - Data sections may define entity properties or constraints - Use consistent entity names across all sections ${BASE_SCHEMA}`,
};

/** Return the prompt for a source type, falling back to the text prompt. */
export function getPromptForSourceType(sourceType: string): string {
  return PROMPTS[sourceType] ??
PROMPTS.text;
}

// === src/agents/query.ts ===
import { callAgent } from "../utils/llm.js";
import {
  findEntity,
  findDependents,
  pathsBetween,
  getStats,
} from "../utils/graph.js";
import type { WorldModelType } from "../schema/index.js";

/** Result of a query against a world model. */
export interface QueryResult {
  answer: string;
  method: "graph" | "inference";
  entities_referenced: string[];
  confidence: number;
}

// ─── Deterministic graph queries ──────────────────────────────

// Each pattern is tried in order; a handler returning null (e.g. entity not
// found) lets the caller fall through to LLM inference.
const GRAPH_PATTERNS: Array<{
  pattern: RegExp;
  handler: (
    model: WorldModelType,
    match: RegExpMatchArray,
  ) => QueryResult | null;
}> = [
  {
    // "what depends on X" / "what uses X" / "what needs X"
    pattern:
      /what\s+(?:depends\s+on|uses|needs|requires|consumes)\s+(?:the\s+)?(.+?)(?:\?|$)/i,
    handler: (model, match) => {
      const entity = findEntity(model, match[1].trim());
      if (!entity) return null;
      const deps = findDependents(model, entity.id);
      if (deps.incoming.length === 0) {
        return {
          answer: `Nothing in the model depends on ${entity.name}.`,
          method: "graph",
          entities_referenced: [entity.name],
          confidence: 1,
        };
      }
      const lines = deps.incoming.map(
        (d) =>
          `- ${d.entity.name} —[${d.relation.type}]→ ${entity.name}: ${d.relation.label}`,
      );
      return {
        answer: `${deps.incoming.length} entities depend on ${entity.name}:\n${lines.join("\n")}`,
        method: "graph",
        entities_referenced: [
          entity.name,
          ...deps.incoming.map((d) => d.entity.name),
        ],
        confidence: 1,
      };
    },
  },
  {
    // "what does X depend on" / "what does X use" / "what does X need"
    pattern:
      /what\s+does\s+(.+?)\s+(?:depend\s+on|use|need|require|consume)(?:\?|$)/i,
    handler: (model, match) => {
      const entity = findEntity(model, match[1].trim());
      if (!entity) return null;
      const deps = findDependents(model, entity.id);
      if (deps.outgoing.length === 0) {
        return {
          answer: `${entity.name} does not depend on anything in the model.`,
          method: "graph",
          entities_referenced: [entity.name],
          confidence: 1,
        };
      }
      const lines = deps.outgoing.map(
        (d) =>
          `- ${entity.name} —[${d.relation.type}]→ ${d.entity.name}: ${d.relation.label}`,
      );
      return {
        answer: `${entity.name} depends on ${deps.outgoing.length} entities:\n${lines.join("\n")}`,
        method: "graph",
        entities_referenced: [
          entity.name,
          ...deps.outgoing.map((d) => d.entity.name),
        ],
        confidence: 1,
      };
    },
  },
  {
    // "how is X connected to Y" / "path from X to Y" / "how does X relate to Y"
    pattern:
      /(?:how\s+(?:is|does)\s+(.+?)\s+(?:connected|related?)\s+to\s+(.+?)|path\s+from\s+(.+?)\s+to\s+(.+?))(?:\?|$)/i,
    handler: (model, match) => {
      // Groups 1/2 come from the "connected/related" form, 3/4 from "path from".
      const srcName = (match[1] || match[3])?.trim();
      const tgtName = (match[2] || match[4])?.trim();
      if (!srcName || !tgtName) return null;
      const src = findEntity(model, srcName);
      const tgt = findEntity(model, tgtName);
      if (!src || !tgt) return null;
      const paths = pathsBetween(model, src.id, tgt.id);
      if (paths.length === 0) {
        return {
          answer: `No path found from ${src.name} to ${tgt.name} in the model.`,
          method: "graph",
          entities_referenced: [src.name, tgt.name],
          confidence: 1,
        };
      }
      const pathDescs = paths.map((path, i) => {
        const hops = path
          .map((step, j) => {
            if (j === 0) return step.entity.name;
            return `—[${step.relation?.type ?? "?"}]→ ${step.entity.name}`;
          })
          .join(" ");
        return ` Path ${i + 1}: ${hops}`;
      });
      return {
        answer: `${paths.length} path(s) from ${src.name} to ${tgt.name}:\n${pathDescs.join("\n")}`,
        method: "graph",
        entities_referenced: [src.name, tgt.name],
        confidence: 1,
      };
    },
  },
  {
    // "what constraints apply to X" / "rules for X"
    pattern:
      /(?:what\s+constraints?\s+(?:apply|applies)\s+to|rules?\s+for)\s+(?:the\s+)?(.+?)(?:\?|$)/i,
    handler: (model, match) => {
      const entity = findEntity(model, match[1].trim());
      if (!entity) return null;
      const applicable = model.constraints.filter((c) =>
        c.scope.includes(entity.id),
      );
      if (applicable.length === 0) {
        return {
          answer: `No constraints apply to ${entity.name}.`,
          method: "graph",
          entities_referenced: [entity.name],
          confidence: 1,
        };
      }
      const lines = applicable.map(
        (c) => `- [${c.severity}] ${c.name}: ${c.description}`,
      );
      return {
        answer: `${applicable.length} constraint(s) apply to ${entity.name}:\n${lines.join("\n")}`,
        method: "graph",
        entities_referenced: [entity.name],
        confidence: 1,
      };
    },
  },
  {
    // "how many entities" / "stats" / "summary"
    pattern: /(?:how\s+many|stats|statistics|summary|overview)\b/i,
    handler: (model) => {
      const stats = getStats(model);
      const lines = [
        `Entities: ${stats.entities.total} (${Object.entries(
          stats.entities.byType,
        )
          .map(([t, c]) => `${c} ${t}`)
          .join(", ")})`,
        `Relations: ${stats.relations.total}`,
        `Processes: ${stats.processes.total} (${stats.processes.totalSteps} steps)`,
        `Constraints: ${stats.constraints.total} (${stats.constraints.hard} hard, ${stats.constraints.soft} soft)`,
        `Confidence: ${stats.confidence}`,
        "",
        "Most connected:",
        ...stats.mostConnected.map(
          (mc) => ` - ${mc.entity}: ${mc.connections} connections`,
        ),
      ];
      return {
        answer: lines.join("\n"),
        method: "graph",
        entities_referenced: stats.mostConnected.map((mc) => mc.entity),
        confidence: 1,
      };
    },
  },
  {
    // "what is X" / "describe X" / "tell me about X"
    pattern:
      /(?:what\s+is|describe|tell\s+me\s+about|who\s+is)\s+(?:the\s+)?(.+?)(?:\?|$)/i,
    handler: (model, match) => {
      const entity = findEntity(model, match[1].trim());
      if (!entity) return null;
      const deps = findDependents(model, entity.id);
      const constraints = model.constraints.filter((c) =>
        c.scope.includes(entity.id),
      );
      const processes = model.processes.filter((p) =>
        p.participants.includes(entity.id),
      );
      const lines = [
        `**${entity.name}** (${entity.type})`,
        entity.description,
        "",
      ];
      if (entity.properties && Object.keys(entity.properties).length > 0) {
        lines.push(`Properties: ${JSON.stringify(entity.properties)}`);
      }
      if (deps.incoming.length > 0) {
        lines.push(
          `Depended on by: ${deps.incoming.map((d) => d.entity.name).join(", ")}`,
        );
      }
      if (deps.outgoing.length > 0) {
        lines.push(
          `Depends on: ${deps.outgoing.map((d) => d.entity.name).join(", ")}`,
        );
      }
      if (processes.length > 0) {
        lines.push(
          `Participates in: ${processes.map((p) => p.name).join(", ")}`,
        );
      }
      if (constraints.length > 0) {
        lines.push(
          `Constraints: ${constraints.map((c) => `[${c.severity}] ${c.name}`).join(", ")}`,
        );
      }
      return {
        answer: lines.join("\n"),
        method: "graph",
        entities_referenced: [
          entity.name,
          ...deps.incoming.map((d) => d.entity.name),
          ...deps.outgoing.map((d) => d.entity.name),
        ],
        confidence: 1,
      };
    },
  },
];

// ─── LLM inference query ──────────────────────────────────────

/** Render the whole model as plain-text context for the LLM. */
function modelToContext(model: WorldModelType): string {
  const entities = model.entities
    .map((e) => `- ${e.name} (${e.type}): ${e.description}`)
    .join("\n");
  const relations = model.relations
    .map((r) => {
      const src =
        model.entities.find((e) => e.id === r.source)?.name ?? r.source;
      const tgt =
        model.entities.find((e) => e.id === r.target)?.name ?? r.target;
      return `- ${src} —[${r.type}]→ ${tgt}: ${r.label}`;
    })
    .join("\n");
  const processes = model.processes
    .map((p) => {
      const steps = p.steps
        .map((s) => {
          const actor = s.actor
            ? (model.entities.find((e) => e.id === s.actor)?.name ?? "?")
            : "?";
          return ` ${s.order}. ${actor}: ${s.action}`;
        })
        .join("\n");
      return `- ${p.name} (trigger: ${p.trigger ?? "n/a"}): ${p.description}\n${steps}\n Outcomes: ${p.outcomes.join(", ")}`;
    })
    .join("\n");
  const constraints = model.constraints
    .map((c) => {
      const scopeNames = c.scope
        .map((id) => model.entities.find((e) => e.id === id)?.name ?? id)
        .join(", ");
      return `- [${c.severity}] ${c.name} (applies to: ${scopeNames}): ${c.description}`;
    })
    .join("\n");
  return `# World Model: ${model.name}\n${model.description}\n\n## Entities (${model.entities.length})\n${entities}\n\n## Relations (${model.relations.length})\n${relations}\n\n## Processes (${model.processes.length})\n${processes}\n\n## Constraints (${model.constraints.length})\n${constraints}`;
}

const QUERY_SYSTEM_PROMPT = `You are a world-model query agent. You answer questions based STRICTLY on the world model provided. RULES: - Only use information present in the model — do not hallucinate or infer beyond what the model states - If the model doesn't contain enough information to answer, say so explicitly - Reference specific entities, relations, processes, and constraints by name - Be concise and direct - If the question asks about something not in the model, say "The model does not contain information about [X]"`;

/**
 * Answer a question via LLM inference over the serialized model.
 * FIX: bare `Promise` return type (no type argument) does not compile —
 * restored Promise<QueryResult> here and on queryWorldModel below.
 */
async function inferenceQuery(
  model: WorldModelType,
  question: string,
): Promise<QueryResult> {
  const context = modelToContext(model);
  const userMessage = `${context}\n\n---\n\nQuestion: ${question}`;
  const answer = await callAgent(QUERY_SYSTEM_PROMPT, userMessage, {
    maxTokens: 4096,
  });
  // Extract entity names that appear in the answer
  const referenced = model.entities
    .filter((e) => answer.toLowerCase().includes(e.name.toLowerCase()))
    .map((e) => e.name);
  return {
    answer,
    method: "inference",
    entities_referenced: referenced,
    confidence: 0.8,
  };
}

// ─── Public API ───────────────────────────────────────────────

/** Answer a question: deterministic graph patterns first, LLM fallback. */
export async function queryWorldModel(
  model: WorldModelType,
  question: string,
): Promise<QueryResult> {
  if (!question ||
!question.trim()) {
    return {
      answer: "No question provided.",
      method: "graph",
      entities_referenced: [],
      confidence: 1,
    };
  }
  // Try deterministic graph queries first
  for (const { pattern, handler } of GRAPH_PATTERNS) {
    const match = question.match(pattern);
    if (match) {
      const result = handler(model, match);
      if (result) return result;
      // Pattern matched but handler returned null (entity not found) — fall through to inference
    }
  }
  // Fall back to LLM inference
  return inferenceQuery(model, question);
}

// === src/agents/refinement.ts ===
import { callAgentJSON } from "../utils/llm.js";
import type { WorldModelType } from "../schema/index.js";
import type { PipelineInput } from "../pipeline/index.js";
import type { RawExtraction } from "./extraction.js";
import { structuringAgent } from "./structuring.js";
import { validationAgent } from "./validation.js";
import { mergeWorldModels } from "../utils/merge.js";

// System prompt for delta extraction; {existingModelSummary} is substituted
// with summarizeModel() output before use.
const REFINEMENT_PROMPT = `You are a world-model refinement agent. You are given an EXISTING world model and NEW input. Your job is to extract ONLY what the new input adds, changes, or contradicts relative to the existing model. ## Existing World Model Summary: {existingModelSummary} ## Instructions: 1. Extract new entities NOT already in the existing model 2. Extract new relations between entities (new or existing) 3. Extract new processes or refinements to existing processes 4. Extract new constraints or modifications to existing ones 5. 
If the new input CONTRADICTS something in the existing model, extract the new version and note the contradiction in extraction_notes RULES: - DO NOT re-extract entities/relations that already exist unchanged - DO reference existing entity names exactly when creating new relations to them - Mark confidence based on how clearly the new input supports each extraction - Note in extraction_notes what was added vs what was modified - Output ONLY valid JSON matching the extraction schema`;

// Compact text rendering of a model (descriptions truncated) for the
// refinement prompt.
function summarizeModel(model: WorldModelType): string {
  const entityList = model.entities
    .map((e) => ` - ${e.name} (${e.type}): ${e.description.slice(0, 100)}`)
    .join("\n");
  const relationList = model.relations
    .map((r) => {
      const src =
        model.entities.find((e) => e.id === r.source)?.name ?? r.source;
      const tgt =
        model.entities.find((e) => e.id === r.target)?.name ?? r.target;
      return ` - ${src} —[${r.type}]→ ${tgt}`;
    })
    .join("\n");
  const processList = model.processes
    .map((p) => ` - ${p.name}: ${p.description.slice(0, 80)}`)
    .join("\n");
  const constraintList = model.constraints
    .map((c) => ` - [${c.severity}] ${c.name}: ${c.description.slice(0, 80)}`)
    .join("\n");
  return `Entities (${model.entities.length}):\n${entityList}\n\nRelations (${model.relations.length}):\n${relationList}\n\nProcesses (${model.processes.length}):\n${processList}\n\nConstraints (${model.constraints.length}):\n${constraintList}`;
}

// Incrementally refine an existing model with new input:
// extract delta → structure → merge → validate. Optional stage callbacks
// report timings per stage.
export async function refineWorldModel(
  existingModel: WorldModelType,
  newInput: PipelineInput,
  options?: {
    onStageStart?: (name: string) => void;
    onStageEnd?: (name: string, ms: number) => void;
  },
): Promise<{ worldModel: WorldModelType; delta: WorldModelType }> {
  const summary = summarizeModel(existingModel);
  const systemPrompt = REFINEMENT_PROMPT.replace(
    "{existingModelSummary}",
    summary,
  );
  // Extract delta
  options?.onStageStart?.("refinement-extraction");
  const start = Date.now();
  const userMessage = `Given the existing world model above, analyze this NEW 
${newInput.sourceType} input and extract only what's new or changed.\n\n---\n\n${newInput.raw}`; const deltaExtraction = await callAgentJSON( systemPrompt, userMessage, { maxTokens: 16384, }, ); options?.onStageEnd?.("refinement-extraction", Date.now() - start); // Structure the delta into a world model options?.onStageStart?.("refinement-structuring"); const structStart = Date.now(); const { worldModel: deltaModel } = await structuringAgent({ input: newInput, extraction: deltaExtraction, }); options?.onStageEnd?.("refinement-structuring", Date.now() - structStart); // Merge existing + delta options?.onStageStart?.("refinement-merge"); const mergeStart = Date.now(); const merged = mergeWorldModels(existingModel, deltaModel, { name: existingModel.name, description: existingModel.description, }); options?.onStageEnd?.("refinement-merge", Date.now() - mergeStart); // Validate the merged result options?.onStageStart?.("refinement-validation"); const valStart = Date.now(); const { worldModel: validatedModel } = await validationAgent({ input: newInput, worldModel: merged, }); options?.onStageEnd?.("refinement-validation", Date.now() - valStart); return { worldModel: validatedModel, delta: deltaModel }; } // === src/agents/second-pass.ts === import { callAgentJSON } from "../utils/llm.js"; import type { WorldModelType } from "../schema/index.js"; import type { PipelineInput } from "../pipeline/index.js"; import type { RawExtraction } from "./extraction.js"; import { validateExtraction } from "../schema/extraction.js"; const SECOND_PASS_PROMPT = `You are a world-model COMPLETENESS agent. You are given: 1. The original raw input 2. A world model that was already extracted from it Your job is to find everything the FIRST PASS MISSED. The first pass captures what's explicitly stated. You capture what's IMPLICIT. 
Look for: **Missing entities:** - Entities that must EXIST for the described processes to work, but were never named - Infrastructure entities (authentication, logging, error handling, networking) - Role entities implied by actions ("someone approves" → there's an Approver actor) - Data entities implied by processes ("saves to database" → there's a Record object) **Missing relations:** - Dependencies that are logically necessary but not stated - Hierarchical relations implied by context (if X contains Y, Y is part_of X) - Communication paths implied by processes (if A triggers B, A communicates_with B) **Missing processes:** - Error/failure paths (what happens when the main process fails?) - Setup/teardown processes (what must happen before/after the described flow?) - Maintenance processes (backups, migrations, updates) **Missing constraints:** - Physical/logical impossibilities not stated (can't be in two places, can't exceed capacity) - Temporal constraints implied by ordering (step 2 can't happen before step 1) - Authorization constraints implied by roles (only admins can X) - Data integrity constraints (required fields, unique identifiers, referential integrity) RULES: - ONLY extract what's NEW — do not re-extract entities/relations already in the model - Reference existing entity names exactly when creating relations to them - Every extraction must be JUSTIFIED by the input — no hallucination - Set confidence lower (0.3-0.7) since these are inferences, not direct extractions - In extraction_notes, explain WHY each new element was inferred - Output ONLY valid JSON matching the extraction schema`; function summarizeModelForPrompt(model: WorldModelType): string { const entities = model.entities .map((e) => `- ${e.name} (${e.type}): ${e.description}`) .join("\n"); const relations = model.relations .map((r) => { const src = model.entities.find((e) => e.id === r.source)?.name ?? r.source; const tgt = model.entities.find((e) => e.id === r.target)?.name ?? 
r.target; return `- ${src} —[${r.type}]→ ${tgt}: ${r.label}`; }) .join("\n"); const processes = model.processes .map((p) => { const steps = p.steps .map((s) => { const actor = s.actor ? (model.entities.find((e) => e.id === s.actor)?.name ?? s.actor) : "unknown"; return ` ${s.order}. ${actor}: ${s.action}`; }) .join("\n"); return `- ${p.name}: ${p.description}\n${steps}`; }) .join("\n"); const constraints = model.constraints .map((c) => `- [${c.severity}] ${c.name}: ${c.description}`) .join("\n"); return `ENTITIES (${model.entities.length}):\n${entities}\n\nRELATIONS (${model.relations.length}):\n${relations}\n\nPROCESSES (${model.processes.length}):\n${processes}\n\nCONSTRAINTS (${model.constraints.length}):\n${constraints}`; } export async function secondPassAgent( originalInput: PipelineInput, currentModel: WorldModelType, ): Promise { const modelSummary = summarizeModelForPrompt(currentModel); const userMessage = `## Original Input:\n${originalInput.raw}\n\n---\n\n## Already Extracted World Model:\n${modelSummary}\n\n---\n\nWhat did the first pass MISS? 
Extract only NEW entities, relations, processes, and constraints that are implicit in the input but not yet in the model.`; const rawResult = await callAgentJSON( SECOND_PASS_PROMPT, userMessage, { maxTokens: 16384, }, ); const { extraction, issues } = validateExtraction(rawResult); if (issues.length > 0) { process.stderr.write(` [second-pass validation] ${issues.join("; ")}\n`); } return extraction as unknown as RawExtraction; } // === src/agents/structuring.ts === import type { WorldModelType } from "../schema/index.js"; import type { PipelineInput } from "../pipeline/index.js"; import type { RawExtraction } from "./extraction.js"; import { genId } from "../utils/ids.js"; export interface StructuringOutput { input: PipelineInput; worldModel: WorldModelType; } export function structuringAgent(stageInput: { input: PipelineInput; extraction: RawExtraction; }): Promise { const { input, extraction } = stageInput; // Normalize entity types the LLM may return outside the enum const VALID_ENTITY_TYPES = new Set([ "actor", "object", "system", "concept", "location", "event", "group", "resource", ]); const ENTITY_TYPE_ALIASES: Record = { person: "actor", user: "actor", role: "actor", agent: "actor", organization: "group", org: "group", team: "group", company: "group", place: "location", area: "location", region: "location", service: "system", platform: "system", tool: "system", application: "system", app: "system", idea: "concept", principle: "concept", pattern: "concept", category: "concept", item: "object", thing: "object", product: "object", data: "resource", asset: "resource", file: "resource", document: "resource", incident: "event", action: "event", occurrence: "event", }; function normalizeEntityType( raw: string, ): WorldModelType["entities"][number]["type"] { const lower = raw.toLowerCase().trim(); if (VALID_ENTITY_TYPES.has(lower)) return lower as WorldModelType["entities"][number]["type"]; return (ENTITY_TYPE_ALIASES[lower] ?? 
"object") as WorldModelType["entities"][number]["type"]; } // Normalize relation types const VALID_RELATION_TYPES = new Set([ "has", "is_a", "part_of", "depends_on", "produces", "consumes", "controls", "communicates_with", "located_in", "triggers", "inherits", "contains", "uses", "flows_to", "opposes", "enables", "transforms", ]); function normalizeRelationType( raw: string, ): WorldModelType["relations"][number]["type"] { const lower = raw.toLowerCase().trim().replace(/ /g, "_"); if (VALID_RELATION_TYPES.has(lower)) return lower as WorldModelType["relations"][number]["type"]; return "uses" as WorldModelType["relations"][number]["type"]; } // Normalize constraint types const VALID_CONSTRAINT_TYPES = new Set([ "invariant", "rule", "boundary", "dependency", "capacity", "temporal", "authorization", ]); function normalizeConstraintType( raw: string, ): WorldModelType["constraints"][number]["type"] { const lower = raw.toLowerCase().trim().replace(/ /g, "_"); if (VALID_CONSTRAINT_TYPES.has(lower)) return lower as WorldModelType["constraints"][number]["type"]; return "rule" as WorldModelType["constraints"][number]["type"]; } // Build entity name → ID map const entityIdMap = new Map(); const entities = extraction.entities.map((e) => { const id = genId("ent"); entityIdMap.set(e.name, id); return { id, name: e.name, type: normalizeEntityType(e.type), description: e.description, properties: e.properties, tags: e.tags, }; }); const resolveEntityId = (name: string): string => { const existing = entityIdMap.get(name); if (existing) return existing; // Create a placeholder entity for unresolved references const id = genId("ent"); entityIdMap.set(name, id); entities.push({ id, name, type: "object", description: `Auto-created entity for unresolved reference: ${name}`, properties: undefined, tags: ["auto-created"], }); return id; }; const relations = extraction.relations.map((r) => ({ id: genId("rel"), type: normalizeRelationType(r.type), source: resolveEntityId(r.source), target: 
resolveEntityId(r.target), label: r.label, bidirectional: r.bidirectional, })); const processes = extraction.processes.map((p) => ({ id: genId("proc"), name: p.name, description: p.description, trigger: p.trigger, steps: p.steps.map((s, idx) => ({ order: s.order ?? idx + 1, action: s.action, actor: s.actor ? resolveEntityId(s.actor) : undefined, input: s.inputs?.map(resolveEntityId), output: s.outputs?.map(resolveEntityId), })), participants: p.participants.map(resolveEntityId), outcomes: p.outcomes, })); const constraints = extraction.constraints.map((c) => ({ id: genId("cstr"), name: c.name, type: normalizeConstraintType(c.type), description: c.description, scope: c.scope.map(resolveEntityId), severity: c.severity, })); const worldModel: WorldModelType = { id: genId("wm"), name: extraction.model_name || input.name || "Untitled World Model", description: extraction.model_description || "Extracted world model", version: "0.1.0", created_at: new Date().toISOString(), entities, relations, processes, constraints, metadata: { source_type: input.sourceType, source_summary: extraction.source_summary || "No summary", confidence: extraction.confidence ?? 
0.5, extraction_notes: extraction.extraction_notes, }, }; return Promise.resolve({ input, worldModel }); } // === src/agents/validation.ts === import type { WorldModelType, ValidationResultType, ValidationIssueType, } from "../schema/index.js"; import type { PipelineInput } from "../pipeline/index.js"; export interface ValidationOutput { worldModel: WorldModelType; validation: ValidationResultType; } export function validationAgent(stageInput: { input: PipelineInput; worldModel: WorldModelType; }): Promise { const { worldModel } = stageInput; const issues: ValidationIssueType[] = []; const entityIds = new Set(worldModel.entities.map((e) => e.id)); // Check relations reference valid entities for (const rel of worldModel.relations) { if (!entityIds.has(rel.source)) { issues.push({ type: "error", code: "DANGLING_REL_SOURCE", message: `Relation "${rel.id}" references non-existent source entity "${rel.source}"`, path: `relations.${rel.id}.source`, }); } if (!entityIds.has(rel.target)) { issues.push({ type: "error", code: "DANGLING_REL_TARGET", message: `Relation "${rel.id}" references non-existent target entity "${rel.target}"`, path: `relations.${rel.id}.target`, }); } if (rel.source === rel.target) { issues.push({ type: "warning", code: "SELF_RELATION", message: `Relation "${rel.id}" is a self-reference on entity "${rel.source}"`, path: `relations.${rel.id}`, }); } } // Check processes reference valid entities for (const proc of worldModel.processes) { for (const participant of proc.participants) { if (!entityIds.has(participant)) { issues.push({ type: "error", code: "DANGLING_PROC_PARTICIPANT", message: `Process "${proc.name}" references non-existent participant "${participant}"`, path: `processes.${proc.id}.participants`, }); } } for (const step of proc.steps) { if (step.actor && !entityIds.has(step.actor)) { issues.push({ type: "error", code: "DANGLING_STEP_ACTOR", message: `Process "${proc.name}" step ${step.order} references non-existent actor "${step.actor}"`, 
path: `processes.${proc.id}.steps.${step.order}.actor`, }); } } if (proc.steps.length === 0) { issues.push({ type: "warning", code: "EMPTY_PROCESS", message: `Process "${proc.name}" has no steps`, path: `processes.${proc.id}.steps`, }); } } // Check constraints reference valid entities for (const constraint of worldModel.constraints) { for (const scopeId of constraint.scope) { if (!entityIds.has(scopeId)) { issues.push({ type: "error", code: "DANGLING_CONSTRAINT_SCOPE", message: `Constraint "${constraint.name}" references non-existent entity "${scopeId}"`, path: `constraints.${constraint.id}.scope`, }); } } } // Check for orphan entities (no relations, not in any process) const referencedEntities = new Set(); for (const rel of worldModel.relations) { referencedEntities.add(rel.source); referencedEntities.add(rel.target); } for (const proc of worldModel.processes) { for (const p of proc.participants) referencedEntities.add(p); } for (const constraint of worldModel.constraints) { for (const s of constraint.scope) referencedEntities.add(s); } for (const entity of worldModel.entities) { if (!referencedEntities.has(entity.id)) { issues.push({ type: "warning", code: "ORPHAN_ENTITY", message: `Entity "${entity.name}" (${entity.id}) is not referenced by any relation, process, or constraint`, path: `entities.${entity.id}`, }); } } // Check for duplicate entity names const nameCount = new Map(); for (const entity of worldModel.entities) { nameCount.set(entity.name, (nameCount.get(entity.name) ?? 
0) + 1); } for (const [name, count] of nameCount) { if (count > 1) { issues.push({ type: "warning", code: "DUPLICATE_ENTITY_NAME", message: `Entity name "${name}" appears ${count} times — may indicate extraction duplication`, path: `entities`, }); } } // Completeness checks if (worldModel.entities.length === 0) { issues.push({ type: "error", code: "NO_ENTITIES", message: "World model has no entities", }); } if (worldModel.relations.length === 0) { issues.push({ type: "warning", code: "NO_RELATIONS", message: "World model has no relations — entities are unconnected", }); } const hasErrors = issues.some((i) => i.type === "error"); const validation: ValidationResultType = { valid: !hasErrors, issues, stats: { entities: worldModel.entities.length, relations: worldModel.relations.length, processes: worldModel.processes.length, constraints: worldModel.constraints.length, }, }; return Promise.resolve({ worldModel, validation }); } // === src/cli.ts === #!/usr/bin/env node import { program } from "commander"; import { readFileSync, writeFileSync, existsSync } from "node:fs"; import { resolve } from "node:path"; import chalk from "chalk"; import { stringify as yamlStringify } from "yaml"; import { buildWorldModel } from "./swm.js"; import { refineWorldModel } from "./agents/refinement.js"; import { mergeWorldModels, diffWorldModels } from "./utils/merge.js"; import { findEntity, findDependents, toMermaid, toDot, getStats, } from "./utils/graph.js"; import { queryWorldModel } from "./agents/query.js"; import { intersection, difference, overlay } from "./utils/algebra.js"; import { toClaudeMd } from "./export/claude-md.js"; import { toSystemPrompt } from "./export/system-prompt.js"; import { toMcpSchema } from "./export/mcp-schema.js"; import { createTimeline, addSnapshot, entityHistory, timelineSummary, } from "./utils/timeline.js"; import type { Timeline } from "./utils/timeline.js"; import type { PipelineInput } from "./pipeline/index.js"; import type { WorldModelType } 
from "./schema/index.js"; function detectSourceType(raw: string): PipelineInput["sourceType"] { if (raw.startsWith("http://") || raw.startsWith("https://")) return "url"; if ( raw.includes("function ") || raw.includes("class ") || raw.includes("import ") || raw.includes("def ") || raw.includes("fn ") ) return "code"; if (raw.includes("?") && raw.includes(":")) return "conversation"; return "text"; } function readInput(inputArg?: string, filePath?: string): string { if (filePath) return readFileSync(resolve(filePath), "utf-8"); if (inputArg) { try { return readFileSync(resolve(inputArg), "utf-8"); } catch { return inputArg; } } throw new Error( "No input provided. Pass text, a file path, or use -f .", ); } function readModel(path: string): WorldModelType { const raw = readFileSync(resolve(path), "utf-8"); return JSON.parse(raw) as WorldModelType; } function formatOutput( model: WorldModelType, format: string, pretty: boolean, ): string { if (format === "yaml") return yamlStringify(model); if (format === "mermaid") return toMermaid(model); if (format === "dot") return toDot(model); return pretty ? 
JSON.stringify(model, null, 2) : JSON.stringify(model); } function stageCallbacks(quiet?: boolean) { return { onStageStart: (name: string) => { if (!quiet) process.stderr.write(chalk.yellow(` ▸ ${name}...`)); }, onStageEnd: (_name: string, ms: number) => { if (!quiet) process.stderr.write(chalk.green(` done (${ms}ms)\n`)); }, }; } program .name("swm") .description( "Structured World Model — turn anything into a structured world model", ) .version("0.1.0"); // ─── model ──────────────────────────────────────────────────── program .command("model") .description("Build a structured world model from input") .argument("[input]", "Text input or file path") .option("-f, --file ", "Read input from file") .option("-o, --output ", "Write output to file") .option( "-t, --type ", "Source type: text, code, document, url, conversation, mixed", ) .option( "--format ", "Output format: json, yaml, mermaid, dot", "json", ) .option("--pretty", "Pretty-print JSON output", true) .option("--quiet", "Suppress progress output") .option( "-p, --passes ", "Number of extraction passes (1=standard, 2-3=deeper)", "1", ) .action( async ( inputArg: string | undefined, opts: Record, ) => { try { const raw = readInput(inputArg, opts.file as string | undefined); if (!raw.trim()) { console.error(chalk.red("Error: No input provided")); process.exit(1); } const sourceType = (opts.type as PipelineInput["sourceType"]) || detectSourceType(raw); const input: PipelineInput = { raw, sourceType, name: (opts.file as string) || (inputArg && inputArg.length < 100 ? inputArg : undefined), }; if (!opts.quiet) { console.error(chalk.blue("■ Structured World Model")); console.error( chalk.gray(` Source: ${sourceType} (${raw.length} chars)\n`), ); } const passes = parseInt((opts.passes as string) ?? "1", 10) || 1; const result = await buildWorldModel(input, { ...stageCallbacks(opts.quiet as boolean), passes, }); const output = formatOutput( result.worldModel, (opts.format as string) ?? 
"json", (opts.pretty as boolean) ?? true, ); if (opts.output) { writeFileSync(resolve(opts.output as string), output, "utf-8"); if (!opts.quiet) console.error(chalk.green(`\n ✓ Written to ${opts.output}`)); } else { console.log(output); } if (!opts.quiet) { const v = result.validation; const statusColor = v.valid ? chalk.green : chalk.red; console.error( statusColor( `\n Validation: ${v.valid ? "PASSED" : "FAILED"} — ${v.stats.entities} entities, ${v.stats.relations} relations, ${v.stats.processes} processes, ${v.stats.constraints} constraints`, ), ); if (v.issues.length > 0) { console.error(chalk.gray(` Issues:`)); for (const issue of v.issues) { const icon = issue.type === "error" ? chalk.red("✗") : issue.type === "warning" ? chalk.yellow("!") : chalk.blue("i"); console.error(` ${icon} ${issue.message}`); } } console.error(chalk.gray(`\n Total: ${result.totalDurationMs}ms`)); } } catch (err) { console.error( chalk.red( `Error: ${err instanceof Error ? err.message : String(err)}`, ), ); process.exit(1); } }, ); // ─── refine ─────────────────────────────────────────────────── program .command("refine") .description( "Refine an existing world model with new input (incremental extraction)", ) .argument("", "Path to existing world model JSON") .argument("[input]", "New text input or file path") .option("-f, --file ", "Read new input from file") .option("-o, --output ", "Write refined model to file") .option("-t, --type ", "Source type of new input") .option( "--format ", "Output format: json, yaml, mermaid, dot", "json", ) .option("--quiet", "Suppress progress output") .action( async ( modelPath: string, inputArg: string | undefined, opts: Record, ) => { try { const existing = readModel(modelPath); const raw = readInput(inputArg, opts.file as string | undefined); const sourceType = (opts.type as PipelineInput["sourceType"]) || detectSourceType(raw); if (!opts.quiet) { console.error(chalk.blue("■ Refining World Model")); console.error( chalk.gray( ` Existing: 
${existing.entities.length} entities, ${existing.relations.length} relations`, ), ); console.error( chalk.gray(` New input: ${sourceType} (${raw.length} chars)\n`), ); } const { worldModel, delta } = await refineWorldModel( existing, { raw, sourceType }, stageCallbacks(opts.quiet as boolean), ); const output = formatOutput( worldModel, (opts.format as string) ?? "json", true, ); if (opts.output) { writeFileSync(resolve(opts.output as string), output, "utf-8"); if (!opts.quiet) console.error(chalk.green(`\n ✓ Written to ${opts.output}`)); } else { console.log(output); } if (!opts.quiet) { console.error( chalk.gray( `\n Delta: +${delta.entities.length} entities, +${delta.relations.length} relations, +${delta.processes.length} processes`, ), ); console.error( chalk.gray( ` Result: ${worldModel.entities.length} entities, ${worldModel.relations.length} relations total`, ), ); } } catch (err) { console.error( chalk.red( `Error: ${err instanceof Error ? err.message : String(err)}`, ), ); process.exit(1); } }, ); // ─── merge ──────────────────────────────────────────────────── program .command("merge") .description("Merge two world models into one") .argument("", "Path to first world model JSON") .argument("", "Path to second world model JSON") .option("-o, --output ", "Write merged model to file") .option("--format ", "Output format: json, yaml", "json") .action( ( pathA: string, pathB: string, opts: Record, ) => { try { const a = readModel(pathA); const b = readModel(pathB); const merged = mergeWorldModels(a, b); const output = formatOutput(merged, opts.format ?? "json", true); if (opts.output) { writeFileSync(resolve(opts.output), output, "utf-8"); console.error( chalk.green(`✓ Merged model written to ${opts.output}`), ); } else { console.log(output); } console.error( chalk.gray( ` ${merged.entities.length} entities, ${merged.relations.length} relations`, ), ); } catch (err) { console.error( chalk.red( `Error: ${err instanceof Error ? 
err.message : String(err)}`, ), ); process.exit(1); } }, ); // ─── diff ───────────────────────────────────────────────────── program .command("diff") .description("Diff two world models") .argument("", "Path to before world model JSON") .argument("", "Path to after world model JSON") .action((beforePath: string, afterPath: string) => { try { const before = readModel(beforePath); const after = readModel(afterPath); const diff = diffWorldModels(before, after); console.log(chalk.blue("■ World Model Diff\n")); console.log(chalk.white(` Summary: ${diff.summary}\n`)); if (diff.entities.added.length) { console.log(chalk.green(" + Entities added:")); for (const name of diff.entities.added) console.log(chalk.green(` + ${name}`)); } if (diff.entities.removed.length) { console.log(chalk.red(" - Entities removed:")); for (const name of diff.entities.removed) console.log(chalk.red(` - ${name}`)); } if (diff.entities.modified.length) { console.log(chalk.yellow(" ~ Entities modified:")); for (const name of diff.entities.modified) console.log(chalk.yellow(` ~ ${name}`)); } if (diff.relations.added.length) { console.log( chalk.green(` + ${diff.relations.added.length} relations added`), ); } if (diff.relations.removed.length) { console.log( chalk.red(` - ${diff.relations.removed.length} relations removed`), ); } if (diff.processes.added.length) { console.log( chalk.green(` + ${diff.processes.added.length} processes added`), ); } if (diff.constraints.added.length) { console.log( chalk.green(` + ${diff.constraints.added.length} constraints added`), ); } } catch (err) { console.error( chalk.red(`Error: ${err instanceof Error ? 
err.message : String(err)}`), ); process.exit(1); } }); // ─── inspect ────────────────────────────────────────────────── program .command("inspect") .description("Inspect a world model — stats, entity lookup, graph export") .argument("", "Path to world model JSON") .option( "-e, --entity ", "Look up a specific entity and show its relations", ) .option("--stats", "Show detailed statistics") .option("--format ", "Export format: mermaid, dot") .action( (modelPath: string, opts: Record) => { try { const model = readModel(modelPath); if (opts.format) { console.log(formatOutput(model, opts.format as string, true)); return; } if (opts.entity) { const entity = findEntity(model, opts.entity as string); if (!entity) { console.error(chalk.red(`Entity "${opts.entity}" not found`)); process.exit(1); } console.log( chalk.blue(`■ ${entity.name}`) + chalk.gray(` (${entity.type})`), ); console.log(chalk.white(` ${entity.description}`)); if (entity.properties) { console.log( chalk.gray(` Properties: ${JSON.stringify(entity.properties)}`), ); } const deps = findDependents(model, entity.id); if (deps.incoming.length) { console.log(chalk.gray("\n Incoming:")); for (const d of deps.incoming) { console.log( ` ${d.entity.name} —[${d.relation.type}]→ ${entity.name}`, ); } } if (deps.outgoing.length) { console.log(chalk.gray("\n Outgoing:")); for (const d of deps.outgoing) { console.log( ` ${entity.name} —[${d.relation.type}]→ ${d.entity.name}`, ); } } return; } // Default: show stats const stats = getStats(model); console.log(chalk.blue(`■ ${model.name}`)); console.log(chalk.gray(` ${model.description}\n`)); console.log(` Entities: ${stats.entities.total}`); for (const [type, count] of Object.entries(stats.entities.byType)) { console.log(chalk.gray(` ${type}: ${count}`)); } console.log(` Relations: ${stats.relations.total}`); for (const [type, count] of Object.entries(stats.relations.byType)) { console.log(chalk.gray(` ${type}: ${count}`)); } console.log( ` Processes: 
${stats.processes.total} (${stats.processes.totalSteps} steps)`, ); console.log( ` Constraints: ${stats.constraints.total} (${stats.constraints.hard} hard, ${stats.constraints.soft} soft)`, ); console.log(` Confidence: ${stats.confidence}`); if (stats.mostConnected.length) { console.log(chalk.gray("\n Most connected:")); for (const mc of stats.mostConnected) { console.log(` ${mc.entity}: ${mc.connections} connections`); } } } catch (err) { console.error( chalk.red( `Error: ${err instanceof Error ? err.message : String(err)}`, ), ); process.exit(1); } }, ); // ─── validate ───────────────────────────────────────────────── program .command("validate") .description("Validate a world model JSON file with full integrity checks") .argument("", "Path to world model JSON") .action(async (file: string) => { try { const model = readModel(file); console.log(chalk.blue("■ Validating world model")); console.log( chalk.gray( ` ${model.entities.length} entities, ${model.relations.length} relations\n`, ), ); const { validationAgent } = await import("./agents/validation.js"); const { validation } = await validationAgent({ input: { raw: "", sourceType: "text" }, worldModel: model, }); const statusColor = validation.valid ? chalk.green : chalk.red; console.log( statusColor(` ${validation.valid ? "✓ VALID" : "✗ INVALID"}`), ); if (validation.issues.length > 0) { for (const issue of validation.issues) { const icon = issue.type === "error" ? chalk.red("✗") : issue.type === "warning" ? chalk.yellow("!") : chalk.blue("i"); console.log(` ${icon} [${issue.code}] ${issue.message}`); } } else { console.log(chalk.green(" No issues found")); } console.log( chalk.gray( `\n Stats: ${validation.stats.entities} entities, ${validation.stats.relations} relations, ${validation.stats.processes} processes, ${validation.stats.constraints} constraints`, ), ); } catch (err) { console.error( chalk.red(`Error: ${err instanceof Error ? 
err.message : String(err)}`), ); process.exit(1); } }); // ─── query ──────────────────────────────────────────────────── program .command("query") .description("Ask a question about a world model") .argument("", "Path to world model JSON") .argument("", "Natural language question") .option("--json", "Output result as JSON") .action( async ( modelPath: string, question: string, opts: Record, ) => { try { const model = readModel(modelPath); const result = await queryWorldModel(model, question); if (opts.json) { console.log(JSON.stringify(result, null, 2)); } else { console.log(result.answer); console.error( chalk.gray( `\n Method: ${result.method} | Confidence: ${result.confidence} | Entities: ${result.entities_referenced.join(", ") || "none"}`, ), ); } } catch (err) { console.error( chalk.red( `Error: ${err instanceof Error ? err.message : String(err)}`, ), ); process.exit(1); } }, ); // ─── algebra: intersect ─────────────────────────────────────── program .command("intersect") .description("Compute the intersection of two world models (shared entities)") .argument("", "Path to first world model JSON") .argument("", "Path to second world model JSON") .option("-o, --output ", "Write result to file") .action( ( pathA: string, pathB: string, opts: Record, ) => { try { const result = intersection(readModel(pathA), readModel(pathB)); const output = JSON.stringify(result, null, 2); if (opts.output) { writeFileSync(resolve(opts.output), output, "utf-8"); console.error(chalk.green(`✓ Written to ${opts.output}`)); } else { console.log(output); } console.error( chalk.gray( ` ${result.entities.length} shared entities, ${result.relations.length} shared relations`, ), ); } catch (err) { console.error( chalk.red( `Error: ${err instanceof Error ? 
err.message : String(err)}`, ), ); process.exit(1); } }, ); // ─── algebra: subtract ─────────────────────────────────────── program .command("subtract") .description("Compute A \\ B — entities in A that are not in B") .argument("", "Path to base world model JSON") .argument("", "Path to model to subtract") .option("-o, --output ", "Write result to file") .action( ( pathA: string, pathB: string, opts: Record, ) => { try { const result = difference(readModel(pathA), readModel(pathB)); const output = JSON.stringify(result, null, 2); if (opts.output) { writeFileSync(resolve(opts.output), output, "utf-8"); console.error(chalk.green(`✓ Written to ${opts.output}`)); } else { console.log(output); } console.error( chalk.gray(` ${result.entities.length} unique entities remaining`), ); } catch (err) { console.error( chalk.red( `Error: ${err instanceof Error ? err.message : String(err)}`, ), ); process.exit(1); } }, ); // ─── algebra: overlay ──────────────────────────────────────── program .command("overlay") .description( "Apply a lens model on top of a base model (constraints, relations overlay)", ) .argument("", "Path to base world model JSON") .argument("", "Path to lens model to overlay") .option("-o, --output ", "Write result to file") .action( ( basePath: string, lensPath: string, opts: Record, ) => { try { const result = overlay(readModel(basePath), readModel(lensPath)); const output = JSON.stringify(result, null, 2); if (opts.output) { writeFileSync(resolve(opts.output), output, "utf-8"); console.error(chalk.green(`✓ Written to ${opts.output}`)); } else { console.log(output); } console.error( chalk.gray( ` ${result.entities.length} entities, ${result.constraints.length} constraints after overlay`, ), ); } catch (err) { console.error( chalk.red( `Error: ${err instanceof Error ? 
err.message : String(err)}`, ), ); process.exit(1); } }, ); // ─── export ────────────────────────────────────────────────── program .command("export") .description("Export a world model as AI-consumable context") .argument("", "Path to world model JSON") .option( "--as ", "Export format: claude-md, system-prompt, mcp", "claude-md", ) .option("-o, --output ", "Write to file") .action((modelPath: string, opts: Record) => { try { const model = readModel(modelPath); let output: string; switch (opts.as) { case "claude-md": output = toClaudeMd(model); break; case "system-prompt": output = toSystemPrompt(model); break; case "mcp": output = JSON.stringify(toMcpSchema(model), null, 2); break; default: console.error( chalk.red( `Unknown export format: ${opts.as}. Use: claude-md, system-prompt, mcp`, ), ); process.exit(1); } if (opts.output) { writeFileSync(resolve(opts.output), output, "utf-8"); console.error( chalk.green(`✓ Exported as ${opts.as} to ${opts.output}`), ); } else { console.log(output); } } catch (err) { console.error( chalk.red(`Error: ${err instanceof Error ? err.message : String(err)}`), ); process.exit(1); } }); // ─── timeline: snapshot ─────────────────────────────────────── program .command("snapshot") .description("Add a world model as a snapshot to a timeline") .argument("", "Path to world model JSON") .option( "--timeline ", "Path to timeline JSON (created if missing)", "timeline.json", ) .option("-l, --label