import fsSync from "node:fs"; import fs from "node:fs/promises"; import os from "node:os"; import path from "node:path"; import type { AppMessage, ThinkingLevel } from "@mariozechner/pi-agent-core"; import { type Api, type AssistantMessage, type Model, type OAuthStorage, setOAuthStorage, } from "@mariozechner/pi-ai"; import { buildSystemPrompt, createAgentSession, defaultGetApiKey, findModelByProviderAndId, SessionManager, SettingsManager, type Skill, } from "@mariozechner/pi-coding-agent"; import type { ThinkLevel, VerboseLevel } from "../auto-reply/thinking.js"; import { formatToolAggregate } from "../auto-reply/tool-meta.js"; import type { ClawdisConfig } from "../config/config.js"; import { splitMediaFromOutput } from "../media/parse.js"; import { enqueueCommand } from "../process/command-queue.js"; import { CONFIG_DIR, resolveUserPath } from "../utils.js"; import { resolveClawdisAgentDir } from "./agent-paths.js"; import { DEFAULT_MODEL, DEFAULT_PROVIDER } from "./defaults.js"; import { ensureClawdisModelsJson } from "./models-config.js"; import { buildBootstrapContextFiles, ensureSessionHeader, formatAssistantErrorText, sanitizeSessionMessagesImages, } from "./pi-embedded-helpers.js"; import { subscribeEmbeddedPiSession } from "./pi-embedded-subscribe.js"; import { extractAssistantText } from "./pi-embedded-utils.js"; import { createClawdisCodingTools } from "./pi-tools.js"; import { applySkillEnvOverrides, applySkillEnvOverridesFromSnapshot, buildWorkspaceSkillSnapshot, loadWorkspaceSkillEntries, type SkillEntry, type SkillSnapshot, } from "./skills.js"; import { buildAgentSystemPromptAppend } from "./system-prompt.js"; import { loadWorkspaceBootstrapFiles } from "./workspace.js"; export type EmbeddedPiAgentMeta = { sessionId: string; provider: string; model: string; usage?: { input?: number; output?: number; cacheRead?: number; cacheWrite?: number; total?: number; }; }; export type EmbeddedPiRunMeta = { durationMs: number; agentMeta?: EmbeddedPiAgentMeta; aborted?: boolean; }; export type EmbeddedPiRunResult = { payloads?: Array<{ text?: string; mediaUrl?: string; mediaUrls?: string[]; }>; meta: EmbeddedPiRunMeta; }; type EmbeddedPiQueueHandle = { queueMessage: (text: string) => Promise; isStreaming: () => boolean; }; const ACTIVE_EMBEDDED_RUNS = new Map(); const OAUTH_FILENAME = "oauth.json"; const DEFAULT_OAUTH_DIR = path.join(CONFIG_DIR, "credentials"); let oauthStorageConfigured = false; let cachedDefaultApiKey: ReturnType | null = null; function resolveClawdisOAuthPath(): string { const overrideDir = process.env.CLAWDIS_OAUTH_DIR?.trim() || DEFAULT_OAUTH_DIR; return path.join(resolveUserPath(overrideDir), OAUTH_FILENAME); } function loadOAuthStorageAt(pathname: string): OAuthStorage | null { if (!fsSync.existsSync(pathname)) return null; try { const content = fsSync.readFileSync(pathname, "utf8"); const json = JSON.parse(content) as OAuthStorage; if (!json || typeof json !== "object") return null; return json; } catch { return null; } } function hasAnthropicOAuth(storage: OAuthStorage): boolean { const entry = storage.anthropic as | { refresh?: string; refresh_token?: string; refreshToken?: string; access?: string; access_token?: string; accessToken?: string; } | undefined; if (!entry) return false; const refresh = entry.refresh ?? entry.refresh_token ?? entry.refreshToken ?? ""; const access = entry.access ?? entry.access_token ?? entry.accessToken ?? ""; return Boolean(refresh.trim() && access.trim()); } function saveOAuthStorageAt(pathname: string, storage: OAuthStorage): void { const dir = path.dirname(pathname); fsSync.mkdirSync(dir, { recursive: true, mode: 0o700 }); fsSync.writeFileSync( pathname, `${JSON.stringify(storage, null, 2)}\n`, "utf8", ); fsSync.chmodSync(pathname, 0o600); } function legacyOAuthPaths(): string[] { const paths: string[] = []; const piOverride = process.env.PI_CODING_AGENT_DIR?.trim(); if (piOverride) { paths.push(path.join(resolveUserPath(piOverride), OAUTH_FILENAME)); } paths.push(path.join(os.homedir(), ".pi", "agent", OAUTH_FILENAME)); paths.push(path.join(os.homedir(), ".claude", OAUTH_FILENAME)); paths.push(path.join(os.homedir(), ".config", "claude", OAUTH_FILENAME)); paths.push(path.join(os.homedir(), ".config", "anthropic", OAUTH_FILENAME)); return Array.from(new Set(paths)); } function importLegacyOAuthIfNeeded(destPath: string): void { if (fsSync.existsSync(destPath)) return; for (const legacyPath of legacyOAuthPaths()) { const storage = loadOAuthStorageAt(legacyPath); if (!storage || !hasAnthropicOAuth(storage)) continue; saveOAuthStorageAt(destPath, storage); return; } } function ensureOAuthStorage(): void { if (oauthStorageConfigured) return; oauthStorageConfigured = true; const oauthPath = resolveClawdisOAuthPath(); importLegacyOAuthIfNeeded(oauthPath); setOAuthStorage({ load: () => loadOAuthStorageAt(oauthPath) ?? {}, save: (storage) => saveOAuthStorageAt(oauthPath, storage), }); } function getDefaultApiKey() { if (!cachedDefaultApiKey) { ensureOAuthStorage(); cachedDefaultApiKey = defaultGetApiKey(); } return cachedDefaultApiKey; } export function queueEmbeddedPiMessage( sessionId: string, text: string, ): boolean { const handle = ACTIVE_EMBEDDED_RUNS.get(sessionId); if (!handle) return false; if (!handle.isStreaming()) return false; void handle.queueMessage(text); return true; } function mapThinkingLevel(level?: ThinkLevel): ThinkingLevel { // pi-agent-core supports "xhigh" too; Clawdis doesn't surface it for now. if (!level) return "off"; return level; } function resolveModel( provider: string, modelId: string, agentDir?: string, ): { model?: Model; error?: string } { const model = findModelByProviderAndId( provider, modelId, agentDir, ) as Model | null; if (!model) return { error: `Unknown model: ${provider}/${modelId}` }; return { model }; } async function getApiKeyForModel(model: Model): Promise { ensureOAuthStorage(); if (model.provider === "anthropic") { const oauthEnv = process.env.ANTHROPIC_OAUTH_TOKEN; if (oauthEnv?.trim()) return oauthEnv.trim(); } const key = await getDefaultApiKey()(model); if (key) return key; throw new Error(`No API key found for provider "${model.provider}"`); } function resolvePromptSkills( snapshot: SkillSnapshot, entries: SkillEntry[], ): Skill[] { if (snapshot.resolvedSkills?.length) { return snapshot.resolvedSkills; } const snapshotNames = snapshot.skills.map((entry) => entry.name); if (snapshotNames.length === 0) return []; const entryByName = new Map( entries.map((entry) => [entry.skill.name, entry.skill]), ); return snapshotNames .map((name) => entryByName.get(name)) .filter((skill): skill is Skill => Boolean(skill)); } export async function runEmbeddedPiAgent(params: { sessionId: string; sessionFile: string; workspaceDir: string; config?: ClawdisConfig; skillsSnapshot?: SkillSnapshot; prompt: string; provider?: string; model?: string; thinkLevel?: ThinkLevel; verboseLevel?: VerboseLevel; timeoutMs: number; runId: string; abortSignal?: AbortSignal; shouldEmitToolResult?: () => boolean; onPartialReply?: (payload: { text?: string; mediaUrls?: string[]; }) => void | Promise; onToolResult?: (payload: { text?: string; mediaUrls?: string[]; }) => void | Promise; onAgentEvent?: (evt: { stream: string; data: Record; }) => void; enqueue?: typeof enqueueCommand; }): Promise { const enqueue = params.enqueue ?? enqueueCommand; return enqueue(async () => { const started = Date.now(); const resolvedWorkspace = resolveUserPath(params.workspaceDir); const prevCwd = process.cwd(); const provider = (params.provider ?? DEFAULT_PROVIDER).trim() || DEFAULT_PROVIDER; const modelId = (params.model ?? DEFAULT_MODEL).trim() || DEFAULT_MODEL; await ensureClawdisModelsJson(params.config); const agentDir = resolveClawdisAgentDir(); const { model, error } = resolveModel(provider, modelId, agentDir); if (!model) { throw new Error(error ?? `Unknown model: ${provider}/${modelId}`); } const thinkingLevel = mapThinkingLevel(params.thinkLevel); await fs.mkdir(resolvedWorkspace, { recursive: true }); await ensureSessionHeader({ sessionFile: params.sessionFile, sessionId: params.sessionId, cwd: resolvedWorkspace, }); let restoreSkillEnv: (() => void) | undefined; process.chdir(resolvedWorkspace); try { const shouldLoadSkillEntries = !params.skillsSnapshot || !params.skillsSnapshot.resolvedSkills; const skillEntries = shouldLoadSkillEntries ? loadWorkspaceSkillEntries(resolvedWorkspace) : []; const skillsSnapshot = params.skillsSnapshot ?? buildWorkspaceSkillSnapshot(resolvedWorkspace, { config: params.config, entries: skillEntries, }); restoreSkillEnv = params.skillsSnapshot ? applySkillEnvOverridesFromSnapshot({ snapshot: params.skillsSnapshot, config: params.config, }) : applySkillEnvOverrides({ skills: skillEntries ?? [], config: params.config, }); const bootstrapFiles = await loadWorkspaceBootstrapFiles(resolvedWorkspace); const contextFiles = buildBootstrapContextFiles(bootstrapFiles); const promptSkills = resolvePromptSkills(skillsSnapshot, skillEntries); const tools = createClawdisCodingTools(); const systemPrompt = buildSystemPrompt({ appendPrompt: buildAgentSystemPromptAppend({ workspaceDir: resolvedWorkspace, defaultThinkLevel: params.thinkLevel, }), contextFiles, skills: promptSkills, cwd: resolvedWorkspace, tools, }); const sessionManager = SessionManager.open(params.sessionFile, agentDir); const settingsManager = SettingsManager.create( resolvedWorkspace, agentDir, ); const { session } = await createAgentSession({ cwd: resolvedWorkspace, agentDir, model, thinkingLevel, systemPrompt, // TODO(steipete): Once pi-mono publishes file-magic MIME detection in `read` image payloads, // remove `createClawdisCodingTools()` and use upstream `codingTools` again. tools, sessionManager, settingsManager, getApiKey: async (m) => { return await getApiKeyForModel(m as Model); }, skills: promptSkills, contextFiles, }); const prior = await sanitizeSessionMessagesImages( session.messages, "session:history", ); if (prior.length > 0) { session.agent.replaceMessages(prior); } const queueHandle: EmbeddedPiQueueHandle = { queueMessage: async (text: string) => { await session.queueMessage(text); }, isStreaming: () => session.isStreaming, }; ACTIVE_EMBEDDED_RUNS.set(params.sessionId, queueHandle); let aborted = Boolean(params.abortSignal?.aborted); const { assistantTexts, toolMetas, unsubscribe, flush: flushToolDebouncer, } = subscribeEmbeddedPiSession({ session, runId: params.runId, verboseLevel: params.verboseLevel, shouldEmitToolResult: params.shouldEmitToolResult, onToolResult: params.onToolResult, onPartialReply: params.onPartialReply, onAgentEvent: params.onAgentEvent, }); const abortTimer = setTimeout( () => { aborted = true; void session.abort(); }, Math.max(1, params.timeoutMs), ); let messagesSnapshot: AppMessage[] = []; let sessionIdUsed = session.sessionId; const onAbort = () => { aborted = true; void session.abort(); }; if (params.abortSignal) { if (params.abortSignal.aborted) { onAbort(); } else { params.abortSignal.addEventListener("abort", onAbort, { once: true }); } } let promptError: unknown = null; try { try { await session.prompt(params.prompt); } catch (err) { promptError = err; } finally { messagesSnapshot = session.messages.slice(); sessionIdUsed = session.sessionId; } } finally { clearTimeout(abortTimer); unsubscribe(); flushToolDebouncer(); if (ACTIVE_EMBEDDED_RUNS.get(params.sessionId) === queueHandle) { ACTIVE_EMBEDDED_RUNS.delete(params.sessionId); } session.dispose(); params.abortSignal?.removeEventListener?.("abort", onAbort); } if (promptError && !aborted) { throw promptError; } const lastAssistant = messagesSnapshot .slice() .reverse() .find((m) => (m as AppMessage)?.role === "assistant") as | AssistantMessage | undefined; const usage = lastAssistant?.usage; const agentMeta: EmbeddedPiAgentMeta = { sessionId: sessionIdUsed, provider: lastAssistant?.provider ?? provider, model: lastAssistant?.model ?? model.id, usage: usage ? { input: usage.input, output: usage.output, cacheRead: usage.cacheRead, cacheWrite: usage.cacheWrite, total: usage.totalTokens, } : undefined, }; const replyItems: Array<{ text: string; media?: string[] }> = []; const errorText = lastAssistant ? formatAssistantErrorText(lastAssistant) : undefined; if (errorText) replyItems.push({ text: errorText }); const inlineToolResults = params.verboseLevel === "on" && !params.onPartialReply && !params.onToolResult && toolMetas.length > 0; if (inlineToolResults) { for (const { toolName, meta } of toolMetas) { const agg = formatToolAggregate(toolName, meta ? [meta] : []); const { text: cleanedText, mediaUrls } = splitMediaFromOutput(agg); if (cleanedText) replyItems.push({ text: cleanedText, media: mediaUrls }); } } for (const text of assistantTexts.length ? assistantTexts : lastAssistant ? [extractAssistantText(lastAssistant)] : []) { const { text: cleanedText, mediaUrls } = splitMediaFromOutput(text); if (!cleanedText && (!mediaUrls || mediaUrls.length === 0)) continue; replyItems.push({ text: cleanedText, media: mediaUrls }); } const payloads = replyItems .map((item) => ({ text: item.text?.trim() ? item.text.trim() : undefined, mediaUrls: item.media?.length ? item.media : undefined, mediaUrl: item.media?.[0], })) .filter( (p) => p.text || p.mediaUrl || (p.mediaUrls && p.mediaUrls.length > 0), ); return { payloads: payloads.length ? payloads : undefined, meta: { durationMs: Date.now() - started, agentMeta, aborted, }, }; } finally { restoreSkillEnv?.(); process.chdir(prevCwd); } }); }