- Upgrade all pi packages from 0.49.3 to 0.50.4
- Replace discoverAuthStorage() with new AuthStorage()
- Replace discoverModels() with new ModelRegistry()
- Remove deprecated CreateAgentSessionOptions properties:
  - systemPrompt (removed from API)
  - skills (removed from API)
  - contextFiles (removed from API)
  - additionalExtensionPaths (removed from API)
- Fix type issues with OAuth credentials email field
- Update test mocks to work with new ModelRegistry class
- Add null check for runner.task() in telegram monitor

Resolves #4165
168 lines
5.1 KiB
TypeScript
168 lines
5.1 KiB
TypeScript
import process from "node:process";
|
|
|
|
import { extractErrorCode, formatUncaughtError } from "./errors.js";
|
|
|
|
/**
 * Callback consulted for every unhandled rejection.
 * Returning `true` marks the rejection as handled and stops further processing.
 */
type UnhandledRejectionHandler = (reason: unknown) => boolean;

/** Currently registered handlers; a Set, so registering the same function twice keeps one entry. */
const handlers = new Set<UnhandledRejectionHandler>();
|
|
|
|
/**
 * Error codes classified as fatal.
 * A rejection carrying one of these codes (directly or on its immediate cause)
 * is logged as FATAL and the process exits with status 1.
 */
const FATAL_ERROR_CODES = new Set([
  "ERR_OUT_OF_MEMORY",
  "ERR_SCRIPT_EXECUTION_TIMEOUT",
  "ERR_WORKER_OUT_OF_MEMORY",
  "ERR_WORKER_UNCAUGHT_EXCEPTION",
  "ERR_WORKER_INITIALIZATION_FAILED",
]);
|
|
|
|
/**
 * Error codes classified as configuration problems.
 * A rejection carrying one of these codes is logged as a configuration error
 * and the process exits with status 1.
 */
const CONFIG_ERROR_CODES = new Set<string>([
  "INVALID_CONFIG",
  "MISSING_API_KEY",
  "MISSING_CREDENTIALS",
]);
|
|
|
|
// Network error codes that indicate transient failures (shouldn't crash the gateway).
// Covers socket/DNS-level errno codes plus the `UND_ERR_*` codes.
const TRANSIENT_NETWORK_CODES = new Set([
  "ECONNRESET",
  "ECONNREFUSED",
  "ENOTFOUND",
  "ETIMEDOUT",
  "ESOCKETTIMEDOUT",
  "ECONNABORTED",
  "EPIPE",
  "EHOSTUNREACH",
  "ENETUNREACH",
  "EAI_AGAIN",
  "UND_ERR_CONNECT_TIMEOUT",
  "UND_ERR_DNS_RESOLVE_FAILED",
  "UND_ERR_CONNECT",
  "UND_ERR_SOCKET",
  "UND_ERR_HEADERS_TIMEOUT",
  "UND_ERR_BODY_TIMEOUT",
]);
|
|
|
|
/**
 * Reads the `cause` property of an error-like value.
 *
 * @param err - Any thrown or rejected value.
 * @returns The value of `err.cause`, or `undefined` when `err` is falsy or not an object.
 */
function getErrorCause(err: unknown): unknown {
  if (!err || typeof err !== "object") return undefined;
  return (err as { cause?: unknown }).cause;
}
|
|
|
|
/**
 * Extracts an error code from `err`, falling back to its immediate `cause`.
 *
 * Only one level of `cause` is inspected here; deeper chains are not walked.
 * The extraction itself is delegated to `extractErrorCode` from `./errors.js`.
 *
 * @param err - Any thrown or rejected value.
 * @returns The code found on `err` if truthy, otherwise whatever
 *   `extractErrorCode` yields for `err.cause`.
 */
function extractErrorCodeWithCause(err: unknown): string | undefined {
  const direct = extractErrorCode(err);
  if (direct) return direct;
  return extractErrorCode(getErrorCause(err));
}
|
|
|
|
/**
 * Checks if an error is an AbortError.
 * These are typically intentional cancellations (e.g., during shutdown) and shouldn't crash.
 *
 * @param err - Any thrown or rejected value.
 * @returns `true` when `err` is an object whose `name` stringifies to `"AbortError"`,
 *   or whose string `message` is exactly `"This operation was aborted"`; `false` otherwise
 *   (including for primitives and `null`).
 */
export function isAbortError(err: unknown): boolean {
  if (!err || typeof err !== "object") return false;
  const name = "name" in err ? String(err.name) : "";
  if (name === "AbortError") return true;
  // Check for "This operation was aborted" message from Node's undici
  const message = "message" in err && typeof err.message === "string" ? err.message : "";
  if (message === "This operation was aborted") return true;
  return false;
}
|
|
|
|
/**
 * Reports whether `err` (or its immediate cause) carries a code listed in `FATAL_ERROR_CODES`.
 *
 * @param err - Any thrown or rejected value.
 * @returns `true` only when a code was extracted and it is in the fatal set.
 */
function isFatalError(err: unknown): boolean {
  const code = extractErrorCodeWithCause(err);
  return code !== undefined && FATAL_ERROR_CODES.has(code);
}
|
|
|
|
/**
 * Reports whether `err` (or its immediate cause) carries a code listed in `CONFIG_ERROR_CODES`.
 *
 * @param err - Any thrown or rejected value.
 * @returns `true` only when a code was extracted and it is in the configuration-error set.
 */
function isConfigError(err: unknown): boolean {
  const code = extractErrorCodeWithCause(err);
  return code !== undefined && CONFIG_ERROR_CODES.has(code);
}
|
|
|
|
/**
 * Checks if an error is a transient network error that shouldn't crash the gateway.
 * These are typically temporary connectivity issues that will resolve on their own.
 *
 * The check follows `cause` links and `AggregateError.errors`. Every object is
 * visited at most once, so cyclic structures (A.cause = B, B.cause = A, or an
 * AggregateError that contains itself) terminate instead of overflowing the stack.
 *
 * @param err - Any thrown or rejected value.
 * @returns `true` when `err`, something in its cause chain, or one of the errors
 *   wrapped by an `AggregateError` carries a code from `TRANSIENT_NETWORK_CODES`,
 *   or when it is a `"fetch failed"` TypeError without a usable cause.
 */
export function isTransientNetworkError(err: unknown): boolean {
  // Objects already inspected during this call. A revisit can only mean a cycle
  // (or a shared node that was already found non-transient), so it yields false.
  const seen = new WeakSet<object>();

  const visit = (current: unknown): boolean => {
    if (!current) return false;

    if (typeof current === "object") {
      if (seen.has(current)) return false;
      seen.add(current);
    }

    const code = extractErrorCodeWithCause(current);
    if (code && TRANSIENT_NETWORK_CODES.has(code)) return true;

    // A cause that points back at the error itself carries no information.
    const rawCause = getErrorCause(current);
    const cause = rawCause !== current ? rawCause : undefined;

    // "fetch failed" TypeError from undici (Node's native fetch)
    if (current instanceof TypeError && current.message === "fetch failed") {
      if (cause) return visit(cause);
      return true;
    }

    // Check the cause chain recursively
    if (cause) {
      return visit(cause);
    }

    // AggregateError may wrap multiple causes
    if (current instanceof AggregateError && current.errors?.length) {
      return current.errors.some((e) => visit(e));
    }

    return false;
  };

  return visit(err);
}
|
|
|
|
/**
 * Registers a handler that gets a chance to claim unhandled rejections.
 *
 * @param handler - Callback invoked with the rejection reason; returning `true`
 *   marks the rejection as handled.
 * @returns A function that removes this handler again.
 */
export function registerUnhandledRejectionHandler(handler: UnhandledRejectionHandler): () => void {
  handlers.add(handler);
  return () => {
    handlers.delete(handler);
  };
}
|
|
|
|
/**
 * Offers a rejection reason to every registered handler in turn.
 *
 * A handler that throws is logged via `console.error` and skipped, so one
 * faulty handler does not prevent the remaining handlers from running.
 *
 * @param reason - The rejection reason.
 * @returns `true` as soon as any handler returns a truthy value, otherwise `false`.
 */
export function isUnhandledRejectionHandled(reason: unknown): boolean {
  for (const handler of handlers) {
    try {
      if (handler(reason)) return true;
    } catch (err) {
      console.error(
        "[openclaw] Unhandled rejection handler failed:",
        err instanceof Error ? (err.stack ?? err.message) : err,
      );
    }
  }
  return false;
}
|
|
|
|
/**
 * Installs the process-wide `unhandledRejection` listener.
 *
 * For each unhandled rejection the listener applies the first matching rule:
 * 1. A registered handler claims it: nothing further happens.
 * 2. AbortError: warn and continue.
 * 3. Fatal error code: log and `process.exit(1)`.
 * 4. Configuration error code: log and `process.exit(1)`.
 * 5. Transient network error: warn (with the first five stack lines) and continue.
 * 6. Anything else: log and `process.exit(1)`.
 */
export function installUnhandledRejectionHandler(): void {
  process.on("unhandledRejection", (reason, _promise) => {
    if (isUnhandledRejectionHandled(reason)) return;

    // AbortError is typically an intentional cancellation (e.g., during shutdown)
    // Log it but don't crash - these are expected during graceful shutdown
    if (isAbortError(reason)) {
      console.warn("[openclaw] Suppressed AbortError:", formatUncaughtError(reason));
      return;
    }

    if (isFatalError(reason)) {
      console.error("[openclaw] FATAL unhandled rejection:", formatUncaughtError(reason));
      process.exit(1);
      return;
    }

    if (isConfigError(reason)) {
      console.error("[openclaw] CONFIGURATION ERROR - requires fix:", formatUncaughtError(reason));
      process.exit(1);
      return;
    }

    if (isTransientNetworkError(reason)) {
      // Log with more detail to help diagnose source (issue #4501)
      const errorDetails = formatUncaughtError(reason);
      const stack =
        reason instanceof Error && reason.stack
          ? reason.stack.split("\n").slice(0, 5).join("\n")
          : "";
      console.warn(
        "[openclaw] Non-fatal unhandled rejection (continuing):",
        errorDetails,
        stack ? `\nStack trace (truncated):\n${stack}` : "",
      );
      return;
    }

    console.error("[openclaw] Unhandled promise rejection:", formatUncaughtError(reason));
    process.exit(1);
  });
}
|