diff --git a/src/agents/pi-embedded-helpers.ts b/src/agents/pi-embedded-helpers.ts index 4a1c4fcc5..7acdd2e52 100644 --- a/src/agents/pi-embedded-helpers.ts +++ b/src/agents/pi-embedded-helpers.ts @@ -392,6 +392,11 @@ export function formatAssistantErrorText( return `LLM request rejected: ${invalidRequest[1]}`; } + // Check for overloaded errors (Anthropic API capacity) + if (isOverloadedErrorMessage(raw)) { + return "The AI service is temporarily overloaded. Please try again in a moment."; + } + // Keep it short for WhatsApp. return raw.length > 600 ? `${raw.slice(0, 600)}…` : raw; } @@ -414,6 +419,7 @@ const ERROR_PATTERNS = { "resource_exhausted", "usage limit", ], + overloaded: [/overloaded_error|"type"\s*:\s*"overloaded"/i, "overloaded"], timeout: [ "timeout", "timed out", @@ -496,6 +502,10 @@ export function isAuthErrorMessage(raw: string): boolean { return matchesErrorPatterns(raw, ERROR_PATTERNS.auth); } +export function isOverloadedErrorMessage(raw: string): boolean { + return matchesErrorPatterns(raw, ERROR_PATTERNS.overloaded); +} + export function isCloudCodeAssistFormatError(raw: string): boolean { return matchesErrorPatterns(raw, ERROR_PATTERNS.format); } @@ -517,6 +527,7 @@ export type FailoverReason = export function classifyFailoverReason(raw: string): FailoverReason | null { if (isRateLimitErrorMessage(raw)) return "rate_limit"; + if (isOverloadedErrorMessage(raw)) return "rate_limit"; // Treat overloaded as rate limit for failover if (isCloudCodeAssistFormatError(raw)) return "format"; if (isBillingErrorMessage(raw)) return "billing"; if (isTimeoutErrorMessage(raw)) return "timeout";