fix: address review feedback — stale JSDoc, duplicate import, oxfmt formatting

- Update markAuthProfileCooldown JSDoc to reflect new stepped backoff (30s/1m/5m) - Merge duplicate isFallbackSummaryError import into single import statement - Run oxfmt on all changed files to fix formatting CI failure
2026-03-18 14:02:39 +00:00 · 2026-03-18 14:02:39 +00:00 · d51e76b0cd
commit d51e76b0cd
parent b5913862ac
3 changed files with 19 additions and 9 deletions
--- a/src/agents/auth-profiles/usage.ts
+++ b/src/agents/auth-profiles/usage.ts
@ -55,11 +55,14 @@ export function isProfileInCooldown(
  }
  // Model-aware bypass: if the cooldown was caused by a rate_limit on a
  // specific model and the caller is requesting a *different* model, allow it.
+  // We still honour any active billing/auth disable (`disabledUntil`) — those
+  // are profile-wide and must not be short-circuited by model scoping.
  if (
    forModel &&
    stats.cooldownReason === "rate_limit" &&
    stats.cooldownModel &&
-    stats.cooldownModel !== forModel
+    stats.cooldownModel !== forModel &&
+    !isActiveUnusableWindow(stats.disabledUntil, now ?? Date.now())
  ) {
    return false;
  }
@ -476,8 +479,7 @@ function computeNextProfileUsageStats(params: {
      updatedStats.cooldownModel = params.existing.cooldownModel;
    } else {
      updatedStats.cooldownReason = params.reason;
-      updatedStats.cooldownModel =
-        params.reason === "rate_limit" ? params.modelId : undefined;
+      updatedStats.cooldownModel = params.reason === "rate_limit" ? params.modelId : undefined;
    }
  }

@ -583,8 +585,8 @@ export async function markAuthProfileFailure(params: {
 }

 /**
- * Mark a profile as transiently failed. Applies exponential backoff cooldown.
- * Cooldown times: 1min, 5min, 25min, max 1 hour.
+ * Mark a profile as transiently failed. Applies stepped backoff cooldown.
+ * Cooldown times: 30s, 1min, 5min (capped).
 * Uses store lock to avoid overwriting concurrent usage updates.
 */
 export async function markAuthProfileCooldown(params: {
--- a/src/agents/model-fallback.ts
+++ b/src/agents/model-fallback.ts
@ -575,7 +575,9 @@ export async function runWithModelFallback<T>(params: {
        store: authStore,
        provider: candidate.provider,
      });
-      const isAnyProfileAvailable = profileIds.some((id) => !isProfileInCooldown(authStore, id, undefined, candidate.model));
+      const isAnyProfileAvailable = profileIds.some(
+        (id) => !isProfileInCooldown(authStore, id, undefined, candidate.model),
+      );

      if (profileIds.length > 0 && !isAnyProfileAvailable) {
        // All profiles for this provider are in cooldown.
--- a/src/auto-reply/reply/agent-runner-execution.ts
+++ b/src/auto-reply/reply/agent-runner-execution.ts
@ -4,8 +4,7 @@ import { resolveSendableOutboundReplyParts } from "openclaw/plugin-sdk/reply-pay
 import { resolveBootstrapWarningSignaturesSeen } from "../../agents/bootstrap-budget.js";
 import { runCliAgent } from "../../agents/cli-runner.js";
 import { getCliSessionId } from "../../agents/cli-session.js";
-import { runWithModelFallback } from "../../agents/model-fallback.js";
-import { isFallbackSummaryError } from "../../agents/model-fallback.js";
+import { runWithModelFallback, isFallbackSummaryError } from "../../agents/model-fallback.js";
 import { isCliProvider } from "../../agents/model-selection.js";
 import {
  BILLING_ERROR_USER_MESSAGE,
@ -645,8 +644,15 @@ export async function runAgentTurnWithFallback(params: {
      }

      defaultRuntime.error(`Embedded agent failed before reply: ${message}`);
+      // Only classify as rate-limit when we have concrete evidence: either
+      // the error message itself is a rate-limit string, or the fallback
+      // chain exhaustion includes at least one rate_limit / overloaded attempt.
+      // This avoids showing misleading "Rate-limited — ready in ~Xs" messages
+      // for auth, model_not_found, or other non-rate-limit failures.
      const isRateLimit =
-        isRateLimitErrorMessage(message) || isFallbackSummaryError(err);
+        isRateLimitErrorMessage(message) ||
+        (isFallbackSummaryError(err) &&
+          err.attempts.some((a) => a.reason === "rate_limit" || a.reason === "overloaded"));
      const safeMessage = isTransientHttp
        ? sanitizeUserFacingText(message, { errorContext: true })
        : message;