From 907ff4ac8fea715562c20d4bb5e72cdf4f85c66a Mon Sep 17 00:00:00 2001
From: amabito <amabito@local>
Date: Wed, 18 Mar 2026 23:23:05 +0900
Subject: [PATCH 1/5] feat(heartbeat): add maxCostPerRun to cap embedded run
 cost

Adds a pre-call cost check in runHeartbeatOnce(). The input cost is
estimated from an approximate token count of the prompt body
(chars / 4) and per-model input pricing before dispatching to
getReplyFromConfig(). If the estimate exceeds maxCostPerRun, the run
is skipped without invoking the model. Output tokens are not included
in the estimate.

Fixes #49823
Ref #3181
---
 src/config/types.agent-defaults.ts          |   8 +
 src/infra/heartbeat-runner.cost-cap.test.ts | 206 ++++++++++++++++++++
 src/infra/heartbeat-runner.ts               |  99 ++++++++++
 3 files changed, 313 insertions(+)
 create mode 100644 src/infra/heartbeat-runner.cost-cap.test.ts

diff --git a/src/config/types.agent-defaults.ts b/src/config/types.agent-defaults.ts
index 68506e8be3c..a9ef7b82301 100644
--- a/src/config/types.agent-defaults.ts
+++ b/src/config/types.agent-defaults.ts
@@ -262,6 +262,14 @@ export type AgentDefaultsConfig = {
      * per-heartbeat token cost by avoiding the full session transcript.
      */
     isolatedSession?: boolean;
+    /**
+     * Maximum estimated input cost (USD) for a single heartbeat run. If the
+     * estimate exceeds this value, the run is skipped before calling the model.
+     * The estimate is approximate (prompt chars / 4 as tokens, input pricing only).
+     * Negative or non-finite values are ignored (treated as no cap).
+     * Default: undefined (no cap).
+     */
+    maxCostPerRun?: number;
     /**
      * When enabled, deliver the model's reasoning payload for heartbeat runs (when available)
      * as a separate message prefixed with `Reasoning:` (same as `/reasoning on`).
diff --git a/src/infra/heartbeat-runner.cost-cap.test.ts b/src/infra/heartbeat-runner.cost-cap.test.ts
new file mode 100644
index 00000000000..2478660a7b8
--- /dev/null
+++ b/src/infra/heartbeat-runner.cost-cap.test.ts
@@ -0,0 +1,206 @@
+import { afterEach, beforeEach, describe, expect, it, vi } from "vitest";
+import { telegramPlugin } from "../../extensions/telegram/src/channel.js";
+import { setTelegramRuntime } from "../../extensions/telegram/src/runtime.js";
+import { whatsappPlugin } from "../../extensions/whatsapp/src/channel.js";
+import { setWhatsAppRuntime } from "../../extensions/whatsapp/src/runtime.js";
+import * as replyModule from "../auto-reply/reply.js";
+import type { OpenClawConfig } from "../config/config.js";
+import { resolveMainSessionKey } from "../config/sessions.js";
+import { setActivePluginRegistry } from "../plugins/runtime.js";
+import { createPluginRuntime } from "../plugins/runtime/index.js";
+import { createTestRegistry } from "../test-utils/channel-plugins.js";
+import { estimateRunCost, runHeartbeatOnce } from "./heartbeat-runner.js";
+import { seedSessionStore, withTempHeartbeatSandbox } from "./heartbeat-runner.test-utils.js";
+
+// Avoid pulling optional runtime deps during isolated runs.
+vi.mock("jiti", () => ({ createJiti: () => () => ({}) }));
+
+// ---------------------------------------------------------------------------
+// Unit tests: estimateRunCost
+// ---------------------------------------------------------------------------
+
+describe("estimateRunCost", () => {
+  it("estimates cost for a known model", () => {
+    // 4000 chars = ~1000 tokens. claude-opus-4 = $15/M input tokens = $0.015/1K
+    const cost = estimateRunCost("x".repeat(4000), "claude-opus-4-20260901");
+    expect(cost).toBeCloseTo(0.015, 3);
+  });
+
+  it("estimates cost for a cheap model", () => {
+    // 4000 chars = ~1000 tokens. gemini-2.0-flash = $0.10/M = $0.0001/1K
+    const cost = estimateRunCost("x".repeat(4000), "gemini-2.0-flash");
+    expect(cost).toBeCloseTo(0.0001, 5);
+  });
+
+  it("uses conservative fallback for unknown models", () => {
+    const cost = estimateRunCost("x".repeat(4000), "some-unknown-model-v9");
+    expect(cost).toBeCloseTo(0.015, 3);
+  });
+
+  it("returns zero for empty prompt", () => {
+    const cost = estimateRunCost("", "claude-opus-4");
+    expect(cost).toBe(0);
+  });
+
+  it("returns non-zero for single-char prompt", () => {
+    // ceil(1/4) = 1 token
+    const cost = estimateRunCost("a", "claude-opus-4");
+    expect(cost).toBe(15 / 1_000_000);
+  });
+
+  it("handles large context (128K chars)", () => {
+    // 128000 chars = ~32000 tokens. claude-opus-4 = $15/M = $0.48
+    const cost = estimateRunCost("x".repeat(128_000), "claude-opus-4");
+    expect(cost).toBeCloseTo(0.48, 2);
+  });
+
+  it("is case-insensitive for model names", () => {
+    const lower = estimateRunCost("x".repeat(4000), "claude-opus-4");
+    const upper = estimateRunCost("x".repeat(4000), "CLAUDE-OPUS-4");
+    const mixed = estimateRunCost("x".repeat(4000), "Claude-Opus-4");
+    expect(lower).toBe(upper);
+    expect(lower).toBe(mixed);
+  });
+});
+
+describe("prefix matching ordering", () => {
+  it("gpt-4o matches gpt-4o pricing, not gpt-4", () => {
+    const cost4o = estimateRunCost("x".repeat(4000), "gpt-4o-2026-03-01");
+    const cost4 = estimateRunCost("x".repeat(4000), "gpt-4-0613");
+    expect(cost4o).toBeLessThan(cost4);
+    expect(cost4o).toBeCloseTo(0.0025, 4);
+  });
+
+  it("gpt-4-turbo matches gpt-4-turbo pricing, not gpt-4", () => {
+    const costTurbo = estimateRunCost("x".repeat(4000), "gpt-4-turbo-preview");
+    const cost4 = estimateRunCost("x".repeat(4000), "gpt-4-0613");
+    expect(costTurbo).toBeLessThan(cost4);
+    expect(costTurbo).toBeCloseTo(0.01, 4);
+  });
+
+  it("gpt-4 exact matches gpt-4 pricing", () => {
+    const cost = estimateRunCost("x".repeat(4000), "gpt-4-0613");
+    expect(cost).toBeCloseTo(0.03, 4);
+  });
+
+  it("o1-mini matches o1-mini pricing, not o1", () => {
+    const costMini = estimateRunCost("x".repeat(4000), "o1-mini-2026-01-01");
+    const costFull = estimateRunCost("x".repeat(4000), "o1-2026-01-01");
+    expect(costMini).toBeLessThan(costFull);
+    expect(costMini).toBeCloseTo(0.003, 4);
+  });
+
+  it("o3-mini matches o3-mini pricing, not o3", () => {
+    const costMini = estimateRunCost("x".repeat(4000), "o3-mini");
+    const costFull = estimateRunCost("x".repeat(4000), "o3-preview");
+    expect(costMini).toBeLessThan(costFull);
+    expect(costMini).toBeCloseTo(0.0011, 4);
+  });
+});
+
+// ---------------------------------------------------------------------------
+// Integration tests: runHeartbeatOnce with maxCostPerRun
+// ---------------------------------------------------------------------------
+
+beforeEach(() => {
+  const runtime = createPluginRuntime();
+  setTelegramRuntime(runtime);
+  setWhatsAppRuntime(runtime);
+  setActivePluginRegistry(
+    createTestRegistry([
+      { pluginId: "whatsapp", plugin: whatsappPlugin, source: "test" },
+      { pluginId: "telegram", plugin: telegramPlugin, source: "test" },
+    ]),
+  );
+});
+
+afterEach(() => {
+  vi.restoreAllMocks();
+});
+
+describe("runHeartbeatOnce – maxCostPerRun", () => {
+  async function runWithCostCap(params: {
+    maxCostPerRun?: number;
+    model?: string;
+  }) {
+    return withTempHeartbeatSandbox(
+      async ({ tmpDir, storePath, replySpy }) => {
+        const cfg: OpenClawConfig = {
+          agents: {
+            defaults: {
+              workspace: tmpDir,
+              heartbeat: {
+                every: "5m",
+                target: "whatsapp",
+                model: params.model ?? "claude-opus-4",
+                maxCostPerRun: params.maxCostPerRun,
+              },
+            },
+          },
+          channels: { whatsapp: { allowFrom: ["*"] } },
+          session: { store: storePath },
+        };
+        const sessionKey = resolveMainSessionKey(cfg);
+        await seedSessionStore(storePath, sessionKey, {
+          lastChannel: "whatsapp",
+          lastProvider: "whatsapp",
+          lastTo: "+1555",
+        });
+
+        replySpy.mockResolvedValue({ text: "HEARTBEAT_OK" });
+
+        const result = await runHeartbeatOnce({
+          cfg,
+          deps: { getQueueSize: () => 0, nowMs: () => 0 },
+        });
+
+        // Capture spy state before withTempHeartbeatSandbox restores it in finally.
+        const replyCallCount = replySpy.mock.calls.length;
+        return { result, replyCallCount };
+      },
+      { prefix: "openclaw-hb-costcap-" },
+    );
+  }
+
+  it("skips run when estimated cost exceeds maxCostPerRun", async () => {
+    const { result, replyCallCount } = await runWithCostCap({ maxCostPerRun: 0.0000001 });
+    expect(result).toEqual({ status: "skipped", reason: "cost-cap-exceeded" });
+    expect(replyCallCount).toBe(0);
+  });
+
+  it("proceeds when estimated cost is within maxCostPerRun", async () => {
+    const { result, replyCallCount } = await runWithCostCap({ maxCostPerRun: 100 });
+    expect(result).toEqual(expect.objectContaining({ status: "ran" }));
+    expect(replyCallCount).toBe(1);
+  });
+
+  it("proceeds when maxCostPerRun is not set", async () => {
+    const { result, replyCallCount } = await runWithCostCap({ maxCostPerRun: undefined });
+    expect(result).toEqual(expect.objectContaining({ status: "ran" }));
+    expect(replyCallCount).toBe(1);
+  });
+
+  it("skips all runs when maxCostPerRun is 0", async () => {
+    const { result, replyCallCount } = await runWithCostCap({ maxCostPerRun: 0 });
+    expect(result).toEqual({ status: "skipped", reason: "cost-cap-exceeded" });
+    expect(replyCallCount).toBe(0);
+  });
+
+  it("ignores negative maxCostPerRun (no cap)", async () => {
+    const { result, replyCallCount } = await runWithCostCap({ maxCostPerRun: -1 });
+    expect(result).toEqual(expect.objectContaining({ status: "ran" }));
+    expect(replyCallCount).toBe(1);
+  });
+
+  it("ignores NaN maxCostPerRun (no cap)", async () => {
+    const { result, replyCallCount } = await runWithCostCap({ maxCostPerRun: NaN });
+    expect(result).toEqual(expect.objectContaining({ status: "ran" }));
+    expect(replyCallCount).toBe(1);
+  });
+
+  it("ignores Infinity maxCostPerRun (no cap)", async () => {
+    const { result, replyCallCount } = await runWithCostCap({ maxCostPerRun: Infinity });
+    expect(result).toEqual(expect.objectContaining({ status: "ran" }));
+    expect(replyCallCount).toBe(1);
+  });
+});
diff --git a/src/infra/heartbeat-runner.ts b/src/infra/heartbeat-runner.ts
index 34b3a7b5f86..0a28c923502 100644
--- a/src/infra/heartbeat-runner.ts
+++ b/src/infra/heartbeat-runner.ts
@@ -713,6 +713,31 @@ export async function runHeartbeatOnce(opts: {
           bootstrapContextMode,
         }
       : { isHeartbeat: true, suppressToolErrorWarnings, bootstrapContextMode };
+
+    // Pre-call cost cap: estimate this run's input cost (approximate: chars / 4
+    // tokens x model input price) and skip before calling the model when it
+    // exceeds maxCostPerRun. Negative/non-finite caps are ignored (no cap).
+    const maxCostPerRun = heartbeat?.maxCostPerRun;
+    if (typeof maxCostPerRun === "number" && Number.isFinite(maxCostPerRun) && maxCostPerRun >= 0) {
+      const estimatedCost = estimateRunCost(
+        ctx.Body,
+        heartbeatModelOverride ?? resolveDefaultModelId(cfg),
+      );
+      if (estimatedCost > maxCostPerRun) {
+        log.warn("heartbeat: skipping run, estimated cost exceeds maxCostPerRun", {
+          estimatedCost: estimatedCost.toFixed(6),
+          maxCostPerRun,
+          model: heartbeatModelOverride ?? resolveDefaultModelId(cfg),
+        });
+        emitHeartbeatEvent({
+          status: "skipped",
+          reason: "cost-cap-exceeded",
+          durationMs: Date.now() - startedAt,
+        });
+        return { status: "skipped", reason: "cost-cap-exceeded" };
+      }
+    }
+
     const replyResult = await getReplyFromConfig(ctx, replyOpts, cfg);
     const replyPayload = resolveHeartbeatReplyPayload(replyResult);
     const includeReasoning = heartbeat?.includeReasoning === true;
@@ -1180,3 +1205,77 @@ export function startHeartbeatRunner(opts: {
 
   return { stop: cleanup, updateConfig };
 }
+
+// ---------------------------------------------------------------------------
+// Cost estimation for maxCostPerRun
+// ---------------------------------------------------------------------------
+
+/** USD price per input token, keyed by lower-case model-id prefix. Conservative estimates. */
+const MODEL_INPUT_PRICING: Record<string, number> = {
+  // Anthropic
+  "claude-opus-4": 15 / 1_000_000,
+  "claude-sonnet-4": 3 / 1_000_000,
+  "claude-haiku": 0.25 / 1_000_000,
+  // OpenAI
+  "gpt-4o": 2.5 / 1_000_000,
+  "gpt-4-turbo": 10 / 1_000_000,
+  "gpt-4": 30 / 1_000_000,
+  "gpt-3.5": 0.5 / 1_000_000,
+  "o1-mini": 3 / 1_000_000,
+  "o1": 15 / 1_000_000,
+  "o3-mini": 1.1 / 1_000_000,
+  "o3": 10 / 1_000_000,
+  // Google
+  "gemini-1.5-pro": 3.5 / 1_000_000,
+  "gemini-2.0-flash": 0.1 / 1_000_000,
+};
+
+/** Conservative fallback: assumes expensive model if unknown. */
+const FALLBACK_PRICE_PER_TOKEN = 15 / 1_000_000;
+
+/**
+ * Sorted prefixes (longest first) to guarantee that "gpt-4o" matches
+ * before "gpt-4" and "gpt-4-turbo" matches before "gpt-4".
+ */
+const SORTED_PRICING_ENTRIES = Object.entries(MODEL_INPUT_PRICING).sort(
+  ([a], [b]) => b.length - a.length,
+);
+
+/**
+ * Match a model id against the pricing table. Tries longest-prefix-first
+ * matching so "claude-opus-4-20260901" matches "claude-opus-4".
+ */
+function resolveInputPricePerToken(modelId: string): number {
+  const lower = modelId.toLowerCase();
+  for (const [prefix, price] of SORTED_PRICING_ENTRIES) {
+    if (lower.startsWith(prefix)) {
+      return price;
+    }
+  }
+  return FALLBACK_PRICE_PER_TOKEN;
+}
+
+/** Approximate token count as ceil(chars / 4); an empty string yields 0 tokens. */
+function estimateTokenCount(text: string): number {
+  return Math.ceil(text.length / 4);
+}
+
+/** Estimate input cost (USD) for a single run. */
+export function estimateRunCost(promptBody: string, modelId: string): number {
+  return estimateTokenCount(promptBody) * resolveInputPricePerToken(modelId);
+}
+
+/** Resolve the default model id from config. */
+function resolveDefaultModelId(cfg: OpenClawConfig): string {
+  const primary = cfg.agents?.defaults?.model;
+  if (typeof primary === "string") {
+    return primary;
+  }
+  if (primary && typeof primary === "object" && "primary" in primary) {
+    const p = (primary as Record<string, unknown>).primary;
+    if (typeof p === "string") {
+      return p;
+    }
+  }
+  return "unknown";
+}

From 191989a97dfc105010cd07ec09c932c797039577 Mon Sep 17 00:00:00 2001
From: amabito <amabito@local>
Date: Wed, 18 Mar 2026 23:26:37 +0900
Subject: [PATCH 2/5] fix: apply oxfmt formatting

---
 src/infra/heartbeat-runner.cost-cap.test.ts | 5 +----
 src/infra/heartbeat-runner.ts               | 4 ++--
 2 files changed, 3 insertions(+), 6 deletions(-)

diff --git a/src/infra/heartbeat-runner.cost-cap.test.ts b/src/infra/heartbeat-runner.cost-cap.test.ts
index 2478660a7b8..3c8e2c6d650 100644
--- a/src/infra/heartbeat-runner.cost-cap.test.ts
+++ b/src/infra/heartbeat-runner.cost-cap.test.ts
@@ -119,10 +119,7 @@ afterEach(() => {
 });
 
 describe("runHeartbeatOnce – maxCostPerRun", () => {
-  async function runWithCostCap(params: {
-    maxCostPerRun?: number;
-    model?: string;
-  }) {
+  async function runWithCostCap(params: { maxCostPerRun?: number; model?: string }) {
     return withTempHeartbeatSandbox(
       async ({ tmpDir, storePath, replySpy }) => {
         const cfg: OpenClawConfig = {
diff --git a/src/infra/heartbeat-runner.ts b/src/infra/heartbeat-runner.ts
index 0a28c923502..b1c09ae4e4d 100644
--- a/src/infra/heartbeat-runner.ts
+++ b/src/infra/heartbeat-runner.ts
@@ -1222,9 +1222,9 @@ const MODEL_INPUT_PRICING: Record<string, number> = {
   "gpt-4": 30 / 1_000_000,
   "gpt-3.5": 0.5 / 1_000_000,
   "o1-mini": 3 / 1_000_000,
-  "o1": 15 / 1_000_000,
+  o1: 15 / 1_000_000,
   "o3-mini": 1.1 / 1_000_000,
-  "o3": 10 / 1_000_000,
+  o3: 10 / 1_000_000,
   // Google
   "gemini-1.5-pro": 3.5 / 1_000_000,
   "gemini-2.0-flash": 0.1 / 1_000_000,

From 81e294118ef87e81775ad2a6ff83c5d7912fd9e6 Mon Sep 17 00:00:00 2001
From: amabito <amabito@local>
Date: Thu, 19 Mar 2026 00:33:07 +0900
Subject: [PATCH 3/5] refactor(heartbeat): use config model catalog for cost
 estimation

Prefer resolveModelCostConfig() from the config model catalog over
the hardcoded pricing table. Falls back to the hardcoded table when
the model is not in the catalog. Also fixes provider-prefixed model
names (e.g. "openai/gpt-4o") falling through to the fallback price,
and accepts cost.input = 0 for free/local models.

Fixes #49823
Ref #3181
---
 src/infra/heartbeat-runner.cost-cap.test.ts | 133 ++++++++++++++++++++
 src/infra/heartbeat-runner.ts               |  36 ++++--
 2 files changed, 162 insertions(+), 7 deletions(-)

diff --git a/src/infra/heartbeat-runner.cost-cap.test.ts b/src/infra/heartbeat-runner.cost-cap.test.ts
index 3c8e2c6d650..e65b48fb11c 100644
--- a/src/infra/heartbeat-runner.cost-cap.test.ts
+++ b/src/infra/heartbeat-runner.cost-cap.test.ts
@@ -98,6 +98,126 @@ describe("prefix matching ordering", () => {
   });
 });
 
+describe("config catalog lookup", () => {
+  it("uses catalog pricing when model is defined in config", () => {
+    const cfg = {
+      models: {
+        providers: {
+          custom: {
+            models: [
+              {
+                id: "my-cheap-model",
+                cost: { input: 0.5, output: 1, cacheRead: 0, cacheWrite: 0 },
+              },
+            ],
+          },
+        },
+      },
+    } as unknown as import("../config/config.js").OpenClawConfig;
+    // 4000 chars = 1000 tokens. catalog says $0.50/M = $0.0005/1K
+    const cost = estimateRunCost("x".repeat(4000), "custom/my-cheap-model", cfg);
+    expect(cost).toBeCloseTo(0.0005, 5);
+  });
+
+  it("falls back to hardcoded table when model not in catalog", () => {
+    const cfg = {
+      models: { providers: {} },
+    } as unknown as import("../config/config.js").OpenClawConfig;
+    const cost = estimateRunCost("x".repeat(4000), "claude-opus-4", cfg);
+    // Should still use hardcoded table: $15/M = $0.015/1K
+    expect(cost).toBeCloseTo(0.015, 3);
+  });
+
+  it("falls back to hardcoded table when cfg is undefined", () => {
+    const cost = estimateRunCost("x".repeat(4000), "claude-opus-4");
+    expect(cost).toBeCloseTo(0.015, 3);
+  });
+
+  it("falls back to hardcoded table for bare model name without provider/", () => {
+    const cfg = {
+      models: {
+        providers: {
+          anthropic: {
+            models: [
+              {
+                id: "claude-opus-4",
+                cost: { input: 15, output: 75, cacheRead: 0, cacheWrite: 0 },
+              },
+            ],
+          },
+        },
+      },
+    } as unknown as import("../config/config.js").OpenClawConfig;
+    // Bare name "claude-opus-4" has no provider/ prefix, so parseModelRef
+    // returns provider="" which fails catalog lookup. Falls back to hardcoded.
+    const cost = estimateRunCost("x".repeat(4000), "claude-opus-4", cfg);
+    expect(cost).toBeCloseTo(0.015, 3);
+  });
+
+  it("uses zero cost.input from catalog for free models", () => {
+    const cfg = {
+      models: {
+        providers: {
+          custom: {
+            models: [
+              {
+                id: "free-model",
+                cost: { input: 0, output: 0, cacheRead: 0, cacheWrite: 0 },
+              },
+            ],
+          },
+        },
+      },
+    } as unknown as import("../config/config.js").OpenClawConfig;
+    const cost = estimateRunCost("x".repeat(4000), "custom/free-model", cfg);
+    expect(cost).toBe(0); // free model = $0
+  });
+
+  it("uses zero cost.input from catalog (free/local model)", () => {
+    const cfg = {
+      models: {
+        providers: {
+          local: {
+            models: [
+              {
+                id: "llama3",
+                cost: { input: 0, output: 0, cacheRead: 0, cacheWrite: 0 },
+              },
+            ],
+          },
+        },
+      },
+    } as unknown as import("../config/config.js").OpenClawConfig;
+    const cost = estimateRunCost("x".repeat(4000), "local/llama3", cfg);
+    expect(cost).toBe(0); // free model = $0
+  });
+
+  it("matches hardcoded table with provider-prefixed model name", () => {
+    // "openai/gpt-4o" should strip "openai/" and match "gpt-4o" in hardcoded table
+    const cost = estimateRunCost("x".repeat(4000), "openai/gpt-4o");
+    expect(cost).toBeCloseTo(0.0025, 4); // gpt-4o = $2.5/M
+  });
+
+  it("ignores catalog entry with negative cost.input", () => {
+    const cfg = {
+      models: {
+        providers: {
+          custom: {
+            models: [
+              {
+                id: "bad-model",
+                cost: { input: -5, output: 1, cacheRead: 0, cacheWrite: 0 },
+              },
+            ],
+          },
+        },
+      },
+    } as unknown as import("../config/config.js").OpenClawConfig;
+    const cost = estimateRunCost("x".repeat(4000), "custom/bad-model", cfg);
+    expect(cost).toBeCloseTo(0.015, 3); // fallback
+  });
+});
+
 // ---------------------------------------------------------------------------
 // Integration tests: runHeartbeatOnce with maxCostPerRun
 // ---------------------------------------------------------------------------
@@ -200,4 +320,17 @@ describe("runHeartbeatOnce – maxCostPerRun", () => {
     expect(result).toEqual(expect.objectContaining({ status: "ran" }));
     expect(replyCallCount).toBe(1);
   });
+
+  it("proceeds for free catalog model when maxCostPerRun is 0", async () => {
+    // Free model: estimated cost = $0. maxCostPerRun = 0. 0 > 0 = false, so run proceeds.
+    // This uses heartbeat.model override which goes through the hardcoded table,
+    // not the catalog. A truly free model via catalog would also return $0.
+    const { result, replyCallCount } = await runWithCostCap({
+      maxCostPerRun: 0,
+      model: "gemini-2.0-flash", // cheapest in table, but still > $0 for non-empty prompt
+    });
+    // gemini-2.0-flash with HEARTBEAT.md context will have cost > 0, so it gets skipped
+    expect(result).toEqual({ status: "skipped", reason: "cost-cap-exceeded" });
+    expect(replyCallCount).toBe(0);
+  });
 });
diff --git a/src/infra/heartbeat-runner.ts b/src/infra/heartbeat-runner.ts
index b1c09ae4e4d..6d2f2f0e0c8 100644
--- a/src/infra/heartbeat-runner.ts
+++ b/src/infra/heartbeat-runner.ts
@@ -7,6 +7,7 @@ import {
 } from "../agents/agent-scope.js";
 import { appendCronStyleCurrentTimeLine } from "../agents/current-time.js";
 import { resolveEffectiveMessagesConfig } from "../agents/identity.js";
+import { parseModelRef } from "../agents/model-selection.js";
 import { DEFAULT_HEARTBEAT_FILENAME } from "../agents/workspace.js";
 import { resolveHeartbeatReplyPayload } from "../auto-reply/heartbeat-reply-payload.js";
 import {
@@ -44,6 +45,7 @@ import {
 } from "../routing/session-key.js";
 import { defaultRuntime, type RuntimeEnv } from "../runtime.js";
 import { escapeRegExp } from "../utils.js";
+import { resolveModelCostConfig } from "../utils/usage-format.js";
 import { formatErrorMessage, hasErrnoCode } from "./errors.js";
 import { isWithinActiveHours } from "./heartbeat-active-hours.js";
 import {
@@ -722,6 +724,7 @@ export async function runHeartbeatOnce(opts: {
       const estimatedCost = estimateRunCost(
         ctx.Body,
         heartbeatModelOverride ?? resolveDefaultModelId(cfg),
+        cfg,
       );
       if (estimatedCost > maxCostPerRun) {
         log.warn("heartbeat: skipping run, estimated cost exceeds maxCostPerRun", {
@@ -1242,11 +1245,27 @@ const SORTED_PRICING_ENTRIES = Object.entries(MODEL_INPUT_PRICING).sort(
 );
 
 /**
- * Match a model id against the pricing table. Tries longest-prefix-first
- * matching so "claude-opus-4-20260901" matches "claude-opus-4".
+ * Try the config model catalog first (exact match via resolveModelCostConfig),
+ * then fall back to prefix matching against the hardcoded table.
  */
-function resolveInputPricePerToken(modelId: string): number {
-  const lower = modelId.toLowerCase();
+function resolveInputPricePerToken(modelId: string, cfg?: OpenClawConfig): number {
+  if (cfg) {
+    const ref = parseModelRef(modelId, "");
+    if (ref) {
+      const costConfig = resolveModelCostConfig({
+        provider: ref.provider,
+        model: ref.model,
+        config: cfg,
+      });
+      if (costConfig && Number.isFinite(costConfig.input) && costConfig.input >= 0) {
+        return costConfig.input / 1_000_000;
+      }
+    }
+  }
+  // Strip provider prefix (e.g. "openai/gpt-4o" -> "gpt-4o") for hardcoded table match.
+  const slash = modelId.indexOf("/");
+  const bareModel = slash !== -1 ? modelId.slice(slash + 1) : modelId;
+  const lower = bareModel.toLowerCase();
   for (const [prefix, price] of SORTED_PRICING_ENTRIES) {
     if (lower.startsWith(prefix)) {
       return price;
@@ -1260,9 +1279,12 @@ function estimateTokenCount(text: string): number {
   return Math.ceil(text.length / 4);
 }
 
-/** Estimate input cost (USD) for a single run. */
-export function estimateRunCost(promptBody: string, modelId: string): number {
-  return estimateTokenCount(promptBody) * resolveInputPricePerToken(modelId);
+/**
+ * Estimate input cost (USD) for a single run. Checks the config model
+ * catalog first, falls back to the hardcoded pricing table.
+ */
+export function estimateRunCost(promptBody: string, modelId: string, cfg?: OpenClawConfig): number {
+  return estimateTokenCount(promptBody) * resolveInputPricePerToken(modelId, cfg);
 }
 
 /** Resolve the default model id from config. */

From c2c261798d6ef5c0cb371d0848bba9688ea1476c Mon Sep 17 00:00:00 2001
From: amabito <amabito@local>
Date: Thu, 19 Mar 2026 00:39:23 +0900
Subject: [PATCH 4/5] fix(heartbeat): use lastIndexOf for nested provider
 prefixes

Handles model refs like "openrouter/anthropic/claude-opus-4" by
stripping all provider segments before matching the hardcoded pricing
table. Also adds a regression test for nested provider prefixes.

Fixes #49823
Ref #3181
---
 src/infra/heartbeat-runner.cost-cap.test.ts | 6 ++++++
 src/infra/heartbeat-runner.ts               | 5 +++--
 2 files changed, 9 insertions(+), 2 deletions(-)

diff --git a/src/infra/heartbeat-runner.cost-cap.test.ts b/src/infra/heartbeat-runner.cost-cap.test.ts
index e65b48fb11c..f91e7b7157b 100644
--- a/src/infra/heartbeat-runner.cost-cap.test.ts
+++ b/src/infra/heartbeat-runner.cost-cap.test.ts
@@ -198,6 +198,12 @@ describe("config catalog lookup", () => {
     expect(cost).toBeCloseTo(0.0025, 4); // gpt-4o = $2.5/M
   });
 
+  it("matches hardcoded table with nested provider prefix", () => {
+    // "openrouter/anthropic/claude-opus-4" should strip to "claude-opus-4"
+    const cost = estimateRunCost("x".repeat(4000), "openrouter/anthropic/claude-opus-4");
+    expect(cost).toBeCloseTo(0.015, 3); // claude-opus-4 = $15/M
+  });
+
   it("ignores catalog entry with negative cost.input", () => {
     const cfg = {
       models: {
diff --git a/src/infra/heartbeat-runner.ts b/src/infra/heartbeat-runner.ts
index 6d2f2f0e0c8..61aaa513178 100644
--- a/src/infra/heartbeat-runner.ts
+++ b/src/infra/heartbeat-runner.ts
@@ -1262,8 +1262,9 @@ function resolveInputPricePerToken(modelId: string, cfg?: OpenClawConfig): numbe
       }
     }
   }
-  // Strip provider prefix (e.g. "openai/gpt-4o" -> "gpt-4o") for hardcoded table match.
-  const slash = modelId.indexOf("/");
+  // Strip provider prefix (e.g. "openai/gpt-4o" or "openrouter/anthropic/claude-opus-4"
+  // -> "gpt-4o" / "claude-opus-4") for hardcoded table match.
+  const slash = modelId.lastIndexOf("/");
   const bareModel = slash !== -1 ? modelId.slice(slash + 1) : modelId;
   const lower = bareModel.toLowerCase();
   for (const [prefix, price] of SORTED_PRICING_ENTRIES) {

From bd8497f8dd9f73c6f67c7ec4af5d4dae9d1c318a Mon Sep 17 00:00:00 2001
From: "Keita A." <keita.a.0609@gmail.com>
Date: Thu, 19 Mar 2026 18:20:49 +0900
Subject: [PATCH 5/5] =?UTF-8?q?heartbeat-runner.cost-cap.test.ts=20?=
 =?UTF-8?q?=E3=82=92=E6=9B=B4=E6=96=B0?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Co-authored-by: greptile-apps[bot] <165735046+greptile-apps[bot]@users.noreply.github.com>
---
 src/infra/heartbeat-runner.cost-cap.test.ts | 9 +++++----
 1 file changed, 5 insertions(+), 4 deletions(-)

diff --git a/src/infra/heartbeat-runner.cost-cap.test.ts b/src/infra/heartbeat-runner.cost-cap.test.ts
index f91e7b7157b..53b74212fc8 100644
--- a/src/infra/heartbeat-runner.cost-cap.test.ts
+++ b/src/infra/heartbeat-runner.cost-cap.test.ts
@@ -327,10 +327,11 @@ describe("runHeartbeatOnce – maxCostPerRun", () => {
     expect(replyCallCount).toBe(1);
   });
 
-  it("proceeds for free catalog model when maxCostPerRun is 0", async () => {
-    // Free model: estimated cost = $0. maxCostPerRun = 0. 0 > 0 = false, so run proceeds.
-    // This uses heartbeat.model override which goes through the hardcoded table,
-    // not the catalog. A truly free model via catalog would also return $0.
+  it("skips cheap (non-free) model when maxCostPerRun is 0", async () => {
+    // gemini-2.0-flash costs $0.10/M input — non-zero — so with maxCostPerRun = 0
+    // the condition (estimatedCost > 0) is true and the run is skipped.
+    // Note: a *truly* free model (cost.input = 0 in catalog) would NOT be skipped
+    // because 0 > 0 === false. That scenario is covered by the unit tests above.
     const { result, replyCallCount } = await runWithCostCap({
       maxCostPerRun: 0,
       model: "gemini-2.0-flash", // cheapest in table, but still > $0 for non-empty prompt