openclaw/src/auto-reply/reply/get-reply-run.media-only.test.ts
Isis Anisoptera 432e0222dd
fix: restore auto-reply system events timeline (#34794) (thanks @anisoptera) (#34794)
Co-authored-by: Ayaan Zaidi <zaidi@uplause.io>
2026-03-05 07:56:14 +05:30

400 lines
13 KiB
TypeScript

import { beforeEach, describe, expect, it, vi } from "vitest";
import { runPreparedReply } from "./get-reply-run.js";
vi.mock("../../agents/auth-profiles/session-override.js", () => ({
resolveSessionAuthProfileOverride: vi.fn().mockResolvedValue(undefined),
}));
vi.mock("../../agents/pi-embedded.js", () => ({
abortEmbeddedPiRun: vi.fn().mockReturnValue(false),
isEmbeddedPiRunActive: vi.fn().mockReturnValue(false),
isEmbeddedPiRunStreaming: vi.fn().mockReturnValue(false),
resolveEmbeddedSessionLane: vi.fn().mockReturnValue("session:session-key"),
}));
vi.mock("../../config/sessions.js", () => ({
resolveGroupSessionKey: vi.fn().mockReturnValue(undefined),
resolveSessionFilePath: vi.fn().mockReturnValue("/tmp/session.jsonl"),
resolveSessionFilePathOptions: vi.fn().mockReturnValue({}),
updateSessionStore: vi.fn(),
}));
vi.mock("../../globals.js", () => ({
logVerbose: vi.fn(),
}));
vi.mock("../../process/command-queue.js", () => ({
clearCommandLane: vi.fn().mockReturnValue(0),
getQueueSize: vi.fn().mockReturnValue(0),
}));
vi.mock("../../routing/session-key.js", () => ({
normalizeMainKey: vi.fn().mockReturnValue("main"),
}));
vi.mock("../../utils/provider-utils.js", () => ({
isReasoningTagProvider: vi.fn().mockReturnValue(false),
}));
vi.mock("../command-detection.js", () => ({
hasControlCommand: vi.fn().mockReturnValue(false),
}));
vi.mock("./agent-runner.js", () => ({
runReplyAgent: vi.fn().mockResolvedValue({ text: "ok" }),
}));
vi.mock("./body.js", () => ({
applySessionHints: vi.fn().mockImplementation(async ({ baseBody }) => baseBody),
}));
vi.mock("./groups.js", () => ({
buildGroupIntro: vi.fn().mockReturnValue(""),
buildGroupChatContext: vi.fn().mockReturnValue(""),
}));
vi.mock("./inbound-meta.js", () => ({
buildInboundMetaSystemPrompt: vi.fn().mockReturnValue(""),
buildInboundUserContextPrefix: vi.fn().mockReturnValue(""),
}));
vi.mock("./queue.js", () => ({
resolveQueueSettings: vi.fn().mockReturnValue({ mode: "followup" }),
}));
vi.mock("./route-reply.js", () => ({
routeReply: vi.fn(),
}));
vi.mock("./session-updates.js", () => ({
ensureSkillSnapshot: vi.fn().mockImplementation(async ({ sessionEntry, systemSent }) => ({
sessionEntry,
systemSent,
skillsSnapshot: undefined,
})),
drainFormattedSystemEvents: vi.fn().mockResolvedValue(undefined),
}));
vi.mock("./typing-mode.js", () => ({
resolveTypingMode: vi.fn().mockReturnValue("off"),
}));
import { runReplyAgent } from "./agent-runner.js";
import { routeReply } from "./route-reply.js";
import { drainFormattedSystemEvents } from "./session-updates.js";
import { resolveTypingMode } from "./typing-mode.js";
function baseParams(
overrides: Partial<Parameters<typeof runPreparedReply>[0]> = {},
): Parameters<typeof runPreparedReply>[0] {
return {
ctx: {
Body: "",
RawBody: "",
CommandBody: "",
ThreadHistoryBody: "Earlier message in this thread",
OriginatingChannel: "slack",
OriginatingTo: "C123",
ChatType: "group",
},
sessionCtx: {
Body: "",
BodyStripped: "",
ThreadHistoryBody: "Earlier message in this thread",
MediaPath: "/tmp/input.png",
Provider: "slack",
ChatType: "group",
OriginatingChannel: "slack",
OriginatingTo: "C123",
},
cfg: { session: {}, channels: {}, agents: { defaults: {} } },
agentId: "default",
agentDir: "/tmp/agent",
agentCfg: {},
sessionCfg: {},
commandAuthorized: true,
command: {
isAuthorizedSender: true,
abortKey: "session-key",
ownerList: [],
senderIsOwner: false,
} as never,
commandSource: "",
allowTextCommands: true,
directives: {
hasThinkDirective: false,
thinkLevel: undefined,
} as never,
defaultActivation: "always",
resolvedThinkLevel: "high",
resolvedVerboseLevel: "off",
resolvedReasoningLevel: "off",
resolvedElevatedLevel: "off",
elevatedEnabled: false,
elevatedAllowed: false,
blockStreamingEnabled: false,
resolvedBlockStreamingBreak: "message_end",
modelState: {
resolveDefaultThinkingLevel: async () => "medium",
} as never,
provider: "anthropic",
model: "claude-opus-4-1",
typing: {
onReplyStart: vi.fn().mockResolvedValue(undefined),
cleanup: vi.fn(),
} as never,
defaultProvider: "anthropic",
defaultModel: "claude-opus-4-1",
timeoutMs: 30_000,
isNewSession: true,
resetTriggered: false,
systemSent: true,
sessionKey: "session-key",
workspaceDir: "/tmp/workspace",
abortedLastRun: false,
...overrides,
};
}
describe("runPreparedReply media-only handling", () => {
beforeEach(() => {
vi.clearAllMocks();
});
it("allows media-only prompts and preserves thread context in queued followups", async () => {
const result = await runPreparedReply(baseParams());
expect(result).toEqual({ text: "ok" });
const call = vi.mocked(runReplyAgent).mock.calls[0]?.[0];
expect(call).toBeTruthy();
expect(call?.followupRun.prompt).toContain("[Thread history - for context]");
expect(call?.followupRun.prompt).toContain("Earlier message in this thread");
expect(call?.followupRun.prompt).toContain("[User sent media without caption]");
});
it("keeps thread history context on follow-up turns", async () => {
const result = await runPreparedReply(
baseParams({
isNewSession: false,
}),
);
expect(result).toEqual({ text: "ok" });
const call = vi.mocked(runReplyAgent).mock.calls[0]?.[0];
expect(call).toBeTruthy();
expect(call?.followupRun.prompt).toContain("[Thread history - for context]");
expect(call?.followupRun.prompt).toContain("Earlier message in this thread");
});
it("returns the empty-body reply when there is no text and no media", async () => {
const result = await runPreparedReply(
baseParams({
ctx: {
Body: "",
RawBody: "",
CommandBody: "",
},
sessionCtx: {
Body: "",
BodyStripped: "",
Provider: "slack",
},
}),
);
expect(result).toEqual({
text: "I didn't receive any text in your message. Please resend or add a caption.",
});
expect(vi.mocked(runReplyAgent)).not.toHaveBeenCalled();
});
it("omits auth key labels from /new and /reset confirmation messages", async () => {
await runPreparedReply(
baseParams({
resetTriggered: true,
}),
);
const resetNoticeCall = vi.mocked(routeReply).mock.calls[0]?.[0] as
| { payload?: { text?: string } }
| undefined;
expect(resetNoticeCall?.payload?.text).toContain("✅ New session started · model:");
expect(resetNoticeCall?.payload?.text).not.toContain("🔑");
expect(resetNoticeCall?.payload?.text).not.toContain("api-key");
expect(resetNoticeCall?.payload?.text).not.toContain("env:");
});
it("skips reset notice when only webchat fallback routing is available", async () => {
await runPreparedReply(
baseParams({
resetTriggered: true,
ctx: {
Body: "",
RawBody: "",
CommandBody: "",
ThreadHistoryBody: "Earlier message in this thread",
OriginatingChannel: undefined,
OriginatingTo: undefined,
ChatType: "group",
},
command: {
isAuthorizedSender: true,
abortKey: "session-key",
ownerList: [],
senderIsOwner: false,
channel: "webchat",
from: undefined,
to: undefined,
} as never,
}),
);
expect(vi.mocked(routeReply)).not.toHaveBeenCalled();
});
it("uses inbound origin channel for run messageProvider", async () => {
await runPreparedReply(
baseParams({
ctx: {
Body: "",
RawBody: "",
CommandBody: "",
ThreadHistoryBody: "Earlier message in this thread",
OriginatingChannel: "webchat",
OriginatingTo: "session:abc",
ChatType: "group",
},
sessionCtx: {
Body: "",
BodyStripped: "",
ThreadHistoryBody: "Earlier message in this thread",
MediaPath: "/tmp/input.png",
Provider: "telegram",
ChatType: "group",
OriginatingChannel: "telegram",
OriginatingTo: "telegram:123",
},
}),
);
const call = vi.mocked(runReplyAgent).mock.calls[0]?.[0];
expect(call?.followupRun.run.messageProvider).toBe("webchat");
});
it("prefers Provider over Surface when origin channel is missing", async () => {
await runPreparedReply(
baseParams({
ctx: {
Body: "",
RawBody: "",
CommandBody: "",
ThreadHistoryBody: "Earlier message in this thread",
OriginatingChannel: undefined,
OriginatingTo: undefined,
Provider: "feishu",
Surface: "webchat",
ChatType: "group",
},
sessionCtx: {
Body: "",
BodyStripped: "",
ThreadHistoryBody: "Earlier message in this thread",
MediaPath: "/tmp/input.png",
Provider: "webchat",
ChatType: "group",
OriginatingChannel: undefined,
OriginatingTo: undefined,
},
}),
);
const call = vi.mocked(runReplyAgent).mock.calls[0]?.[0];
expect(call?.followupRun.run.messageProvider).toBe("feishu");
});
it("passes suppressTyping through typing mode resolution", async () => {
await runPreparedReply(
baseParams({
opts: {
suppressTyping: true,
},
}),
);
const call = vi.mocked(resolveTypingMode).mock.calls[0]?.[0] as
| { suppressTyping?: boolean }
| undefined;
expect(call?.suppressTyping).toBe(true);
});
it("routes queued system events into user prompt text, not system prompt context", async () => {
vi.mocked(drainFormattedSystemEvents).mockResolvedValueOnce("System: [t] Model switched.");
await runPreparedReply(baseParams());
const call = vi.mocked(runReplyAgent).mock.calls[0]?.[0];
expect(call).toBeTruthy();
expect(call?.commandBody).toContain("System: [t] Model switched.");
expect(call?.followupRun.run.extraSystemPrompt ?? "").not.toContain("Runtime System Events");
});
it("preserves first-token think hint when system events are prepended", async () => {
// drainFormattedSystemEvents returns just the events block; the caller prepends it.
// The hint must be extracted from the user body BEFORE prepending, so "System:"
// does not shadow the low|medium|high shorthand.
vi.mocked(drainFormattedSystemEvents).mockResolvedValueOnce("System: [t] Node connected.");
await runPreparedReply(
baseParams({
ctx: { Body: "low tell me about cats", RawBody: "low tell me about cats" },
sessionCtx: { Body: "low tell me about cats", BodyStripped: "low tell me about cats" },
resolvedThinkLevel: undefined,
}),
);
const call = vi.mocked(runReplyAgent).mock.calls[0]?.[0];
expect(call).toBeTruthy();
// Think hint extracted before events arrived — level must be "low", not the model default.
expect(call?.followupRun.run.thinkLevel).toBe("low");
// The stripped user text (no "low" token) must still appear after the event block.
expect(call?.commandBody).toContain("tell me about cats");
expect(call?.commandBody).not.toMatch(/^low\b/);
// System events are still present in the body.
expect(call?.commandBody).toContain("System: [t] Node connected.");
});
it("carries system events into followupRun.prompt for deferred turns", async () => {
// drainFormattedSystemEvents returns the events block; the caller prepends it to
// effectiveBaseBody for the queue path so deferred turns see events.
vi.mocked(drainFormattedSystemEvents).mockResolvedValueOnce("System: [t] Node connected.");
await runPreparedReply(baseParams());
const call = vi.mocked(runReplyAgent).mock.calls[0]?.[0];
expect(call).toBeTruthy();
expect(call?.followupRun.prompt).toContain("System: [t] Node connected.");
});
it("does not strip think-hint token from deferred queue body", async () => {
// In steer mode the inferred thinkLevel is never consumed, so the first token
// must not be stripped from the queue/steer body (followupRun.prompt).
vi.mocked(drainFormattedSystemEvents).mockResolvedValueOnce(undefined);
await runPreparedReply(
baseParams({
ctx: { Body: "low steer this conversation", RawBody: "low steer this conversation" },
sessionCtx: {
Body: "low steer this conversation",
BodyStripped: "low steer this conversation",
},
resolvedThinkLevel: undefined,
}),
);
const call = vi.mocked(runReplyAgent).mock.calls[0]?.[0];
expect(call).toBeTruthy();
// Queue body (used by steer mode) must keep the full original text.
expect(call?.followupRun.prompt).toContain("low steer this conversation");
});
});