mirror of
https://github.com/moltbot/moltbot.git
synced 2026-03-21 16:41:56 +00:00
288 lines
8.6 KiB
TypeScript
288 lines
8.6 KiB
TypeScript
import type { AgentMessage } from "@mariozechner/pi-agent-core";
|
|
import { beforeEach, describe, expect, it, vi } from "vitest";
|
|
import * as helpers from "./pi-embedded-helpers.js";
|
|
import {
|
|
expectGoogleModelApiFullSanitizeCall,
|
|
loadSanitizeSessionHistoryWithCleanMocks,
|
|
makeMockSessionManager,
|
|
makeInMemorySessionManager,
|
|
makeModelSnapshotEntry,
|
|
makeReasoningAssistantMessages,
|
|
makeSimpleUserMessages,
|
|
makeSnapshotChangedOpenAIReasoningScenario,
|
|
type SanitizeSessionHistoryFn,
|
|
sanitizeWithOpenAIResponses,
|
|
TEST_SESSION_ID,
|
|
} from "./pi-embedded-runner.sanitize-session-history.test-harness.js";
|
|
|
|
let sanitizeSessionHistory: SanitizeSessionHistoryFn;
|
|
|
|
// Mock dependencies
|
|
vi.mock("./pi-embedded-helpers.js", async () => {
|
|
const actual = await vi.importActual("./pi-embedded-helpers.js");
|
|
return {
|
|
...actual,
|
|
isGoogleModelApi: vi.fn(),
|
|
sanitizeSessionMessagesImages: vi.fn().mockImplementation(async (msgs) => msgs),
|
|
};
|
|
});
|
|
|
|
// We don't mock session-transcript-repair.js as it is a pure function and complicates mocking.
|
|
// We rely on the real implementation which should pass through our simple messages.
|
|
|
|
describe("sanitizeSessionHistory", () => {
|
|
const mockSessionManager = makeMockSessionManager();
|
|
const mockMessages = makeSimpleUserMessages();
|
|
|
|
beforeEach(async () => {
|
|
sanitizeSessionHistory = await loadSanitizeSessionHistoryWithCleanMocks();
|
|
});
|
|
|
|
it("sanitizes tool call ids for Google model APIs", async () => {
|
|
await expectGoogleModelApiFullSanitizeCall({
|
|
sanitizeSessionHistory,
|
|
messages: mockMessages,
|
|
sessionManager: mockSessionManager,
|
|
});
|
|
});
|
|
|
|
it("sanitizes tool call ids with strict9 for Mistral models", async () => {
|
|
vi.mocked(helpers.isGoogleModelApi).mockReturnValue(false);
|
|
|
|
await sanitizeSessionHistory({
|
|
messages: mockMessages,
|
|
modelApi: "openai-responses",
|
|
provider: "openrouter",
|
|
modelId: "mistralai/devstral-2512:free",
|
|
sessionManager: mockSessionManager,
|
|
sessionId: TEST_SESSION_ID,
|
|
});
|
|
|
|
expect(helpers.sanitizeSessionMessagesImages).toHaveBeenCalledWith(
|
|
mockMessages,
|
|
"session:history",
|
|
expect.objectContaining({
|
|
sanitizeMode: "full",
|
|
sanitizeToolCallIds: true,
|
|
toolCallIdMode: "strict9",
|
|
}),
|
|
);
|
|
});
|
|
|
|
it("sanitizes tool call ids for Anthropic APIs", async () => {
|
|
vi.mocked(helpers.isGoogleModelApi).mockReturnValue(false);
|
|
|
|
await sanitizeSessionHistory({
|
|
messages: mockMessages,
|
|
modelApi: "anthropic-messages",
|
|
provider: "anthropic",
|
|
sessionManager: mockSessionManager,
|
|
sessionId: TEST_SESSION_ID,
|
|
});
|
|
|
|
expect(helpers.sanitizeSessionMessagesImages).toHaveBeenCalledWith(
|
|
mockMessages,
|
|
"session:history",
|
|
expect.objectContaining({ sanitizeMode: "full", sanitizeToolCallIds: true }),
|
|
);
|
|
});
|
|
|
|
it("does not sanitize tool call ids for openai-responses", async () => {
|
|
vi.mocked(helpers.isGoogleModelApi).mockReturnValue(false);
|
|
|
|
await sanitizeWithOpenAIResponses({
|
|
sanitizeSessionHistory,
|
|
messages: mockMessages,
|
|
sessionManager: mockSessionManager,
|
|
});
|
|
|
|
expect(helpers.sanitizeSessionMessagesImages).toHaveBeenCalledWith(
|
|
mockMessages,
|
|
"session:history",
|
|
expect.objectContaining({ sanitizeMode: "images-only", sanitizeToolCallIds: false }),
|
|
);
|
|
});
|
|
|
|
it("annotates inter-session user messages before context sanitization", async () => {
|
|
vi.mocked(helpers.isGoogleModelApi).mockReturnValue(false);
|
|
|
|
const messages: AgentMessage[] = [
|
|
{
|
|
role: "user",
|
|
content: "forwarded instruction",
|
|
provenance: {
|
|
kind: "inter_session",
|
|
sourceSessionKey: "agent:main:req",
|
|
sourceTool: "sessions_send",
|
|
},
|
|
} as unknown as AgentMessage,
|
|
];
|
|
|
|
const result = await sanitizeSessionHistory({
|
|
messages,
|
|
modelApi: "openai-responses",
|
|
provider: "openai",
|
|
sessionManager: mockSessionManager,
|
|
sessionId: TEST_SESSION_ID,
|
|
});
|
|
|
|
const first = result[0] as Extract<AgentMessage, { role: "user" }>;
|
|
expect(first.role).toBe("user");
|
|
expect(typeof first.content).toBe("string");
|
|
expect(first.content as string).toContain("[Inter-session message]");
|
|
expect(first.content as string).toContain("sourceSession=agent:main:req");
|
|
});
|
|
|
|
it("keeps reasoning-only assistant messages for openai-responses", async () => {
|
|
vi.mocked(helpers.isGoogleModelApi).mockReturnValue(false);
|
|
|
|
const messages = [
|
|
{ role: "user", content: "hello" },
|
|
{
|
|
role: "assistant",
|
|
stopReason: "aborted",
|
|
content: [
|
|
{
|
|
type: "thinking",
|
|
thinking: "reasoning",
|
|
thinkingSignature: "sig",
|
|
},
|
|
],
|
|
},
|
|
] as unknown as AgentMessage[];
|
|
|
|
const result = await sanitizeSessionHistory({
|
|
messages,
|
|
modelApi: "openai-responses",
|
|
provider: "openai",
|
|
sessionManager: mockSessionManager,
|
|
sessionId: TEST_SESSION_ID,
|
|
});
|
|
|
|
expect(result).toHaveLength(2);
|
|
expect(result[1]?.role).toBe("assistant");
|
|
});
|
|
|
|
it("does not synthesize tool results for openai-responses", async () => {
|
|
const messages = [
|
|
{
|
|
role: "assistant",
|
|
content: [{ type: "toolCall", id: "call_1", name: "read", arguments: {} }],
|
|
},
|
|
] as unknown as AgentMessage[];
|
|
|
|
const result = await sanitizeSessionHistory({
|
|
messages,
|
|
modelApi: "openai-responses",
|
|
provider: "openai",
|
|
sessionManager: mockSessionManager,
|
|
sessionId: TEST_SESSION_ID,
|
|
});
|
|
|
|
expect(result).toHaveLength(1);
|
|
expect(result[0]?.role).toBe("assistant");
|
|
});
|
|
|
|
it("drops malformed tool calls missing input or arguments", async () => {
|
|
const messages = [
|
|
{
|
|
role: "assistant",
|
|
content: [{ type: "toolCall", id: "call_1", name: "read" }],
|
|
},
|
|
{ role: "user", content: "hello" },
|
|
] as unknown as AgentMessage[];
|
|
|
|
const result = await sanitizeSessionHistory({
|
|
messages,
|
|
modelApi: "openai-responses",
|
|
provider: "openai",
|
|
sessionManager: mockSessionManager,
|
|
sessionId: "test-session",
|
|
});
|
|
|
|
expect(result.map((msg) => msg.role)).toEqual(["user"]);
|
|
});
|
|
|
|
it("downgrades orphaned openai reasoning even when the model has not changed", async () => {
|
|
const sessionEntries = [
|
|
makeModelSnapshotEntry({
|
|
provider: "openai",
|
|
modelApi: "openai-responses",
|
|
modelId: "gpt-5.2-codex",
|
|
}),
|
|
];
|
|
const sessionManager = makeInMemorySessionManager(sessionEntries);
|
|
const messages = makeReasoningAssistantMessages({ thinkingSignature: "json" });
|
|
|
|
const result = await sanitizeWithOpenAIResponses({
|
|
sanitizeSessionHistory,
|
|
messages,
|
|
modelId: "gpt-5.2-codex",
|
|
sessionManager,
|
|
});
|
|
|
|
expect(result).toEqual([]);
|
|
});
|
|
|
|
it("downgrades orphaned openai reasoning when the model changes too", async () => {
|
|
const { sessionManager, messages, modelId } = makeSnapshotChangedOpenAIReasoningScenario();
|
|
|
|
const result = await sanitizeWithOpenAIResponses({
|
|
sanitizeSessionHistory,
|
|
messages,
|
|
modelId,
|
|
sessionManager,
|
|
});
|
|
|
|
expect(result).toEqual([]);
|
|
});
|
|
|
|
it("drops orphaned toolResult entries when switching from openai history to anthropic", async () => {
|
|
const sessionEntries = [
|
|
makeModelSnapshotEntry({
|
|
provider: "openai",
|
|
modelApi: "openai-responses",
|
|
modelId: "gpt-5.2",
|
|
}),
|
|
];
|
|
const sessionManager = makeInMemorySessionManager(sessionEntries);
|
|
const messages = [
|
|
{
|
|
role: "assistant",
|
|
content: [{ type: "toolCall", id: "tool_abc123", name: "read", arguments: {} }],
|
|
},
|
|
{
|
|
role: "toolResult",
|
|
toolCallId: "tool_abc123",
|
|
toolName: "read",
|
|
content: [{ type: "text", text: "ok" }],
|
|
} as unknown as AgentMessage,
|
|
{ role: "user", content: "continue" },
|
|
{
|
|
role: "toolResult",
|
|
toolCallId: "tool_01VihkDRptyLpX1ApUPe7ooU",
|
|
toolName: "read",
|
|
content: [{ type: "text", text: "stale result" }],
|
|
} as unknown as AgentMessage,
|
|
] as unknown as AgentMessage[];
|
|
|
|
const result = await sanitizeSessionHistory({
|
|
messages,
|
|
modelApi: "anthropic-messages",
|
|
provider: "anthropic",
|
|
modelId: "claude-opus-4-6",
|
|
sessionManager,
|
|
sessionId: TEST_SESSION_ID,
|
|
});
|
|
|
|
expect(result.map((msg) => msg.role)).toEqual(["assistant", "toolResult", "user"]);
|
|
expect(
|
|
result.some(
|
|
(msg) =>
|
|
msg.role === "toolResult" &&
|
|
(msg as { toolCallId?: string }).toolCallId === "tool_01VihkDRptyLpX1ApUPe7ooU",
|
|
),
|
|
).toBe(false);
|
|
});
|
|
});
|