914 lines
26 KiB
TypeScript
914 lines
26 KiB
TypeScript
import fs from "node:fs/promises";
|
|
import os from "node:os";
|
|
import path from "node:path";
|
|
import type { AgentMessage, AgentTool } from "@mariozechner/pi-agent-core";
|
|
import { SessionManager } from "@mariozechner/pi-coding-agent";
|
|
import { Type } from "@sinclair/typebox";
|
|
import { describe, expect, it, vi } from "vitest";
|
|
import type { ClawdbotConfig } from "../config/config.js";
|
|
import { resolveSessionAgentIds } from "./agent-scope.js";
|
|
import {
|
|
applyGoogleTurnOrderingFix,
|
|
buildEmbeddedSandboxInfo,
|
|
createSystemPromptOverride,
|
|
getDmHistoryLimitFromSessionKey,
|
|
limitHistoryTurns,
|
|
runEmbeddedPiAgent,
|
|
splitSdkTools,
|
|
} from "./pi-embedded-runner.js";
|
|
import type { SandboxContext } from "./sandbox.js";
|
|
|
|
vi.mock("@mariozechner/pi-ai", async () => {
|
|
const actual = await vi.importActual<typeof import("@mariozechner/pi-ai")>(
|
|
"@mariozechner/pi-ai",
|
|
);
|
|
return {
|
|
...actual,
|
|
streamSimple: (model: { api: string; provider: string; id: string }) => {
|
|
if (model.id === "mock-error") {
|
|
throw new Error("boom");
|
|
}
|
|
const stream = new actual.AssistantMessageEventStream();
|
|
queueMicrotask(() => {
|
|
stream.push({
|
|
type: "done",
|
|
reason: "stop",
|
|
message: {
|
|
role: "assistant",
|
|
content: [{ type: "text", text: "ok" }],
|
|
stopReason: "stop",
|
|
api: model.api,
|
|
provider: model.provider,
|
|
model: model.id,
|
|
usage: {
|
|
input: 1,
|
|
output: 1,
|
|
cacheRead: 0,
|
|
cacheWrite: 0,
|
|
totalTokens: 2,
|
|
cost: {
|
|
input: 0,
|
|
output: 0,
|
|
cacheRead: 0,
|
|
cacheWrite: 0,
|
|
total: 0,
|
|
},
|
|
},
|
|
timestamp: Date.now(),
|
|
},
|
|
});
|
|
});
|
|
return stream;
|
|
},
|
|
};
|
|
});
|
|
|
|
const makeOpenAiConfig = (modelIds: string[]) =>
|
|
({
|
|
models: {
|
|
providers: {
|
|
openai: {
|
|
api: "openai-responses",
|
|
apiKey: "sk-test",
|
|
baseUrl: "https://example.com",
|
|
models: modelIds.map((id) => ({
|
|
id,
|
|
name: `Mock ${id}`,
|
|
reasoning: false,
|
|
input: ["text"],
|
|
cost: { input: 0, output: 0, cacheRead: 0, cacheWrite: 0 },
|
|
contextWindow: 16_000,
|
|
maxTokens: 2048,
|
|
})),
|
|
},
|
|
},
|
|
},
|
|
}) satisfies ClawdbotConfig;
|
|
|
|
const textFromContent = (content: unknown) => {
|
|
if (typeof content === "string") return content;
|
|
if (Array.isArray(content) && content[0]?.type === "text") {
|
|
return (content[0] as { text?: string }).text;
|
|
}
|
|
return undefined;
|
|
};
|
|
|
|
const readSessionMessages = async (sessionFile: string) => {
|
|
const raw = await fs.readFile(sessionFile, "utf-8");
|
|
return raw
|
|
.split(/\r?\n/)
|
|
.filter(Boolean)
|
|
.map(
|
|
(line) =>
|
|
JSON.parse(line) as {
|
|
type?: string;
|
|
message?: { role?: string; content?: unknown };
|
|
},
|
|
)
|
|
.filter((entry) => entry.type === "message")
|
|
.map((entry) => entry.message as { role?: string; content?: unknown });
|
|
};
|
|
|
|
describe("buildEmbeddedSandboxInfo", () => {
|
|
it("returns undefined when sandbox is missing", () => {
|
|
expect(buildEmbeddedSandboxInfo()).toBeUndefined();
|
|
});
|
|
|
|
it("maps sandbox context into prompt info", () => {
|
|
const sandbox = {
|
|
enabled: true,
|
|
sessionKey: "session:test",
|
|
workspaceDir: "/tmp/clawdbot-sandbox",
|
|
agentWorkspaceDir: "/tmp/clawdbot-workspace",
|
|
workspaceAccess: "none",
|
|
containerName: "clawdbot-sbx-test",
|
|
containerWorkdir: "/workspace",
|
|
docker: {
|
|
image: "clawdbot-sandbox:bookworm-slim",
|
|
containerPrefix: "clawdbot-sbx-",
|
|
workdir: "/workspace",
|
|
readOnlyRoot: true,
|
|
tmpfs: ["/tmp"],
|
|
network: "none",
|
|
user: "1000:1000",
|
|
capDrop: ["ALL"],
|
|
env: { LANG: "C.UTF-8" },
|
|
},
|
|
tools: {
|
|
allow: ["exec"],
|
|
deny: ["browser"],
|
|
},
|
|
browserAllowHostControl: true,
|
|
browser: {
|
|
controlUrl: "http://localhost:9222",
|
|
noVncUrl: "http://localhost:6080",
|
|
containerName: "clawdbot-sbx-browser-test",
|
|
},
|
|
} satisfies SandboxContext;
|
|
|
|
expect(buildEmbeddedSandboxInfo(sandbox)).toEqual({
|
|
enabled: true,
|
|
workspaceDir: "/tmp/clawdbot-sandbox",
|
|
workspaceAccess: "none",
|
|
agentWorkspaceMount: undefined,
|
|
browserControlUrl: "http://localhost:9222",
|
|
browserNoVncUrl: "http://localhost:6080",
|
|
hostBrowserAllowed: true,
|
|
});
|
|
});
|
|
|
|
it("includes elevated info when allowed", () => {
|
|
const sandbox = {
|
|
enabled: true,
|
|
sessionKey: "session:test",
|
|
workspaceDir: "/tmp/clawdbot-sandbox",
|
|
agentWorkspaceDir: "/tmp/clawdbot-workspace",
|
|
workspaceAccess: "none",
|
|
containerName: "clawdbot-sbx-test",
|
|
containerWorkdir: "/workspace",
|
|
docker: {
|
|
image: "clawdbot-sandbox:bookworm-slim",
|
|
containerPrefix: "clawdbot-sbx-",
|
|
workdir: "/workspace",
|
|
readOnlyRoot: true,
|
|
tmpfs: ["/tmp"],
|
|
network: "none",
|
|
user: "1000:1000",
|
|
capDrop: ["ALL"],
|
|
env: { LANG: "C.UTF-8" },
|
|
},
|
|
tools: {
|
|
allow: ["exec"],
|
|
deny: ["browser"],
|
|
},
|
|
browserAllowHostControl: false,
|
|
} satisfies SandboxContext;
|
|
|
|
expect(
|
|
buildEmbeddedSandboxInfo(sandbox, {
|
|
enabled: true,
|
|
allowed: true,
|
|
defaultLevel: "on",
|
|
}),
|
|
).toEqual({
|
|
enabled: true,
|
|
workspaceDir: "/tmp/clawdbot-sandbox",
|
|
workspaceAccess: "none",
|
|
agentWorkspaceMount: undefined,
|
|
hostBrowserAllowed: false,
|
|
elevated: { allowed: true, defaultLevel: "on" },
|
|
});
|
|
});
|
|
});
|
|
|
|
describe("resolveSessionAgentIds", () => {
|
|
const cfg = {
|
|
agents: {
|
|
list: [{ id: "main" }, { id: "beta", default: true }],
|
|
},
|
|
} as ClawdbotConfig;
|
|
|
|
it("falls back to the configured default when sessionKey is missing", () => {
|
|
const { defaultAgentId, sessionAgentId } = resolveSessionAgentIds({
|
|
config: cfg,
|
|
});
|
|
expect(defaultAgentId).toBe("beta");
|
|
expect(sessionAgentId).toBe("beta");
|
|
});
|
|
|
|
it("falls back to the configured default when sessionKey is non-agent", () => {
|
|
const { sessionAgentId } = resolveSessionAgentIds({
|
|
sessionKey: "telegram:slash:123",
|
|
config: cfg,
|
|
});
|
|
expect(sessionAgentId).toBe("beta");
|
|
});
|
|
|
|
it("falls back to the configured default for global sessions", () => {
|
|
const { sessionAgentId } = resolveSessionAgentIds({
|
|
sessionKey: "global",
|
|
config: cfg,
|
|
});
|
|
expect(sessionAgentId).toBe("beta");
|
|
});
|
|
|
|
it("keeps the agent id for provider-qualified agent sessions", () => {
|
|
const { sessionAgentId } = resolveSessionAgentIds({
|
|
sessionKey: "agent:beta:slack:channel:C1",
|
|
config: cfg,
|
|
});
|
|
expect(sessionAgentId).toBe("beta");
|
|
});
|
|
|
|
it("uses the agent id from agent session keys", () => {
|
|
const { sessionAgentId } = resolveSessionAgentIds({
|
|
sessionKey: "agent:main:main",
|
|
config: cfg,
|
|
});
|
|
expect(sessionAgentId).toBe("main");
|
|
});
|
|
});
|
|
|
|
function createStubTool(name: string): AgentTool {
|
|
return {
|
|
name,
|
|
label: name,
|
|
description: "",
|
|
parameters: Type.Object({}),
|
|
execute: async () => ({ content: [], details: {} }),
|
|
};
|
|
}
|
|
|
|
describe("splitSdkTools", () => {
|
|
const tools = [
|
|
createStubTool("read"),
|
|
createStubTool("exec"),
|
|
createStubTool("edit"),
|
|
createStubTool("write"),
|
|
createStubTool("browser"),
|
|
];
|
|
|
|
it("routes all tools to customTools when sandboxed", () => {
|
|
const { builtInTools, customTools } = splitSdkTools({
|
|
tools,
|
|
sandboxEnabled: true,
|
|
});
|
|
expect(builtInTools).toEqual([]);
|
|
expect(customTools.map((tool) => tool.name)).toEqual([
|
|
"read",
|
|
"exec",
|
|
"edit",
|
|
"write",
|
|
"browser",
|
|
]);
|
|
});
|
|
|
|
it("routes all tools to customTools even when not sandboxed", () => {
|
|
const { builtInTools, customTools } = splitSdkTools({
|
|
tools,
|
|
sandboxEnabled: false,
|
|
});
|
|
expect(builtInTools).toEqual([]);
|
|
expect(customTools.map((tool) => tool.name)).toEqual([
|
|
"read",
|
|
"exec",
|
|
"edit",
|
|
"write",
|
|
"browser",
|
|
]);
|
|
});
|
|
});
|
|
|
|
describe("createSystemPromptOverride", () => {
|
|
it("returns the override prompt regardless of default prompt", () => {
|
|
const override = createSystemPromptOverride("OVERRIDE");
|
|
expect(override("DEFAULT")).toBe("OVERRIDE");
|
|
});
|
|
|
|
it("returns an empty string for blank overrides", () => {
|
|
const override = createSystemPromptOverride(" \n ");
|
|
expect(override("DEFAULT")).toBe("");
|
|
});
|
|
});
|
|
|
|
describe("applyGoogleTurnOrderingFix", () => {
|
|
const makeAssistantFirst = () =>
|
|
[
|
|
{
|
|
role: "assistant",
|
|
content: [
|
|
{ type: "toolCall", id: "call_1", name: "exec", arguments: {} },
|
|
],
|
|
},
|
|
] satisfies AgentMessage[];
|
|
|
|
it("prepends a bootstrap once and records a marker for Google models", () => {
|
|
const sessionManager = SessionManager.inMemory();
|
|
const warn = vi.fn();
|
|
const input = makeAssistantFirst();
|
|
const first = applyGoogleTurnOrderingFix({
|
|
messages: input,
|
|
modelApi: "google-generative-ai",
|
|
sessionManager,
|
|
sessionId: "session:1",
|
|
warn,
|
|
});
|
|
expect(first.messages[0]?.role).toBe("user");
|
|
expect(first.messages[1]?.role).toBe("assistant");
|
|
expect(warn).toHaveBeenCalledTimes(1);
|
|
expect(
|
|
sessionManager
|
|
.getEntries()
|
|
.some(
|
|
(entry) =>
|
|
entry.type === "custom" &&
|
|
entry.customType === "google-turn-ordering-bootstrap",
|
|
),
|
|
).toBe(true);
|
|
|
|
applyGoogleTurnOrderingFix({
|
|
messages: input,
|
|
modelApi: "google-generative-ai",
|
|
sessionManager,
|
|
sessionId: "session:1",
|
|
warn,
|
|
});
|
|
expect(warn).toHaveBeenCalledTimes(1);
|
|
});
|
|
|
|
it("skips non-Google models", () => {
|
|
const sessionManager = SessionManager.inMemory();
|
|
const warn = vi.fn();
|
|
const input = makeAssistantFirst();
|
|
const result = applyGoogleTurnOrderingFix({
|
|
messages: input,
|
|
modelApi: "openai",
|
|
sessionManager,
|
|
sessionId: "session:2",
|
|
warn,
|
|
});
|
|
expect(result.messages).toBe(input);
|
|
expect(warn).not.toHaveBeenCalled();
|
|
});
|
|
});
|
|
|
|
describe("limitHistoryTurns", () => {
|
|
const makeMessages = (roles: ("user" | "assistant")[]): AgentMessage[] =>
|
|
roles.map((role, i) => ({
|
|
role,
|
|
content: [{ type: "text", text: `message ${i}` }],
|
|
}));
|
|
|
|
it("returns all messages when limit is undefined", () => {
|
|
const messages = makeMessages(["user", "assistant", "user", "assistant"]);
|
|
expect(limitHistoryTurns(messages, undefined)).toBe(messages);
|
|
});
|
|
|
|
it("returns all messages when limit is 0", () => {
|
|
const messages = makeMessages(["user", "assistant", "user", "assistant"]);
|
|
expect(limitHistoryTurns(messages, 0)).toBe(messages);
|
|
});
|
|
|
|
it("returns all messages when limit is negative", () => {
|
|
const messages = makeMessages(["user", "assistant", "user", "assistant"]);
|
|
expect(limitHistoryTurns(messages, -1)).toBe(messages);
|
|
});
|
|
|
|
it("returns empty array when messages is empty", () => {
|
|
expect(limitHistoryTurns([], 5)).toEqual([]);
|
|
});
|
|
|
|
it("keeps all messages when fewer user turns than limit", () => {
|
|
const messages = makeMessages(["user", "assistant", "user", "assistant"]);
|
|
expect(limitHistoryTurns(messages, 10)).toBe(messages);
|
|
});
|
|
|
|
it("limits to last N user turns", () => {
|
|
const messages = makeMessages([
|
|
"user",
|
|
"assistant",
|
|
"user",
|
|
"assistant",
|
|
"user",
|
|
"assistant",
|
|
]);
|
|
const limited = limitHistoryTurns(messages, 2);
|
|
expect(limited.length).toBe(4);
|
|
expect(limited[0].content).toEqual([{ type: "text", text: "message 2" }]);
|
|
});
|
|
|
|
it("handles single user turn limit", () => {
|
|
const messages = makeMessages([
|
|
"user",
|
|
"assistant",
|
|
"user",
|
|
"assistant",
|
|
"user",
|
|
"assistant",
|
|
]);
|
|
const limited = limitHistoryTurns(messages, 1);
|
|
expect(limited.length).toBe(2);
|
|
expect(limited[0].content).toEqual([{ type: "text", text: "message 4" }]);
|
|
expect(limited[1].content).toEqual([{ type: "text", text: "message 5" }]);
|
|
});
|
|
|
|
it("handles messages with multiple assistant responses per user turn", () => {
|
|
const messages = makeMessages([
|
|
"user",
|
|
"assistant",
|
|
"assistant",
|
|
"user",
|
|
"assistant",
|
|
]);
|
|
const limited = limitHistoryTurns(messages, 1);
|
|
expect(limited.length).toBe(2);
|
|
expect(limited[0].role).toBe("user");
|
|
expect(limited[1].role).toBe("assistant");
|
|
});
|
|
|
|
it("preserves message content integrity", () => {
|
|
const messages: AgentMessage[] = [
|
|
{ role: "user", content: [{ type: "text", text: "first" }] },
|
|
{
|
|
role: "assistant",
|
|
content: [{ type: "toolCall", id: "1", name: "exec", arguments: {} }],
|
|
},
|
|
{ role: "user", content: [{ type: "text", text: "second" }] },
|
|
{ role: "assistant", content: [{ type: "text", text: "response" }] },
|
|
];
|
|
const limited = limitHistoryTurns(messages, 1);
|
|
expect(limited[0].content).toEqual([{ type: "text", text: "second" }]);
|
|
expect(limited[1].content).toEqual([{ type: "text", text: "response" }]);
|
|
});
|
|
});
|
|
|
|
describe("getDmHistoryLimitFromSessionKey", () => {
|
|
it("returns undefined when sessionKey is undefined", () => {
|
|
expect(getDmHistoryLimitFromSessionKey(undefined, {})).toBeUndefined();
|
|
});
|
|
|
|
it("returns undefined when config is undefined", () => {
|
|
expect(
|
|
getDmHistoryLimitFromSessionKey("telegram:dm:123", undefined),
|
|
).toBeUndefined();
|
|
});
|
|
|
|
it("returns dmHistoryLimit for telegram provider", () => {
|
|
const config = { telegram: { dmHistoryLimit: 15 } } as ClawdbotConfig;
|
|
expect(getDmHistoryLimitFromSessionKey("telegram:dm:123", config)).toBe(15);
|
|
});
|
|
|
|
it("returns dmHistoryLimit for whatsapp provider", () => {
|
|
const config = { whatsapp: { dmHistoryLimit: 20 } } as ClawdbotConfig;
|
|
expect(getDmHistoryLimitFromSessionKey("whatsapp:dm:123", config)).toBe(20);
|
|
});
|
|
|
|
it("returns dmHistoryLimit for agent-prefixed session keys", () => {
|
|
const config = { telegram: { dmHistoryLimit: 10 } } as ClawdbotConfig;
|
|
expect(
|
|
getDmHistoryLimitFromSessionKey("agent:main:telegram:dm:123", config),
|
|
).toBe(10);
|
|
});
|
|
|
|
it("returns undefined for non-dm session kinds", () => {
|
|
const config = {
|
|
slack: { dmHistoryLimit: 10 },
|
|
telegram: { dmHistoryLimit: 15 },
|
|
} as ClawdbotConfig;
|
|
expect(
|
|
getDmHistoryLimitFromSessionKey("agent:beta:slack:channel:C1", config),
|
|
).toBeUndefined();
|
|
expect(
|
|
getDmHistoryLimitFromSessionKey("telegram:slash:123", config),
|
|
).toBeUndefined();
|
|
});
|
|
|
|
it("returns undefined for unknown provider", () => {
|
|
const config = { telegram: { dmHistoryLimit: 15 } } as ClawdbotConfig;
|
|
expect(
|
|
getDmHistoryLimitFromSessionKey("unknown:dm:123", config),
|
|
).toBeUndefined();
|
|
});
|
|
|
|
it("returns undefined when provider config has no dmHistoryLimit", () => {
|
|
const config = { telegram: {} } as ClawdbotConfig;
|
|
expect(
|
|
getDmHistoryLimitFromSessionKey("telegram:dm:123", config),
|
|
).toBeUndefined();
|
|
});
|
|
|
|
it("handles all supported providers", () => {
|
|
const providers = [
|
|
"telegram",
|
|
"whatsapp",
|
|
"discord",
|
|
"slack",
|
|
"signal",
|
|
"imessage",
|
|
"msteams",
|
|
] as const;
|
|
|
|
for (const provider of providers) {
|
|
const config = { [provider]: { dmHistoryLimit: 5 } } as ClawdbotConfig;
|
|
expect(
|
|
getDmHistoryLimitFromSessionKey(`${provider}:dm:123`, config),
|
|
).toBe(5);
|
|
}
|
|
});
|
|
|
|
it("handles per-DM overrides for all supported providers", () => {
|
|
const providers = [
|
|
"telegram",
|
|
"whatsapp",
|
|
"discord",
|
|
"slack",
|
|
"signal",
|
|
"imessage",
|
|
"msteams",
|
|
] as const;
|
|
|
|
for (const provider of providers) {
|
|
// Test per-DM override takes precedence
|
|
const configWithOverride = {
|
|
[provider]: {
|
|
dmHistoryLimit: 20,
|
|
dms: { user123: { historyLimit: 7 } },
|
|
},
|
|
} as ClawdbotConfig;
|
|
expect(
|
|
getDmHistoryLimitFromSessionKey(
|
|
`${provider}:dm:user123`,
|
|
configWithOverride,
|
|
),
|
|
).toBe(7);
|
|
|
|
// Test fallback to provider default when user not in dms
|
|
expect(
|
|
getDmHistoryLimitFromSessionKey(
|
|
`${provider}:dm:otheruser`,
|
|
configWithOverride,
|
|
),
|
|
).toBe(20);
|
|
|
|
// Test with agent-prefixed key
|
|
expect(
|
|
getDmHistoryLimitFromSessionKey(
|
|
`agent:main:${provider}:dm:user123`,
|
|
configWithOverride,
|
|
),
|
|
).toBe(7);
|
|
}
|
|
});
|
|
|
|
it("returns per-DM override when set", () => {
|
|
const config = {
|
|
telegram: {
|
|
dmHistoryLimit: 15,
|
|
dms: { "123": { historyLimit: 5 } },
|
|
},
|
|
} as ClawdbotConfig;
|
|
expect(getDmHistoryLimitFromSessionKey("telegram:dm:123", config)).toBe(5);
|
|
});
|
|
|
|
it("falls back to provider default when per-DM not set", () => {
|
|
const config = {
|
|
telegram: {
|
|
dmHistoryLimit: 15,
|
|
dms: { "456": { historyLimit: 5 } },
|
|
},
|
|
} as ClawdbotConfig;
|
|
expect(getDmHistoryLimitFromSessionKey("telegram:dm:123", config)).toBe(15);
|
|
});
|
|
|
|
it("returns per-DM override for agent-prefixed keys", () => {
|
|
const config = {
|
|
telegram: {
|
|
dmHistoryLimit: 20,
|
|
dms: { "789": { historyLimit: 3 } },
|
|
},
|
|
} as ClawdbotConfig;
|
|
expect(
|
|
getDmHistoryLimitFromSessionKey("agent:main:telegram:dm:789", config),
|
|
).toBe(3);
|
|
});
|
|
|
|
it("handles userId with colons (e.g., email)", () => {
|
|
const config = {
|
|
msteams: {
|
|
dmHistoryLimit: 10,
|
|
dms: { "user@example.com": { historyLimit: 7 } },
|
|
},
|
|
} as ClawdbotConfig;
|
|
expect(
|
|
getDmHistoryLimitFromSessionKey("msteams:dm:user@example.com", config),
|
|
).toBe(7);
|
|
});
|
|
|
|
it("returns undefined when per-DM historyLimit is not set", () => {
|
|
const config = {
|
|
telegram: {
|
|
dms: { "123": {} },
|
|
},
|
|
} as ClawdbotConfig;
|
|
expect(
|
|
getDmHistoryLimitFromSessionKey("telegram:dm:123", config),
|
|
).toBeUndefined();
|
|
});
|
|
|
|
it("returns 0 when per-DM historyLimit is explicitly 0 (unlimited)", () => {
|
|
const config = {
|
|
telegram: {
|
|
dmHistoryLimit: 15,
|
|
dms: { "123": { historyLimit: 0 } },
|
|
},
|
|
} as ClawdbotConfig;
|
|
expect(getDmHistoryLimitFromSessionKey("telegram:dm:123", config)).toBe(0);
|
|
});
|
|
});
|
|
|
|
describe("runEmbeddedPiAgent", () => {
|
|
it("writes models.json into the provided agentDir", async () => {
|
|
const agentDir = await fs.mkdtemp(
|
|
path.join(os.tmpdir(), "clawdbot-agent-"),
|
|
);
|
|
const workspaceDir = await fs.mkdtemp(
|
|
path.join(os.tmpdir(), "clawdbot-workspace-"),
|
|
);
|
|
const sessionFile = path.join(workspaceDir, "session.jsonl");
|
|
|
|
const cfg = {
|
|
models: {
|
|
providers: {
|
|
minimax: {
|
|
baseUrl: "https://api.minimax.io/anthropic",
|
|
api: "anthropic-messages",
|
|
apiKey: "sk-minimax-test",
|
|
models: [
|
|
{
|
|
id: "MiniMax-M2.1",
|
|
name: "MiniMax M2.1",
|
|
reasoning: false,
|
|
input: ["text"],
|
|
cost: { input: 0, output: 0, cacheRead: 0, cacheWrite: 0 },
|
|
contextWindow: 200000,
|
|
maxTokens: 8192,
|
|
},
|
|
],
|
|
},
|
|
},
|
|
},
|
|
} satisfies ClawdbotConfig;
|
|
|
|
await expect(
|
|
runEmbeddedPiAgent({
|
|
sessionId: "session:test",
|
|
sessionKey: "agent:dev:test",
|
|
sessionFile,
|
|
workspaceDir,
|
|
config: cfg,
|
|
prompt: "hi",
|
|
provider: "definitely-not-a-provider",
|
|
model: "definitely-not-a-model",
|
|
timeoutMs: 1,
|
|
agentDir,
|
|
}),
|
|
).rejects.toThrow(/Unknown model:/);
|
|
|
|
await expect(
|
|
fs.stat(path.join(agentDir, "models.json")),
|
|
).resolves.toBeTruthy();
|
|
});
|
|
|
|
it("persists the first user message before assistant output", async () => {
|
|
const agentDir = await fs.mkdtemp(
|
|
path.join(os.tmpdir(), "clawdbot-agent-"),
|
|
);
|
|
const workspaceDir = await fs.mkdtemp(
|
|
path.join(os.tmpdir(), "clawdbot-workspace-"),
|
|
);
|
|
const sessionFile = path.join(workspaceDir, "session.jsonl");
|
|
|
|
const cfg = makeOpenAiConfig(["mock-1"]);
|
|
|
|
await runEmbeddedPiAgent({
|
|
sessionId: "session:test",
|
|
sessionKey: "agent:main:main",
|
|
sessionFile,
|
|
workspaceDir,
|
|
config: cfg,
|
|
prompt: "hello",
|
|
provider: "openai",
|
|
model: "mock-1",
|
|
timeoutMs: 5_000,
|
|
agentDir,
|
|
});
|
|
|
|
const messages = await readSessionMessages(sessionFile);
|
|
const firstUserIndex = messages.findIndex(
|
|
(message) =>
|
|
message?.role === "user" &&
|
|
textFromContent(message.content) === "hello",
|
|
);
|
|
const firstAssistantIndex = messages.findIndex(
|
|
(message) => message?.role === "assistant",
|
|
);
|
|
expect(firstUserIndex).toBeGreaterThanOrEqual(0);
|
|
if (firstAssistantIndex !== -1) {
|
|
expect(firstUserIndex).toBeLessThan(firstAssistantIndex);
|
|
}
|
|
});
|
|
|
|
it("persists the user message when prompt fails before assistant output", async () => {
|
|
const agentDir = await fs.mkdtemp(
|
|
path.join(os.tmpdir(), "clawdbot-agent-"),
|
|
);
|
|
const workspaceDir = await fs.mkdtemp(
|
|
path.join(os.tmpdir(), "clawdbot-workspace-"),
|
|
);
|
|
const sessionFile = path.join(workspaceDir, "session.jsonl");
|
|
|
|
const cfg = makeOpenAiConfig(["mock-error"]);
|
|
|
|
const result = await runEmbeddedPiAgent({
|
|
sessionId: "session:test",
|
|
sessionKey: "agent:main:main",
|
|
sessionFile,
|
|
workspaceDir,
|
|
config: cfg,
|
|
prompt: "boom",
|
|
provider: "openai",
|
|
model: "mock-error",
|
|
timeoutMs: 5_000,
|
|
agentDir,
|
|
});
|
|
expect(result.payloads[0]?.isError).toBe(true);
|
|
|
|
const messages = await readSessionMessages(sessionFile);
|
|
const userIndex = messages.findIndex(
|
|
(message) =>
|
|
message?.role === "user" && textFromContent(message.content) === "boom",
|
|
);
|
|
expect(userIndex).toBeGreaterThanOrEqual(0);
|
|
});
|
|
|
|
it("appends new user + assistant after existing transcript entries", async () => {
|
|
const agentDir = await fs.mkdtemp(
|
|
path.join(os.tmpdir(), "clawdbot-agent-"),
|
|
);
|
|
const workspaceDir = await fs.mkdtemp(
|
|
path.join(os.tmpdir(), "clawdbot-workspace-"),
|
|
);
|
|
const sessionFile = path.join(workspaceDir, "session.jsonl");
|
|
|
|
const sessionManager = SessionManager.open(sessionFile);
|
|
sessionManager.appendMessage({
|
|
role: "user",
|
|
content: [{ type: "text", text: "seed user" }],
|
|
});
|
|
sessionManager.appendMessage({
|
|
role: "assistant",
|
|
content: [{ type: "text", text: "seed assistant" }],
|
|
stopReason: "stop",
|
|
api: "openai-responses",
|
|
provider: "openai",
|
|
model: "mock-1",
|
|
usage: {
|
|
input: 1,
|
|
output: 1,
|
|
cacheRead: 0,
|
|
cacheWrite: 0,
|
|
totalTokens: 2,
|
|
cost: {
|
|
input: 0,
|
|
output: 0,
|
|
cacheRead: 0,
|
|
cacheWrite: 0,
|
|
total: 0,
|
|
},
|
|
},
|
|
timestamp: Date.now(),
|
|
});
|
|
|
|
const cfg = makeOpenAiConfig(["mock-1"]);
|
|
|
|
await runEmbeddedPiAgent({
|
|
sessionId: "session:test",
|
|
sessionKey: "agent:main:main",
|
|
sessionFile,
|
|
workspaceDir,
|
|
config: cfg,
|
|
prompt: "hello",
|
|
provider: "openai",
|
|
model: "mock-1",
|
|
timeoutMs: 5_000,
|
|
agentDir,
|
|
});
|
|
|
|
const messages = await readSessionMessages(sessionFile);
|
|
const seedUserIndex = messages.findIndex(
|
|
(message) =>
|
|
message?.role === "user" &&
|
|
textFromContent(message.content) === "seed user",
|
|
);
|
|
const seedAssistantIndex = messages.findIndex(
|
|
(message) =>
|
|
message?.role === "assistant" &&
|
|
textFromContent(message.content) === "seed assistant",
|
|
);
|
|
const newUserIndex = messages.findIndex(
|
|
(message) =>
|
|
message?.role === "user" &&
|
|
textFromContent(message.content) === "hello",
|
|
);
|
|
const newAssistantIndex = messages.findIndex(
|
|
(message, index) => index > newUserIndex && message?.role === "assistant",
|
|
);
|
|
expect(seedUserIndex).toBeGreaterThanOrEqual(0);
|
|
expect(seedAssistantIndex).toBeGreaterThan(seedUserIndex);
|
|
expect(newUserIndex).toBeGreaterThan(seedAssistantIndex);
|
|
expect(newAssistantIndex).toBeGreaterThan(newUserIndex);
|
|
});
|
|
|
|
it("persists multi-turn user/assistant ordering across runs", async () => {
|
|
const agentDir = await fs.mkdtemp(
|
|
path.join(os.tmpdir(), "clawdbot-agent-"),
|
|
);
|
|
const workspaceDir = await fs.mkdtemp(
|
|
path.join(os.tmpdir(), "clawdbot-workspace-"),
|
|
);
|
|
const sessionFile = path.join(workspaceDir, "session.jsonl");
|
|
|
|
const cfg = makeOpenAiConfig(["mock-1"]);
|
|
|
|
await runEmbeddedPiAgent({
|
|
sessionId: "session:test",
|
|
sessionKey: "agent:main:main",
|
|
sessionFile,
|
|
workspaceDir,
|
|
config: cfg,
|
|
prompt: "first",
|
|
provider: "openai",
|
|
model: "mock-1",
|
|
timeoutMs: 5_000,
|
|
agentDir,
|
|
});
|
|
|
|
await runEmbeddedPiAgent({
|
|
sessionId: "session:test",
|
|
sessionKey: "agent:main:main",
|
|
sessionFile,
|
|
workspaceDir,
|
|
config: cfg,
|
|
prompt: "second",
|
|
provider: "openai",
|
|
model: "mock-1",
|
|
timeoutMs: 5_000,
|
|
agentDir,
|
|
});
|
|
|
|
const messages = await readSessionMessages(sessionFile);
|
|
const firstUserIndex = messages.findIndex(
|
|
(message) =>
|
|
message?.role === "user" &&
|
|
textFromContent(message.content) === "first",
|
|
);
|
|
const firstAssistantIndex = messages.findIndex(
|
|
(message, index) =>
|
|
index > firstUserIndex && message?.role === "assistant",
|
|
);
|
|
const secondUserIndex = messages.findIndex(
|
|
(message) =>
|
|
message?.role === "user" &&
|
|
textFromContent(message.content) === "second",
|
|
);
|
|
const secondAssistantIndex = messages.findIndex(
|
|
(message, index) =>
|
|
index > secondUserIndex && message?.role === "assistant",
|
|
);
|
|
expect(firstUserIndex).toBeGreaterThanOrEqual(0);
|
|
expect(firstAssistantIndex).toBeGreaterThan(firstUserIndex);
|
|
expect(secondUserIndex).toBeGreaterThan(firstAssistantIndex);
|
|
expect(secondAssistantIndex).toBeGreaterThan(secondUserIndex);
|
|
});
|
|
});
|