perf(test): reduce hot-suite setup and duplicate test work

This commit is contained in:
Peter Steinberger
2026-02-13 23:30:35 +00:00
parent ab4a08a82a
commit e794ef0478
5 changed files with 65 additions and 239 deletions

View File

@@ -98,69 +98,7 @@ describe("block streaming", () => {
]); ]);
}); });
it("waits for block replies before returning final payloads", async () => { it("waits for block replies and preserves ordering when typing start is slow", async () => {
await withTempHome(async (home) => {
let releaseTyping: (() => void) | undefined;
const typingGate = new Promise<void>((resolve) => {
releaseTyping = resolve;
});
let resolveOnReplyStart: (() => void) | undefined;
const onReplyStartCalled = new Promise<void>((resolve) => {
resolveOnReplyStart = resolve;
});
const onReplyStart = vi.fn(() => {
resolveOnReplyStart?.();
return typingGate;
});
const onBlockReply = vi.fn().mockResolvedValue(undefined);
const impl = async (params: RunEmbeddedPiAgentParams) => {
void params.onBlockReply?.({ text: "hello" });
return {
payloads: [{ text: "hello" }],
meta: {
durationMs: 5,
agentMeta: { sessionId: "s", provider: "p", model: "m" },
},
};
};
piEmbeddedMock.runEmbeddedPiAgent.mockImplementation(impl);
const replyPromise = getReplyFromConfig(
{
Body: "ping",
From: "+1004",
To: "+2000",
MessageSid: "msg-123",
Provider: "discord",
},
{
onReplyStart,
onBlockReply,
disableBlockStreaming: false,
},
{
agents: {
defaults: {
model: "anthropic/claude-opus-4-5",
workspace: path.join(home, "openclaw"),
},
},
channels: { whatsapp: { allowFrom: ["*"] } },
session: { store: path.join(home, "sessions.json") },
},
);
await onReplyStartCalled;
releaseTyping?.();
const res = await replyPromise;
expect(res).toBeUndefined();
expect(onBlockReply).toHaveBeenCalledTimes(1);
});
});
it("preserves block reply ordering when typing start is slow", async () => {
await withTempHome(async (home) => { await withTempHome(async (home) => {
let releaseTyping: (() => void) | undefined; let releaseTyping: (() => void) | undefined;
const typingGate = new Promise<void>((resolve) => { const typingGate = new Promise<void>((resolve) => {
@@ -197,7 +135,7 @@ describe("block streaming", () => {
Body: "ping", Body: "ping",
From: "+1004", From: "+1004",
To: "+2000", To: "+2000",
MessageSid: "msg-125", MessageSid: "msg-123",
Provider: "telegram", Provider: "telegram",
}, },
{ {
@@ -309,7 +247,7 @@ describe("block streaming", () => {
}, },
{ {
onBlockReply, onBlockReply,
blockReplyTimeoutMs: 10, blockReplyTimeoutMs: 1,
disableBlockStreaming: false, disableBlockStreaming: false,
}, },
{ {

View File

@@ -140,31 +140,6 @@ describe("RawBody directive parsing", () => {
expectedIncludes: ["Thinking level set to high."], expectedIncludes: ["Thinking level set to high."],
}); });
await assertCommandReply({
message: {
Body: "[Context]\nJake: /model status\n[from: Jake]",
RawBody: "/model status",
From: "+1222",
To: "+1222",
ChatType: "group",
CommandAuthorized: true,
},
config: {
agents: {
defaults: {
model: "anthropic/claude-opus-4-5",
workspace: path.join(home, "openclaw-2"),
models: {
"anthropic/claude-opus-4-5": {},
},
},
},
channels: { whatsapp: { allowFrom: ["*"] } },
session: { store: path.join(home, "sessions-2.json") },
},
expectedIncludes: ["anthropic/claude-opus-4-5"],
});
await assertCommandReply({ await assertCommandReply({
message: { message: {
Body: "[Context]\nJake: /verbose on\n[from: Jake]", Body: "[Context]\nJake: /verbose on\n[from: Jake]",
@@ -178,11 +153,11 @@ describe("RawBody directive parsing", () => {
agents: { agents: {
defaults: { defaults: {
model: "anthropic/claude-opus-4-5", model: "anthropic/claude-opus-4-5",
workspace: path.join(home, "openclaw-3"), workspace: path.join(home, "openclaw-2"),
}, },
}, },
channels: { whatsapp: { allowFrom: ["*"] } }, channels: { whatsapp: { allowFrom: ["*"] } },
session: { store: path.join(home, "sessions-3.json") }, session: { store: path.join(home, "sessions-2.json") },
}, },
expectedIncludes: ["Verbose logging enabled."], expectedIncludes: ["Verbose logging enabled."],
}); });
@@ -204,11 +179,11 @@ describe("RawBody directive parsing", () => {
agents: { agents: {
defaults: { defaults: {
model: "anthropic/claude-opus-4-5", model: "anthropic/claude-opus-4-5",
workspace: path.join(home, "openclaw-4"), workspace: path.join(home, "openclaw-3"),
}, },
}, },
channels: { whatsapp: { allowFrom: ["+1222"] } }, channels: { whatsapp: { allowFrom: ["+1222"] } },
session: { store: path.join(home, "sessions-4.json") }, session: { store: path.join(home, "sessions-3.json") },
}, },
expectedIncludes: ["Session: agent:main:whatsapp:group:g1", "anthropic/claude-opus-4-5"], expectedIncludes: ["Session: agent:main:whatsapp:group:g1", "anthropic/claude-opus-4-5"],
}); });

View File

@@ -15,22 +15,22 @@ describe("waitForTransportReady", () => {
let attempts = 0; let attempts = 0;
const readyPromise = waitForTransportReady({ const readyPromise = waitForTransportReady({
label: "test transport", label: "test transport",
timeoutMs: 500, timeoutMs: 220,
logAfterMs: 120, logAfterMs: 60,
logIntervalMs: 100, logIntervalMs: 1_000,
pollIntervalMs: 80, pollIntervalMs: 50,
runtime, runtime,
check: async () => { check: async () => {
attempts += 1; attempts += 1;
if (attempts > 4) { if (attempts > 2) {
return { ok: true }; return { ok: true };
} }
return { ok: false, error: "not ready" }; return { ok: false, error: "not ready" };
}, },
}); });
for (let i = 0; i < 5; i += 1) { for (let i = 0; i < 3; i += 1) {
await vi.advanceTimersByTimeAsync(80); await vi.advanceTimersByTimeAsync(50);
} }
await readyPromise; await readyPromise;
@@ -41,14 +41,14 @@ describe("waitForTransportReady", () => {
const runtime = { log: vi.fn(), error: vi.fn(), exit: vi.fn() }; const runtime = { log: vi.fn(), error: vi.fn(), exit: vi.fn() };
const waitPromise = waitForTransportReady({ const waitPromise = waitForTransportReady({
label: "test transport", label: "test transport",
timeoutMs: 200, timeoutMs: 110,
logAfterMs: 0, logAfterMs: 0,
logIntervalMs: 100, logIntervalMs: 1_000,
pollIntervalMs: 50, pollIntervalMs: 50,
runtime, runtime,
check: async () => ({ ok: false, error: "still down" }), check: async () => ({ ok: false, error: "still down" }),
}); });
await vi.advanceTimersByTimeAsync(250); await vi.advanceTimersByTimeAsync(200);
await expect(waitPromise).rejects.toThrow("test transport not ready"); await expect(waitPromise).rejects.toThrow("test transport not ready");
expect(runtime.error).toHaveBeenCalled(); expect(runtime.error).toHaveBeenCalled();
}); });

View File

@@ -280,7 +280,7 @@ describe("memory index", () => {
expect(results[0]?.path).toContain("memory/2026-01-12.md"); expect(results[0]?.path).toContain("memory/2026-01-12.md");
}); });
it("hybrid weights can favor vector-only matches over keyword-only matches", async () => { it("hybrid weights shift ranking between vector and keyword matches", async () => {
const manyAlpha = Array.from({ length: 50 }, () => "Alpha").join(" "); const manyAlpha = Array.from({ length: 50 }, () => "Alpha").join(" ");
await fs.writeFile( await fs.writeFile(
path.join(workspaceDir, "memory", "vector-only.md"), path.join(workspaceDir, "memory", "vector-only.md"),
@@ -291,7 +291,7 @@ describe("memory index", () => {
`${manyAlpha} beta id123.`, `${manyAlpha} beta id123.`,
); );
const cfg = { const vectorWeightedCfg = {
agents: { agents: {
defaults: { defaults: {
workspace: workspaceDir, workspace: workspaceDir,
@@ -315,12 +315,15 @@ describe("memory index", () => {
list: [{ id: "main", default: true }], list: [{ id: "main", default: true }],
}, },
}; };
const result = await getMemorySearchManager({ cfg, agentId: "main" }); const vectorWeighted = await getMemorySearchManager({
expect(result.manager).not.toBeNull(); cfg: vectorWeightedCfg,
if (!result.manager) { agentId: "main",
});
expect(vectorWeighted.manager).not.toBeNull();
if (!vectorWeighted.manager) {
throw new Error("manager missing"); throw new Error("manager missing");
} }
manager = result.manager; manager = vectorWeighted.manager;
const status = manager.status(); const status = manager.status();
if (!status.fts?.available) { if (!status.fts?.available) {
@@ -328,28 +331,19 @@ describe("memory index", () => {
} }
await manager.sync({ force: true }); await manager.sync({ force: true });
const results = await manager.search("alpha beta id123"); const vectorResults = await manager.search("alpha beta id123");
expect(results.length).toBeGreaterThan(0); expect(vectorResults.length).toBeGreaterThan(0);
const paths = results.map((r) => r.path); const vectorPaths = vectorResults.map((r) => r.path);
expect(paths).toContain("memory/vector-only.md"); expect(vectorPaths).toContain("memory/vector-only.md");
expect(paths).toContain("memory/keyword-only.md"); expect(vectorPaths).toContain("memory/keyword-only.md");
const vectorOnly = results.find((r) => r.path === "memory/vector-only.md"); const vectorOnly = vectorResults.find((r) => r.path === "memory/vector-only.md");
const keywordOnly = results.find((r) => r.path === "memory/keyword-only.md"); const keywordOnly = vectorResults.find((r) => r.path === "memory/keyword-only.md");
expect((vectorOnly?.score ?? 0) > (keywordOnly?.score ?? 0)).toBe(true); expect((vectorOnly?.score ?? 0) > (keywordOnly?.score ?? 0)).toBe(true);
});
it("hybrid weights can favor keyword matches when text weight dominates", async () => { await manager.close();
const manyAlpha = Array.from({ length: 50 }, () => "Alpha").join(" "); manager = null;
await fs.writeFile(
path.join(workspaceDir, "memory", "vector-only.md"),
"Alpha beta. Alpha beta. Alpha beta. Alpha beta.",
);
await fs.writeFile(
path.join(workspaceDir, "memory", "keyword-only.md"),
`${manyAlpha} beta id123.`,
);
const cfg = { const textWeightedCfg = {
agents: { agents: {
defaults: { defaults: {
workspace: workspaceDir, workspace: workspaceDir,
@@ -357,7 +351,7 @@ describe("memory index", () => {
provider: "openai", provider: "openai",
model: "mock-embed", model: "mock-embed",
store: { path: indexPath, vector: { enabled: false } }, store: { path: indexPath, vector: { enabled: false } },
sync: { watch: false, onSessionStart: false, onSearch: true }, sync: { watch: false, onSessionStart: false, onSearch: false },
query: { query: {
minScore: 0, minScore: 0,
maxResults: 200, maxResults: 200,
@@ -373,27 +367,21 @@ describe("memory index", () => {
list: [{ id: "main", default: true }], list: [{ id: "main", default: true }],
}, },
}; };
const result = await getMemorySearchManager({ cfg, agentId: "main" });
expect(result.manager).not.toBeNull(); const textWeighted = await getMemorySearchManager({ cfg: textWeightedCfg, agentId: "main" });
if (!result.manager) { expect(textWeighted.manager).not.toBeNull();
if (!textWeighted.manager) {
throw new Error("manager missing"); throw new Error("manager missing");
} }
manager = result.manager; manager = textWeighted.manager;
const keywordResults = await manager.search("alpha beta id123");
const status = manager.status(); expect(keywordResults.length).toBeGreaterThan(0);
if (!status.fts?.available) { const keywordPaths = keywordResults.map((r) => r.path);
return; expect(keywordPaths).toContain("memory/vector-only.md");
} expect(keywordPaths).toContain("memory/keyword-only.md");
const vectorOnlyAfter = keywordResults.find((r) => r.path === "memory/vector-only.md");
await manager.sync({ force: true }); const keywordOnlyAfter = keywordResults.find((r) => r.path === "memory/keyword-only.md");
const results = await manager.search("alpha beta id123"); expect((keywordOnlyAfter?.score ?? 0) > (vectorOnlyAfter?.score ?? 0)).toBe(true);
expect(results.length).toBeGreaterThan(0);
const paths = results.map((r) => r.path);
expect(paths).toContain("memory/vector-only.md");
expect(paths).toContain("memory/keyword-only.md");
const vectorOnly = results.find((r) => r.path === "memory/vector-only.md");
const keywordOnly = results.find((r) => r.path === "memory/keyword-only.md");
expect((keywordOnly?.score ?? 0) > (vectorOnly?.score ?? 0)).toBe(true);
}); });
it("reports vector availability after probe", async () => { it("reports vector availability after probe", async () => {

View File

@@ -281,7 +281,7 @@ describe("memory indexing with OpenAI batches", () => {
expect(batchCreates).toBe(2); expect(batchCreates).toBe(2);
}); });
it("falls back to non-batch on failure and resets failures after success", async () => { it("tracks batch failures, resets on success, and disables after repeated failures", async () => {
const content = ["flaky", "batch"].join("\n\n"); const content = ["flaky", "batch"].join("\n\n");
await fs.writeFile(path.join(workspaceDir, "memory", "2026-01-09.md"), content); await fs.writeFile(path.join(workspaceDir, "memory", "2026-01-09.md"), content);
@@ -376,12 +376,14 @@ describe("memory indexing with OpenAI batches", () => {
} }
manager = result.manager; manager = result.manager;
// First failure: fallback to regular embeddings and increment failure count.
await manager.sync({ force: true }); await manager.sync({ force: true });
expect(embedBatch).toHaveBeenCalled(); expect(embedBatch).toHaveBeenCalled();
let status = manager.status(); let status = manager.status();
expect(status.batch?.enabled).toBe(true); expect(status.batch?.enabled).toBe(true);
expect(status.batch?.failures).toBe(1); expect(status.batch?.failures).toBe(1);
// Success should reset failure count.
embedBatch.mockClear(); embedBatch.mockClear();
mode = "ok"; mode = "ok";
await fs.writeFile( await fs.writeFile(
@@ -393,110 +395,33 @@ describe("memory indexing with OpenAI batches", () => {
expect(status.batch?.enabled).toBe(true); expect(status.batch?.enabled).toBe(true);
expect(status.batch?.failures).toBe(0); expect(status.batch?.failures).toBe(0);
expect(embedBatch).not.toHaveBeenCalled(); expect(embedBatch).not.toHaveBeenCalled();
});
it("disables batch after repeated failures and skips batch thereafter", async () => {
const content = ["repeat", "failures"].join("\n\n");
await fs.writeFile(path.join(workspaceDir, "memory", "2026-01-10.md"), content);
let uploadedRequests: Array<{ custom_id?: string }> = [];
const fetchMock = vi.fn(async (input: RequestInfo | URL, init?: RequestInit) => {
const url =
typeof input === "string" ? input : input instanceof URL ? input.toString() : input.url;
if (url.endsWith("/files")) {
const body = init?.body;
if (!(body instanceof FormData)) {
throw new Error("expected FormData upload");
}
for (const [key, value] of body.entries()) {
if (key !== "file") {
continue;
}
if (typeof value === "string") {
uploadedRequests = value
.split("\n")
.filter(Boolean)
.map((line) => JSON.parse(line) as { custom_id?: string });
} else {
const text = await value.text();
uploadedRequests = text
.split("\n")
.filter(Boolean)
.map((line) => JSON.parse(line) as { custom_id?: string });
}
}
return new Response(JSON.stringify({ id: "file_1" }), {
status: 200,
headers: { "Content-Type": "application/json" },
});
}
if (url.endsWith("/batches")) {
return new Response("batch failed", { status: 500 });
}
if (url.endsWith("/files/file_out/content")) {
const lines = uploadedRequests.map((request, index) =>
JSON.stringify({
custom_id: request.custom_id,
response: {
status_code: 200,
body: { data: [{ embedding: [index + 1, 0, 0], index: 0 }] },
},
}),
);
return new Response(lines.join("\n"), {
status: 200,
headers: { "Content-Type": "application/jsonl" },
});
}
throw new Error(`unexpected fetch ${url}`);
});
vi.stubGlobal("fetch", fetchMock);
const cfg = {
agents: {
defaults: {
workspace: workspaceDir,
memorySearch: {
provider: "openai",
model: "text-embedding-3-small",
store: { path: indexPath },
sync: { watch: false, onSessionStart: false, onSearch: false },
query: { minScore: 0 },
remote: { batch: { enabled: true, wait: true, pollIntervalMs: 1 } },
},
},
list: [{ id: "main", default: true }],
},
};
const result = await getMemorySearchManager({ cfg, agentId: "main" });
expect(result.manager).not.toBeNull();
if (!result.manager) {
throw new Error("manager missing");
}
manager = result.manager;
// Two more failures after reset should disable remote batching.
mode = "fail";
await fs.writeFile(
path.join(workspaceDir, "memory", "2026-01-09.md"),
["flaky", "batch", "fail-a"].join("\n\n"),
);
await manager.sync({ force: true }); await manager.sync({ force: true });
let status = manager.status(); status = manager.status();
expect(status.batch?.enabled).toBe(true); expect(status.batch?.enabled).toBe(true);
expect(status.batch?.failures).toBe(1); expect(status.batch?.failures).toBe(1);
embedBatch.mockClear();
await fs.writeFile( await fs.writeFile(
path.join(workspaceDir, "memory", "2026-01-10.md"), path.join(workspaceDir, "memory", "2026-01-09.md"),
["repeat", "failures", "again"].join("\n\n"), ["flaky", "batch", "fail-b"].join("\n\n"),
); );
await manager.sync({ force: true }); await manager.sync({ force: true });
status = manager.status(); status = manager.status();
expect(status.batch?.enabled).toBe(false); expect(status.batch?.enabled).toBe(false);
expect(status.batch?.failures).toBeGreaterThanOrEqual(2); expect(status.batch?.failures).toBeGreaterThanOrEqual(2);
// Once disabled, batch endpoints are skipped and fallback embeddings run directly.
const fetchCalls = fetchMock.mock.calls.length; const fetchCalls = fetchMock.mock.calls.length;
embedBatch.mockClear(); embedBatch.mockClear();
await fs.writeFile( await fs.writeFile(
path.join(workspaceDir, "memory", "2026-01-10.md"), path.join(workspaceDir, "memory", "2026-01-09.md"),
["repeat", "failures", "fallback"].join("\n\n"), ["flaky", "batch", "fallback"].join("\n\n"),
); );
await manager.sync({ force: true }); await manager.sync({ force: true });
expect(fetchMock.mock.calls.length).toBe(fetchCalls); expect(fetchMock.mock.calls.length).toBe(fetchCalls);