mirror of
https://github.com/langbot-app/LangBot.git
synced 2026-06-20 12:34:21 +00:00
3205 lines
121 KiB
TypeScript
3205 lines
121 KiB
TypeScript
import assert from "node:assert/strict";
|
|
import { test } from "node:test";
|
|
import { appendFileSync, existsSync, mkdtempSync, mkdirSync, readFileSync, rmSync, writeFileSync } from "node:fs";
|
|
import { spawnSync } from "node:child_process";
|
|
import { tmpdir } from "node:os";
|
|
import { join } from "node:path";
|
|
import type { CommandContext } from "../src/types.ts";
|
|
import { commandCaseList, commandCaseNew, commandCaseShow } from "../src/commands/case.ts";
|
|
import { commandEnvDoctor, commandEnvShow } from "../src/commands/env.ts";
|
|
import { commandFixtureCheck, commandFixtureList } from "../src/commands/fixture.ts";
|
|
import { commandLogGuard, commandLogScan, commandLogWatch } from "../src/commands/log.ts";
|
|
import { commandSuiteList, commandSuiteNew, commandSuitePlan, commandSuiteReport, commandSuiteRun, commandSuiteShow, commandSuiteStart } from "../src/commands/suite.ts";
|
|
import { commandTestPlan, commandTestRecommend, commandTestReport, commandTestResult, commandTestRun, commandTestStart } from "../src/commands/test.ts";
|
|
import { commandTroubleSearch } from "../src/commands/trouble.ts";
|
|
import { commandValidate } from "../src/commands/validate.ts";
|
|
import { commandIndex } from "../src/commands/skill.ts";
|
|
import { loadEnv } from "../src/fs.ts";
|
|
import { repoRoot } from "../src/cli.ts";
|
|
import {
|
|
classifyDebugChatResult,
|
|
findNewFailureSignal,
|
|
minExpectedOccurrences,
|
|
} from "../scripts/e2e/lib/debug-chat.mjs";
|
|
|
|
const root = process.cwd();
|
|
|
|
test("repo root detects the skills tree before generated bin exists", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-root-no-bin-"));
|
|
try {
|
|
mkdirSync(join(tmp, "schemas"), { recursive: true });
|
|
mkdirSync(join(tmp, "skills", "langbot-testing"), { recursive: true });
|
|
writeFileSync(join(tmp, "skills.index.json"), "{}");
|
|
writeFileSync(join(tmp, "schemas", "case.schema.json"), "{}");
|
|
assert.equal(repoRoot(join(tmp, "skills", "langbot-testing")), tmp);
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
function ctx(args: string[]): CommandContext {
|
|
return { root, args };
|
|
}
|
|
|
|
function capture(fn: () => number): { code: number; output: string } {
|
|
const originalLog = console.log;
|
|
const lines: string[] = [];
|
|
console.log = (...args: unknown[]) => {
|
|
lines.push(args.map(String).join(" "));
|
|
};
|
|
try {
|
|
const code = fn();
|
|
return { code, output: lines.join("\n") };
|
|
} finally {
|
|
console.log = originalLog;
|
|
}
|
|
}
|
|
|
|
function captureAll(fn: () => number): { code: number; output: string; error: string } {
|
|
const originalLog = console.log;
|
|
const originalWrite = process.stderr.write;
|
|
const lines: string[] = [];
|
|
const errors: string[] = [];
|
|
console.log = (...args: unknown[]) => {
|
|
lines.push(args.map(String).join(" "));
|
|
};
|
|
process.stderr.write = ((chunk: string | Uint8Array) => {
|
|
errors.push(String(chunk));
|
|
return true;
|
|
}) as typeof process.stderr.write;
|
|
try {
|
|
const code = fn();
|
|
return { code, output: lines.join("\n"), error: errors.join("") };
|
|
} finally {
|
|
console.log = originalLog;
|
|
process.stderr.write = originalWrite;
|
|
}
|
|
}
|
|
|
|
function suiteResult(caseId: string, runId: string, status = "pass", evidence = ["ui", "screenshot", "console", "backend_log"]): string {
|
|
return JSON.stringify({
|
|
source: "final",
|
|
case_id: caseId,
|
|
run_id: `${runId}-${caseId}`,
|
|
status,
|
|
reason: `${caseId} ${status}`,
|
|
started_at_local: "2026-05-21T10:30:00.000+08:00",
|
|
finished_at_local: "2026-05-21T10:31:00.000+08:00",
|
|
evidence_collected: evidence,
|
|
});
|
|
}
|
|
|
|
function withEnv<T>(values: Record<string, string>, fn: () => T): T {
|
|
const previous = new Map(Object.keys(values).map((key) => [key, process.env[key]]));
|
|
try {
|
|
for (const [key, value] of Object.entries(values)) process.env[key] = value;
|
|
return fn();
|
|
} finally {
|
|
for (const [key, value] of previous) {
|
|
if (value === undefined) delete process.env[key];
|
|
else process.env[key] = value;
|
|
}
|
|
}
|
|
}
|
|
|
|
async function captureAsync(fn: () => Promise<number>): Promise<{ code: number; output: string }> {
|
|
const originalLog = console.log;
|
|
const lines: string[] = [];
|
|
console.log = (...args: unknown[]) => {
|
|
lines.push(args.map(String).join(" "));
|
|
};
|
|
try {
|
|
const code = await fn();
|
|
return { code, output: lines.join("\n") };
|
|
} finally {
|
|
console.log = originalLog;
|
|
}
|
|
}
|
|
|
|
test("validate accepts the repository assets", () => {
|
|
const result = capture(() => commandValidate(root));
|
|
assert.equal(result.code, 0);
|
|
assert.match(result.output, /^OK/m);
|
|
});
|
|
|
|
test("validate allows blank shared env values but requires declared keys", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-validate-env-template-"));
|
|
try {
|
|
const schemasDir = join(tmp, "schemas");
|
|
const skillsDir = join(tmp, "skills");
|
|
const testingDir = join(skillsDir, "langbot-testing");
|
|
mkdirSync(schemasDir, { recursive: true });
|
|
mkdirSync(testingDir, { recursive: true });
|
|
for (const schemaName of ["case.schema.json", "suite.schema.json", "troubleshooting.schema.json", "skill-index.schema.json"]) {
|
|
writeFileSync(join(schemasDir, schemaName), "{}");
|
|
}
|
|
writeFileSync(join(testingDir, "SKILL.md"), "---\nname: langbot-testing\ndescription: Testing.\n---\n\n# Testing\n");
|
|
const envText = [
|
|
"LANGBOT_FRONTEND_URL=http://127.0.0.1:3000",
|
|
"LANGBOT_BACKEND_URL=http://127.0.0.1:5300",
|
|
"LANGBOT_DEV_FRONTEND_URL=http://127.0.0.1:3000",
|
|
"LANGBOT_REPO=",
|
|
"LANGBOT_WEB_REPO=",
|
|
"LANGBOT_BROWSER_PROFILE=",
|
|
"LANGBOT_CHROMIUM_EXECUTABLE=",
|
|
].join("\n");
|
|
writeFileSync(join(skillsDir, ".env"), envText);
|
|
writeFileSync(join(skillsDir, ".env.example"), envText);
|
|
|
|
const result = capture(() => commandValidate(tmp));
|
|
|
|
assert.equal(result.code, 0);
|
|
assert.match(result.output, /^OK/m);
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("index includes case summaries for agent discovery", () => {
|
|
const result = capture(() => commandIndex({ root, args: ["index"] }));
|
|
assert.equal(result.code, 0);
|
|
const index = JSON.parse(readFileSync(join(root, "skills.index.json"), "utf8"));
|
|
const testing = index.skills.find((skill: { name: string }) => skill.name === "langbot-testing");
|
|
assert.ok(testing);
|
|
assert.ok(testing.case_summaries.some((item: { id: string; priority: string; evidence_required: string[] }) => (
|
|
item.id === "pipeline-debug-chat" && item.priority === "p0" && item.evidence_required.includes("backend_log")
|
|
)));
|
|
assert.ok(testing.case_summaries.some((item: { id: string; setup_automation: string[]; setup_provides_env: string[] }) => (
|
|
item.id === "agent-runner-qa-debug-chat" &&
|
|
item.setup_automation.includes("case:agent-runner-live-install") &&
|
|
item.setup_provides_env.includes("LANGBOT_QA_AGENT_RUNNER_PIPELINE_URL")
|
|
)));
|
|
assert.ok(testing.suite_summaries.some((item: { id: string; cases: string[] }) => (
|
|
item.id === "core-smoke" && item.cases.includes("pipeline-debug-chat")
|
|
)));
|
|
assert.ok(testing.fixtures.some((item: { id: string; related_cases: string[] }) => (
|
|
item.id === "mcp-stdio-echo-server" && item.related_cases.includes("mcp-stdio-tool-call")
|
|
)));
|
|
});
|
|
|
|
test("index check detects stale index without writing", () => {
|
|
const path = join(root, "skills.index.json");
|
|
const current = capture(() => commandIndex({ root, args: ["index"] }));
|
|
assert.equal(current.code, 0);
|
|
|
|
const fresh = readFileSync(path, "utf8");
|
|
try {
|
|
const ok = capture(() => commandIndex({ root, args: ["index", "--check"] }));
|
|
assert.equal(ok.code, 0);
|
|
assert.match(ok.output, /^OK /);
|
|
|
|
writeFileSync(path, "{}\n");
|
|
const stale = captureAll(() => commandIndex({ root, args: ["index", "--check"] }));
|
|
assert.equal(stale.code, 1);
|
|
assert.match(stale.error, /index is stale/);
|
|
assert.equal(readFileSync(path, "utf8"), "{}\n");
|
|
} finally {
|
|
writeFileSync(path, fresh);
|
|
}
|
|
});
|
|
|
|
test("case list exposes seeded QA cases", () => {
|
|
const result = capture(() => commandCaseList(ctx(["case", "list"])));
|
|
assert.equal(result.code, 0);
|
|
assert.match(result.output, /pipeline-debug-chat/);
|
|
assert.match(result.output, /provider-deepseek/);
|
|
assert.match(result.output, /webui-login-state/);
|
|
});
|
|
|
|
test("case list JSON filters by reusable agent-selection metadata", () => {
|
|
const result = capture(() => commandCaseList(ctx([
|
|
"case",
|
|
"list",
|
|
"--json",
|
|
"--priority",
|
|
"p0",
|
|
"--automation",
|
|
])));
|
|
assert.equal(result.code, 0);
|
|
const rows = JSON.parse(result.output);
|
|
assert.ok(rows.length >= 2);
|
|
assert.ok(rows.every((row: { priority: string }) => row.priority === "p0"));
|
|
assert.ok(rows.every((row: { automation: string }) => row.automation));
|
|
assert.ok(rows.some((row: { id: string; evidence_required: string[]; readiness: string }) => (
|
|
row.id === "pipeline-debug-chat" && row.evidence_required.includes("backend_log") && row.readiness
|
|
)));
|
|
});
|
|
|
|
test("case list distinguishes machine readiness from manual precondition checks", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-case-manual-readiness-"));
|
|
try {
|
|
const skillDir = join(tmp, "skills", "langbot-testing");
|
|
mkdirSync(join(skillDir, "cases"), { recursive: true });
|
|
writeFileSync(
|
|
join(skillDir, "SKILL.md"),
|
|
"---\nname: langbot-testing\ndescription: Testing.\n---\n\n# Testing\n",
|
|
);
|
|
writeFileSync(join(tmp, "skills", ".env"), "LANGBOT_FRONTEND_URL=http://127.0.0.1:3000\n");
|
|
writeFileSync(
|
|
join(skillDir, "cases", "manual-case.yaml"),
|
|
[
|
|
"id: manual-case",
|
|
"title: Manual Case",
|
|
"mode: agent-browser",
|
|
"area: pipeline",
|
|
"type: smoke",
|
|
"priority: p2",
|
|
"risk: medium",
|
|
"ci_eligible: false",
|
|
"tags:",
|
|
" - smoke",
|
|
"skills:",
|
|
" - langbot-testing",
|
|
"env:",
|
|
" - LANGBOT_FRONTEND_URL",
|
|
"preconditions:",
|
|
" - Confirm the target pipeline is safe to modify.",
|
|
"steps:",
|
|
" - Open the page.",
|
|
"checks:",
|
|
" - UI: Page opens.",
|
|
"evidence_required:",
|
|
" - ui",
|
|
].join("\n"),
|
|
);
|
|
|
|
const machineReady = capture(() => commandCaseList({ root: tmp, args: ["case", "list", "--machine-ready"] }));
|
|
assert.equal(machineReady.code, 0);
|
|
assert.match(machineReady.output, /manual-case/);
|
|
assert.match(machineReady.output, /manual-check/);
|
|
|
|
const ready = capture(() => commandCaseList({ root: tmp, args: ["case", "list", "--ready"] }));
|
|
assert.equal(ready.code, 0);
|
|
assert.doesNotMatch(ready.output, /manual-case/);
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("case show prints structured agent-browser case", () => {
|
|
const result = capture(() => commandCaseShow(ctx(["case", "show", "pipeline-debug-chat"])));
|
|
assert.equal(result.code, 0);
|
|
assert.match(result.output, /^id: pipeline-debug-chat/m);
|
|
assert.match(result.output, /^mode: agent-browser/m);
|
|
assert.match(result.output, /^checks:/m);
|
|
});
|
|
|
|
test("case new writes required selection metadata", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-case-new-"));
|
|
try {
|
|
const skillDir = join(tmp, "skills", "langbot-testing");
|
|
mkdirSync(skillDir, { recursive: true });
|
|
writeFileSync(
|
|
join(skillDir, "SKILL.md"),
|
|
"---\nname: langbot-testing\ndescription: Testing.\n---\n\n# Testing\n",
|
|
);
|
|
|
|
const result = capture(() => commandCaseNew({
|
|
root: tmp,
|
|
args: ["case", "new", "new-case", "--title", "New Case"],
|
|
}));
|
|
|
|
assert.equal(result.code, 0);
|
|
const text = readFileSync(join(skillDir, "cases", "new-case.yaml"), "utf8");
|
|
assert.match(text, /^priority: p2/m);
|
|
assert.match(text, /^risk: medium/m);
|
|
assert.match(text, /^ci_eligible: false/m);
|
|
assert.match(text, /^evidence_required:/m);
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("suite list and plan expose reusable case groups", () => {
|
|
const list = capture(() => commandSuiteList(ctx(["suite", "list", "--json", "--priority", "p0"])));
|
|
assert.equal(list.code, 0);
|
|
const suites = JSON.parse(list.output);
|
|
assert.ok(suites.some((suite: { id: string; cases: string[] }) => (
|
|
suite.id === "core-smoke" && suite.cases.includes("webui-login-state")
|
|
)));
|
|
|
|
const plan = capture(() => commandSuitePlan(ctx(["suite", "plan", "core-smoke", "--json"])));
|
|
assert.equal(plan.code, 0);
|
|
const suitePlan = JSON.parse(plan.output);
|
|
assert.equal(suitePlan.id, "core-smoke");
|
|
assert.ok(suitePlan.cases.some((item: { id: string; evidence_required: string[] }) => (
|
|
item.id === "pipeline-debug-chat" && item.evidence_required.includes("backend_log")
|
|
)));
|
|
assert.ok(suitePlan.commands.some((item: { id: string; automation: string }) => (
|
|
item.id === "pipeline-debug-chat" && item.automation.includes("test run")
|
|
)));
|
|
|
|
const localAgent = capture(() => commandSuitePlan(ctx(["suite", "plan", "local-agent-gate", "--json"])));
|
|
assert.equal(localAgent.code, 0);
|
|
const localAgentPlan = JSON.parse(localAgent.output);
|
|
assert.ok(["ready", "missing", "manual_check"].includes(localAgentPlan.readiness.status));
|
|
const basic = localAgentPlan.cases.find((item: { id: string }) => item.id === "local-agent-basic-debug-chat");
|
|
assert.equal(basic.automation_readiness.pipeline_env_required, true);
|
|
});
|
|
|
|
test("suite show prints structured suite YAML", () => {
|
|
const result = capture(() => commandSuiteShow(ctx(["suite", "show", "local-agent-gate"])));
|
|
assert.equal(result.code, 0);
|
|
assert.match(result.output, /^id: local-agent-gate/m);
|
|
assert.match(result.output, /^cases:/m);
|
|
assert.match(result.output, /local-agent-effective-prompt-debug-chat/);
|
|
});
|
|
|
|
test("suite start creates a run handoff with per-case evidence commands", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-suite-start-"));
|
|
try {
|
|
const evidenceRoot = join(tmp, "evidence");
|
|
const result = capture(() => commandSuiteStart(ctx([
|
|
"suite",
|
|
"start",
|
|
"core-smoke",
|
|
"--run-id",
|
|
"core-smoke-local",
|
|
"--evidence-dir",
|
|
evidenceRoot,
|
|
"--json",
|
|
])));
|
|
assert.equal(result.code, 0);
|
|
const start = JSON.parse(result.output);
|
|
assert.equal(start.suite.id, "core-smoke");
|
|
assert.equal(start.run_id, "core-smoke-local");
|
|
assert.equal(start.evidence_root, evidenceRoot);
|
|
assert.equal(start.manifest_path, join(evidenceRoot, "suite-start.json"));
|
|
assert.equal(start.handoff_path, join(evidenceRoot, "suite-start.md"));
|
|
assert.match(start.report_command, /bin\/lbs suite report core-smoke/);
|
|
assert.ok(existsSync(join(evidenceRoot, "suite-start.json")));
|
|
assert.ok(existsSync(join(evidenceRoot, "suite-start.md")));
|
|
const pipeline = start.cases.find((item: { id: string }) => item.id === "pipeline-debug-chat");
|
|
assert.ok(pipeline);
|
|
assert.ok(existsSync(join(evidenceRoot, "pipeline-debug-chat")));
|
|
assert.match(pipeline.automation_command, /bin\/lbs test run pipeline-debug-chat/);
|
|
assert.match(pipeline.report_command, /--evidence-dir .+pipeline-debug-chat/);
|
|
assert.match(pipeline.result_command_template, /bin\/lbs test result pipeline-debug-chat/);
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("suite report aggregates case result JSON files", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-suite-report-"));
|
|
try {
|
|
const evidenceRoot = join(tmp, "suite-evidence");
|
|
const runId = "suite-report-run";
|
|
for (const [caseId, status] of [
|
|
["webui-login-state", "pass"],
|
|
["pipeline-debug-chat", "pass"],
|
|
["local-agent-basic-debug-chat", "env_issue"],
|
|
]) {
|
|
const dir = join(evidenceRoot, caseId);
|
|
mkdirSync(dir, { recursive: true });
|
|
writeFileSync(
|
|
join(dir, "result.json"),
|
|
suiteResult(caseId, runId, status),
|
|
);
|
|
}
|
|
|
|
const result = capture(() => commandSuiteReport(ctx([
|
|
"suite",
|
|
"report",
|
|
"core-smoke",
|
|
"--run-id",
|
|
runId,
|
|
"--evidence-dir",
|
|
evidenceRoot,
|
|
"--json",
|
|
])));
|
|
|
|
assert.equal(result.code, 0);
|
|
const report = JSON.parse(result.output);
|
|
assert.equal(report.status, "env_issue");
|
|
assert.equal(report.counts.pass, 2);
|
|
assert.equal(report.counts.env_issue, 1);
|
|
assert.ok(report.cases.some((item: { id: string; result: { status: string } }) => (
|
|
item.id === "local-agent-basic-debug-chat" && item.result.status === "env_issue"
|
|
)));
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("suite report treats pass without required evidence as incomplete", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-suite-report-evidence-"));
|
|
try {
|
|
const evidenceRoot = join(tmp, "suite-evidence");
|
|
const runId = "suite-report-evidence";
|
|
for (const caseId of ["webui-login-state", "pipeline-debug-chat", "local-agent-basic-debug-chat"]) {
|
|
const dir = join(evidenceRoot, caseId);
|
|
mkdirSync(dir, { recursive: true });
|
|
writeFileSync(
|
|
join(dir, "result.json"),
|
|
suiteResult(caseId, runId, "pass", ["ui"]),
|
|
);
|
|
}
|
|
|
|
const result = capture(() => commandSuiteReport(ctx([
|
|
"suite",
|
|
"report",
|
|
"core-smoke",
|
|
"--run-id",
|
|
runId,
|
|
"--evidence-dir",
|
|
evidenceRoot,
|
|
"--json",
|
|
])));
|
|
|
|
assert.equal(result.code, 0);
|
|
const report = JSON.parse(result.output);
|
|
assert.equal(report.status, "incomplete");
|
|
assert.ok(report.cases.some((item: { id: string; result: { evidence_missing: string[] } }) => (
|
|
item.id === "pipeline-debug-chat" && item.result.evidence_missing.includes("backend_log")
|
|
)));
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("suite report marks missing case evidence as incomplete", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-suite-report-missing-"));
|
|
try {
|
|
const evidenceRoot = join(tmp, "suite-evidence");
|
|
const runId = "suite-report-missing";
|
|
mkdirSync(join(evidenceRoot, "webui-login-state"), { recursive: true });
|
|
writeFileSync(join(evidenceRoot, "webui-login-state", "result.json"), suiteResult("webui-login-state", runId, "pass"));
|
|
|
|
const result = capture(() => commandSuiteReport(ctx([
|
|
"suite",
|
|
"report",
|
|
"core-smoke",
|
|
"--run-id",
|
|
runId,
|
|
"--evidence-dir",
|
|
evidenceRoot,
|
|
"--json",
|
|
])));
|
|
|
|
assert.equal(result.code, 0);
|
|
const report = JSON.parse(result.output);
|
|
assert.equal(report.status, "incomplete");
|
|
assert.ok(report.cases.some((item: { id: string; result: { status: string } }) => (
|
|
item.id === "pipeline-debug-chat" && item.result.status === "missing"
|
|
)));
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("suite report rejects result files from the wrong case or run", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-suite-report-mismatch-"));
|
|
try {
|
|
const evidenceRoot = join(tmp, "suite-evidence");
|
|
const runId = "suite-report-mismatch";
|
|
for (const caseId of ["webui-login-state", "pipeline-debug-chat", "local-agent-basic-debug-chat"]) {
|
|
const dir = join(evidenceRoot, caseId);
|
|
mkdirSync(dir, { recursive: true });
|
|
writeFileSync(join(dir, "result.json"), suiteResult(caseId, runId, "pass"));
|
|
}
|
|
writeFileSync(join(evidenceRoot, "pipeline-debug-chat", "result.json"), suiteResult("webui-login-state", runId, "pass"));
|
|
writeFileSync(join(evidenceRoot, "local-agent-basic-debug-chat", "result.json"), suiteResult("local-agent-basic-debug-chat", "old-run", "pass"));
|
|
|
|
const result = capture(() => commandSuiteReport(ctx([
|
|
"suite",
|
|
"report",
|
|
"core-smoke",
|
|
"--run-id",
|
|
runId,
|
|
"--evidence-dir",
|
|
evidenceRoot,
|
|
"--json",
|
|
])));
|
|
|
|
assert.equal(result.code, 0);
|
|
const report = JSON.parse(result.output);
|
|
assert.equal(report.status, "fail");
|
|
assert.ok(report.cases.some((item: { id: string; result: { status: string; reason: string } }) => (
|
|
item.id === "pipeline-debug-chat" && item.result.status === "invalid" && item.result.reason.includes("case_id mismatch")
|
|
)));
|
|
assert.ok(report.cases.some((item: { id: string; result: { status: string; reason: string } }) => (
|
|
item.id === "local-agent-basic-debug-chat" && item.result.status === "invalid" && item.result.reason.includes("run_id mismatch")
|
|
)));
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("suite run executes automated cases and aggregates a verdict", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-suite-run-"));
|
|
try {
|
|
const skillDir = join(tmp, "skills", "langbot-testing");
|
|
const casesDir = join(skillDir, "cases");
|
|
const suitesDir = join(skillDir, "suites");
|
|
const scriptsDir = join(tmp, "scripts");
|
|
mkdirSync(casesDir, { recursive: true });
|
|
mkdirSync(suitesDir, { recursive: true });
|
|
mkdirSync(scriptsDir, { recursive: true });
|
|
writeFileSync(join(skillDir, "SKILL.md"), "---\nname: langbot-testing\ndescription: Testing.\n---\n\n# Testing\n");
|
|
writeFileSync(join(tmp, "skills", ".env"), "");
|
|
writeFileSync(
|
|
join(casesDir, "one.yaml"),
|
|
[
|
|
"id: one",
|
|
"title: One",
|
|
"mode: probe",
|
|
"area: qa",
|
|
"type: smoke",
|
|
"priority: p2",
|
|
"risk: low",
|
|
"ci_eligible: true",
|
|
"automation: scripts/pass.mjs",
|
|
"evidence_required:",
|
|
" - filesystem",
|
|
].join("\n"),
|
|
);
|
|
writeFileSync(
|
|
join(casesDir, "two.yaml"),
|
|
[
|
|
"id: two",
|
|
"title: Two",
|
|
"mode: probe",
|
|
"area: qa",
|
|
"type: smoke",
|
|
"priority: p2",
|
|
"risk: low",
|
|
"ci_eligible: true",
|
|
"automation: scripts/pass.mjs",
|
|
"evidence_required:",
|
|
" - filesystem",
|
|
].join("\n"),
|
|
);
|
|
writeFileSync(
|
|
join(suitesDir, "mini.yaml"),
|
|
[
|
|
"id: mini",
|
|
"title: Mini",
|
|
"description: Mini suite.",
|
|
"type: smoke",
|
|
"priority: p2",
|
|
"tags:",
|
|
" - qa",
|
|
"cases:",
|
|
" - one",
|
|
" - two",
|
|
].join("\n"),
|
|
);
|
|
writeFileSync(
|
|
join(scriptsDir, "pass.mjs"),
|
|
[
|
|
"import { mkdirSync, writeFileSync } from 'node:fs';",
|
|
"import { join } from 'node:path';",
|
|
"mkdirSync(process.env.LBS_EVIDENCE_DIR, { recursive: true });",
|
|
"writeFileSync(join(process.env.LBS_EVIDENCE_DIR, 'result.json'), JSON.stringify({",
|
|
" case_id: process.env.LBS_CASE_ID,",
|
|
" run_id: process.env.LBS_RUN_ID,",
|
|
" status: 'pass',",
|
|
" reason: `${process.env.LBS_CASE_ID} pass`,",
|
|
" evidence_collected: ['filesystem']",
|
|
"}));",
|
|
"writeFileSync(join(process.env.LBS_EVIDENCE_DIR, 'automation-result.json'), JSON.stringify({ status: 'pass' }));",
|
|
].join("\n"),
|
|
);
|
|
|
|
const result = capture(() => commandSuiteRun({
|
|
root: tmp,
|
|
args: ["suite", "run", "mini", "--run-id", "mini-run", "--evidence-dir", join(tmp, "evidence"), "--json"],
|
|
}));
|
|
|
|
assert.equal(result.code, 0);
|
|
const payload = JSON.parse(result.output);
|
|
assert.equal(payload.report.status, "pass");
|
|
assert.equal(payload.report.counts.pass, 2);
|
|
assert.deepEqual(payload.executions.map((item: { status: string }) => item.status), ["ok", "ok"]);
|
|
assert.ok(existsSync(join(tmp, "evidence", "one", "result.json")));
|
|
assert.ok(existsSync(join(tmp, "evidence", "two", "result.json")));
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("suite run JSON captures failed case output", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-suite-run-fail-"));
|
|
try {
|
|
const skillDir = join(tmp, "skills", "langbot-testing");
|
|
const casesDir = join(skillDir, "cases");
|
|
const suitesDir = join(skillDir, "suites");
|
|
const scriptsDir = join(tmp, "scripts");
|
|
mkdirSync(casesDir, { recursive: true });
|
|
mkdirSync(suitesDir, { recursive: true });
|
|
mkdirSync(scriptsDir, { recursive: true });
|
|
writeFileSync(join(skillDir, "SKILL.md"), "---\nname: langbot-testing\ndescription: Testing.\n---\n\n# Testing\n");
|
|
writeFileSync(join(tmp, "skills", ".env"), "");
|
|
writeFileSync(
|
|
join(casesDir, "fail-case.yaml"),
|
|
[
|
|
"id: fail-case",
|
|
"title: Fail Case",
|
|
"mode: probe",
|
|
"area: qa",
|
|
"type: smoke",
|
|
"priority: p2",
|
|
"risk: low",
|
|
"ci_eligible: true",
|
|
"automation: scripts/fail.mjs",
|
|
].join("\n"),
|
|
);
|
|
writeFileSync(
|
|
join(suitesDir, "mini.yaml"),
|
|
[
|
|
"id: mini",
|
|
"title: Mini",
|
|
"description: Mini suite.",
|
|
"type: smoke",
|
|
"priority: p2",
|
|
"tags:",
|
|
" - qa",
|
|
"cases:",
|
|
" - fail-case",
|
|
].join("\n"),
|
|
);
|
|
writeFileSync(join(scriptsDir, "fail.mjs"), "console.error('child failure detail'); process.exit(1);\n");
|
|
|
|
const result = capture(() => commandSuiteRun({
|
|
root: tmp,
|
|
args: ["suite", "run", "mini", "--run-id", "mini-run", "--evidence-dir", join(tmp, "evidence"), "--json"],
|
|
}));
|
|
|
|
assert.equal(result.code, 1);
|
|
const payload = JSON.parse(result.output);
|
|
assert.equal(payload.executions[0].status, "nonzero");
|
|
assert.match(payload.executions[0].stderr, /child failure detail/);
|
|
assert.equal(payload.report.status, "fail");
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("suite run failure cannot be masked by stale pass result", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-suite-run-stale-pass-"));
|
|
try {
|
|
const skillDir = join(tmp, "skills", "langbot-testing");
|
|
const casesDir = join(skillDir, "cases");
|
|
const suitesDir = join(skillDir, "suites");
|
|
const scriptsDir = join(tmp, "scripts");
|
|
const evidenceDir = join(tmp, "evidence");
|
|
mkdirSync(casesDir, { recursive: true });
|
|
mkdirSync(suitesDir, { recursive: true });
|
|
mkdirSync(scriptsDir, { recursive: true });
|
|
mkdirSync(join(evidenceDir, "fail-case"), { recursive: true });
|
|
writeFileSync(join(skillDir, "SKILL.md"), "---\nname: langbot-testing\ndescription: Testing.\n---\n\n# Testing\n");
|
|
writeFileSync(join(tmp, "skills", ".env"), "");
|
|
writeFileSync(
|
|
join(casesDir, "fail-case.yaml"),
|
|
[
|
|
"id: fail-case",
|
|
"title: Fail Case",
|
|
"mode: probe",
|
|
"area: qa",
|
|
"type: smoke",
|
|
"priority: p2",
|
|
"risk: low",
|
|
"ci_eligible: true",
|
|
"automation: scripts/fail.mjs",
|
|
"evidence_required:",
|
|
" - filesystem",
|
|
].join("\n"),
|
|
);
|
|
writeFileSync(
|
|
join(suitesDir, "mini.yaml"),
|
|
[
|
|
"id: mini",
|
|
"title: Mini",
|
|
"description: Mini suite.",
|
|
"type: smoke",
|
|
"priority: p2",
|
|
"tags:",
|
|
" - qa",
|
|
"cases:",
|
|
" - fail-case",
|
|
].join("\n"),
|
|
);
|
|
writeFileSync(join(scriptsDir, "fail.mjs"), "process.exit(1);\n");
|
|
writeFileSync(join(evidenceDir, "fail-case", "result.json"), JSON.stringify({
|
|
case_id: "fail-case",
|
|
run_id: "stale-run-fail-case",
|
|
status: "pass",
|
|
evidence_collected: ["filesystem"],
|
|
}));
|
|
|
|
const result = capture(() => commandSuiteRun({
|
|
root: tmp,
|
|
args: ["suite", "run", "mini", "--run-id", "stale-run", "--evidence-dir", evidenceDir, "--json"],
|
|
}));
|
|
|
|
assert.equal(result.code, 1);
|
|
const payload = JSON.parse(result.output);
|
|
assert.equal(payload.executions[0].status, "nonzero");
|
|
assert.equal(payload.report.status, "fail");
|
|
assert.equal(payload.report.execution_status, "fail");
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("suite run dry-run plans automation without creating evidence", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-suite-run-dry-"));
|
|
try {
|
|
const skillDir = join(tmp, "skills", "langbot-testing");
|
|
const casesDir = join(skillDir, "cases");
|
|
const suitesDir = join(skillDir, "suites");
|
|
const scriptsDir = join(tmp, "scripts");
|
|
mkdirSync(casesDir, { recursive: true });
|
|
mkdirSync(suitesDir, { recursive: true });
|
|
mkdirSync(scriptsDir, { recursive: true });
|
|
writeFileSync(join(skillDir, "SKILL.md"), "---\nname: langbot-testing\ndescription: Testing.\n---\n\n# Testing\n");
|
|
writeFileSync(join(tmp, "skills", ".env"), "");
|
|
writeFileSync(
|
|
join(casesDir, "dry-case.yaml"),
|
|
[
|
|
"id: dry-case",
|
|
"title: Dry Case",
|
|
"mode: probe",
|
|
"area: qa",
|
|
"type: smoke",
|
|
"priority: p2",
|
|
"risk: low",
|
|
"ci_eligible: true",
|
|
"automation: scripts/fail-if-run.mjs",
|
|
].join("\n"),
|
|
);
|
|
writeFileSync(
|
|
join(suitesDir, "dry-suite.yaml"),
|
|
[
|
|
"id: dry-suite",
|
|
"title: Dry Suite",
|
|
"description: Dry run suite.",
|
|
"type: smoke",
|
|
"priority: p2",
|
|
"tags:",
|
|
" - qa",
|
|
"cases:",
|
|
" - dry-case",
|
|
].join("\n"),
|
|
);
|
|
writeFileSync(join(scriptsDir, "fail-if-run.mjs"), "process.exit(9);\n");
|
|
|
|
const evidenceDir = join(tmp, "evidence");
|
|
const result = capture(() => commandSuiteRun({
|
|
root: tmp,
|
|
args: ["suite", "run", "dry-suite", "--run-id", "dry-run", "--evidence-dir", evidenceDir, "--dry-run", "--json"],
|
|
}));
|
|
|
|
assert.equal(result.code, 0);
|
|
const payload = JSON.parse(result.output);
|
|
assert.equal(payload.executions[0].status, "planned");
|
|
assert.match(payload.executions[0].command, /test run dry-case/);
|
|
assert.equal(payload.report.status, "incomplete");
|
|
assert.equal(existsSync(evidenceDir), false);
|
|
assert.equal(existsSync(join(tmp, "reports", "dry-run.md")), false);
|
|
|
|
const markdown = capture(() => commandSuiteRun({
|
|
root: tmp,
|
|
args: ["suite", "run", "dry-suite", "--run-id", "dry-run-markdown", "--evidence-dir", join(tmp, "evidence-md"), "--dry-run"],
|
|
}));
|
|
assert.equal(markdown.code, 0);
|
|
assert.match(markdown.output, /# Suite Report: dry-suite/);
|
|
assert.equal(existsSync(join(tmp, "reports", "dry-run-markdown.md")), false);
|
|
assert.equal(existsSync(join(tmp, "evidence-md")), false);
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("suite run skips manual-check cases unless explicitly included", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-suite-run-manual-"));
|
|
try {
|
|
const skillDir = join(tmp, "skills", "langbot-testing");
|
|
const casesDir = join(skillDir, "cases");
|
|
const suitesDir = join(skillDir, "suites");
|
|
const scriptsDir = join(tmp, "scripts");
|
|
mkdirSync(casesDir, { recursive: true });
|
|
mkdirSync(suitesDir, { recursive: true });
|
|
mkdirSync(scriptsDir, { recursive: true });
|
|
writeFileSync(join(skillDir, "SKILL.md"), "---\nname: langbot-testing\ndescription: Testing.\n---\n\n# Testing\n");
|
|
writeFileSync(join(tmp, "skills", ".env"), "");
|
|
writeFileSync(
|
|
join(casesDir, "manual-case.yaml"),
|
|
[
|
|
"id: manual-case",
|
|
"title: Manual Case",
|
|
"mode: probe",
|
|
"area: qa",
|
|
"type: smoke",
|
|
"priority: p2",
|
|
"risk: low",
|
|
"ci_eligible: true",
|
|
"preconditions:",
|
|
" - Confirm this case is safe to run.",
|
|
"automation: scripts/pass.mjs",
|
|
"evidence_required:",
|
|
" - filesystem",
|
|
].join("\n"),
|
|
);
|
|
writeFileSync(
|
|
join(suitesDir, "manual-suite.yaml"),
|
|
[
|
|
"id: manual-suite",
|
|
"title: Manual Suite",
|
|
"description: Manual check suite.",
|
|
"type: smoke",
|
|
"priority: p2",
|
|
"tags:",
|
|
" - qa",
|
|
"cases:",
|
|
" - manual-case",
|
|
].join("\n"),
|
|
);
|
|
writeFileSync(
|
|
join(scriptsDir, "pass.mjs"),
|
|
[
|
|
"import { mkdirSync, writeFileSync } from 'node:fs';",
|
|
"import { join } from 'node:path';",
|
|
"mkdirSync(process.env.LBS_EVIDENCE_DIR, { recursive: true });",
|
|
"writeFileSync(join(process.env.LBS_EVIDENCE_DIR, 'result.json'), JSON.stringify({ case_id: process.env.LBS_CASE_ID, run_id: process.env.LBS_RUN_ID, status: 'pass', evidence_collected: ['filesystem'] }));",
|
|
].join("\n"),
|
|
);
|
|
|
|
const skipped = capture(() => commandSuiteRun({
|
|
root: tmp,
|
|
args: ["suite", "run", "manual-suite", "--run-id", "manual-run", "--evidence-dir", join(tmp, "evidence"), "--json"],
|
|
}));
|
|
assert.equal(skipped.code, 1);
|
|
const skippedPayload = JSON.parse(skipped.output);
|
|
assert.equal(skippedPayload.executions[0].status, "skipped");
|
|
assert.match(skippedPayload.executions[0].reason, /manual_check/);
|
|
assert.equal(existsSync(join(tmp, "evidence", "manual-case", "result.json")), false);
|
|
|
|
const included = capture(() => commandSuiteRun({
|
|
root: tmp,
|
|
args: ["suite", "run", "manual-suite", "--run-id", "manual-run-included", "--evidence-dir", join(tmp, "evidence-included"), "--include-manual-check", "--json"],
|
|
}));
|
|
assert.equal(included.code, 0);
|
|
const includedPayload = JSON.parse(included.output);
|
|
assert.equal(includedPayload.executions[0].status, "ok");
|
|
assert.equal(includedPayload.report.status, "pass");
|
|
assert.ok(existsSync(join(tmp, "evidence-included", "manual-case", "result.json")));
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("suite run skips cases with missing machine readiness unless explicitly included", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-suite-run-readiness-"));
|
|
try {
|
|
const skillDir = join(tmp, "skills", "langbot-testing");
|
|
const casesDir = join(skillDir, "cases");
|
|
const suitesDir = join(skillDir, "suites");
|
|
const fixturesDir = join(skillDir, "fixtures");
|
|
const scriptsDir = join(tmp, "scripts");
|
|
mkdirSync(casesDir, { recursive: true });
|
|
mkdirSync(suitesDir, { recursive: true });
|
|
mkdirSync(fixturesDir, { recursive: true });
|
|
mkdirSync(scriptsDir, { recursive: true });
|
|
writeFileSync(join(skillDir, "SKILL.md"), "---\nname: langbot-testing\ndescription: Testing.\n---\n\n# Testing\n");
|
|
writeFileSync(join(tmp, "skills", ".env"), "");
|
|
writeFileSync(
|
|
join(casesDir, "not-ready-case.yaml"),
|
|
[
|
|
"id: not-ready-case",
|
|
"title: Not Ready Case",
|
|
"mode: probe",
|
|
"area: qa",
|
|
"type: smoke",
|
|
"priority: p2",
|
|
"risk: low",
|
|
"ci_eligible: true",
|
|
"env:",
|
|
" - LBS_TEST_SUITE_RUN_MISSING_ENV",
|
|
"automation_env:",
|
|
" - LBS_TEST_SUITE_RUN_MISSING_AUTOMATION_ENV",
|
|
"automation: scripts/pass.mjs",
|
|
"evidence_required:",
|
|
" - filesystem",
|
|
].join("\n"),
|
|
);
|
|
writeFileSync(
|
|
join(fixturesDir, "fixtures.json"),
|
|
`${JSON.stringify([{
|
|
id: "missing-fixture",
|
|
title: "Missing fixture",
|
|
kind: "file",
|
|
path: "fixtures/missing.txt",
|
|
related_cases: ["not-ready-case"],
|
|
checks: ["exists"],
|
|
}], null, 2)}\n`,
|
|
);
|
|
writeFileSync(
|
|
join(suitesDir, "readiness-suite.yaml"),
|
|
[
|
|
"id: readiness-suite",
|
|
"title: Readiness Suite",
|
|
"description: Readiness suite.",
|
|
"type: smoke",
|
|
"priority: p2",
|
|
"tags:",
|
|
" - qa",
|
|
"cases:",
|
|
" - not-ready-case",
|
|
].join("\n"),
|
|
);
|
|
writeFileSync(
|
|
join(scriptsDir, "pass.mjs"),
|
|
[
|
|
"import { mkdirSync, writeFileSync } from 'node:fs';",
|
|
"import { join } from 'node:path';",
|
|
"mkdirSync(process.env.LBS_EVIDENCE_DIR, { recursive: true });",
|
|
"writeFileSync(join(process.env.LBS_EVIDENCE_DIR, 'result.json'), JSON.stringify({ case_id: process.env.LBS_CASE_ID, run_id: process.env.LBS_RUN_ID, status: 'pass', evidence_collected: ['filesystem'] }));",
|
|
].join("\n"),
|
|
);
|
|
|
|
const skipped = capture(() => commandSuiteRun({
|
|
root: tmp,
|
|
args: ["suite", "run", "readiness-suite", "--run-id", "readiness-run", "--evidence-dir", join(tmp, "evidence"), "--json"],
|
|
}));
|
|
assert.equal(skipped.code, 1);
|
|
const skippedPayload = JSON.parse(skipped.output);
|
|
assert.equal(skippedPayload.executions[0].status, "skipped");
|
|
assert.match(skippedPayload.executions[0].reason, /readiness missing/);
|
|
assert.match(skippedPayload.executions[0].reason, /LBS_TEST_SUITE_RUN_MISSING_ENV/);
|
|
assert.match(skippedPayload.executions[0].reason, /LBS_TEST_SUITE_RUN_MISSING_AUTOMATION_ENV/);
|
|
assert.match(skippedPayload.executions[0].reason, /missing-fixture/);
|
|
assert.equal(existsSync(join(tmp, "evidence", "not-ready-case", "result.json")), false);
|
|
|
|
const included = capture(() => commandSuiteRun({
|
|
root: tmp,
|
|
args: ["suite", "run", "readiness-suite", "--run-id", "readiness-run-included", "--evidence-dir", join(tmp, "evidence-included"), "--include-not-ready", "--json"],
|
|
}));
|
|
assert.equal(included.code, 0);
|
|
const includedPayload = JSON.parse(included.output);
|
|
assert.equal(includedPayload.executions[0].status, "ok");
|
|
assert.equal(includedPayload.report.status, "pass");
|
|
assert.ok(existsSync(join(tmp, "evidence-included", "not-ready-case", "result.json")));
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("suite new writes a reusable suite skeleton", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-suite-new-"));
|
|
try {
|
|
const skillDir = join(tmp, "skills", "langbot-testing");
|
|
mkdirSync(skillDir, { recursive: true });
|
|
writeFileSync(
|
|
join(skillDir, "SKILL.md"),
|
|
"---\nname: langbot-testing\ndescription: Testing.\n---\n\n# Testing\n",
|
|
);
|
|
|
|
const result = capture(() => commandSuiteNew({
|
|
root: tmp,
|
|
args: ["suite", "new", "new-suite", "--title", "New Suite"],
|
|
}));
|
|
|
|
assert.equal(result.code, 0);
|
|
const text = readFileSync(join(skillDir, "suites", "new-suite.yaml"), "utf8");
|
|
assert.match(text, /^description:/m);
|
|
assert.match(text, /^priority: p2/m);
|
|
assert.match(text, /^cases:/m);
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("fixture list and check expose reusable fixture readiness", () => {
|
|
const list = capture(() => commandFixtureList(ctx(["fixture", "list", "langbot-testing", "--json"])));
|
|
assert.equal(list.code, 0);
|
|
const fixtures = JSON.parse(list.output);
|
|
assert.ok(fixtures.some((item: { id: string; exists: boolean }) => (
|
|
item.id === "mcp-stdio-echo-server" && item.exists === true
|
|
)));
|
|
|
|
const check = capture(() => commandFixtureCheck(ctx(["fixture", "check", "langbot-testing", "--json"])));
|
|
assert.equal(check.code, 0);
|
|
const report = JSON.parse(check.output);
|
|
assert.equal(report.status, "pass");
|
|
assert.ok(report.fixtures.some((item: { id: string }) => item.id === "qa-plugin-smoke-package"));
|
|
});
|
|
|
|
test("fixture check reports missing manifest paths", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-fixture-check-"));
|
|
try {
|
|
const skillDir = join(tmp, "skills", "langbot-testing");
|
|
mkdirSync(join(skillDir, "fixtures"), { recursive: true });
|
|
writeFileSync(
|
|
join(skillDir, "SKILL.md"),
|
|
"---\nname: langbot-testing\ndescription: Testing.\n---\n\n# Testing\n",
|
|
);
|
|
writeFileSync(
|
|
join(skillDir, "fixtures", "fixtures.json"),
|
|
JSON.stringify([{ id: "missing-fixture", title: "Missing Fixture", path: "fixtures/missing.txt" }]),
|
|
);
|
|
|
|
const result = capture(() => commandFixtureCheck({ root: tmp, args: ["fixture", "check", "langbot-testing", "--json"] }));
|
|
|
|
assert.equal(result.code, 1);
|
|
const report = JSON.parse(result.output);
|
|
assert.equal(report.status, "fail");
|
|
assert.ok(report.findings.some((finding: { id?: string }) => finding.id === "missing-fixture"));
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("fixture check verifies QA AgentRunner source shape", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-fixture-check-"));
|
|
try {
|
|
const skillDir = join(tmp, "skills", "langbot-testing");
|
|
const fixtureDir = join(skillDir, "fixtures", "plugins", "qa-agent-runner");
|
|
mkdirSync(join(fixtureDir, "components", "agent_runner"), { recursive: true });
|
|
writeFileSync(
|
|
join(skillDir, "SKILL.md"),
|
|
"---\nname: langbot-testing\ndescription: Testing.\n---\n\n# Testing\n",
|
|
);
|
|
writeFileSync(
|
|
join(skillDir, "fixtures", "fixtures.json"),
|
|
JSON.stringify([{
|
|
id: "qa-agent-runner-source",
|
|
title: "QA AgentRunner",
|
|
path: "fixtures/plugins/qa-agent-runner/manifest.yaml",
|
|
checks: ["exists", "qa_agent_runner_source"],
|
|
}]),
|
|
);
|
|
writeFileSync(join(fixtureDir, "manifest.yaml"), "spec:\n components:\n AgentRunner: {}\nexecution:\n python:\n attr: QAAgentRunnerPlugin\n");
|
|
|
|
const result = capture(() => commandFixtureCheck({ root: tmp, args: ["fixture", "check", "langbot-testing", "--json"] }));
|
|
|
|
assert.equal(result.code, 1);
|
|
const report = JSON.parse(result.output);
|
|
assert.ok(report.findings.some((finding: { kind?: string; path?: string }) => (
|
|
finding.kind === "fixture_check_missing_file"
|
|
&& finding.path?.endsWith("components/agent_runner/default.py")
|
|
)));
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("fixture check accepts complete QA AgentRunner source shape", () => {
|
|
const result = capture(() => commandFixtureCheck(ctx(["fixture", "check", "langbot-testing", "--json"])));
|
|
assert.equal(result.code, 0);
|
|
const report = JSON.parse(result.output);
|
|
assert.ok(report.fixtures.some((item: { id: string; checks: string[] }) => (
|
|
item.id === "qa-agent-runner-source" && item.checks.includes("qa_agent_runner_source")
|
|
)));
|
|
});
|
|
|
|
test("fixture check rejects invalid plugin package files", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-fixture-check-"));
|
|
try {
|
|
const skillDir = join(tmp, "skills", "langbot-testing");
|
|
mkdirSync(join(skillDir, "fixtures"), { recursive: true });
|
|
writeFileSync(
|
|
join(skillDir, "SKILL.md"),
|
|
"---\nname: langbot-testing\ndescription: Testing.\n---\n\n# Testing\n",
|
|
);
|
|
writeFileSync(join(skillDir, "fixtures", "bad.lbpkg"), "not a zip");
|
|
writeFileSync(
|
|
join(skillDir, "fixtures", "fixtures.json"),
|
|
JSON.stringify([{
|
|
id: "bad-package",
|
|
title: "Bad Package",
|
|
path: "fixtures/bad.lbpkg",
|
|
checks: ["exists", "zip_package"],
|
|
}]),
|
|
);
|
|
|
|
const result = capture(() => commandFixtureCheck({ root: tmp, args: ["fixture", "check", "langbot-testing", "--json"] }));
|
|
|
|
assert.equal(result.code, 1);
|
|
const report = JSON.parse(result.output);
|
|
assert.ok(report.findings.some((finding: { kind?: string; id?: string }) => (
|
|
finding.kind === "fixture_check_invalid_zip" && finding.id === "bad-package"
|
|
)));
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("debug chat classifier prefers latest response leaf over body counts", () => {
|
|
const result = classifyDebugChatResult({
|
|
beforeText: "OK from an older chat",
|
|
afterText: "OK from an older chat\nUser: say OK\nBot: OK",
|
|
expectedText: "OK",
|
|
prompt: "say OK",
|
|
latestExpectedLeaf: "Bot: OK",
|
|
latestFailureLeaf: "",
|
|
});
|
|
|
|
assert.equal(result.status, "pass");
|
|
assert.match(result.reason, /latest visible response leaf/);
|
|
});
|
|
|
|
test("debug chat classifier distinguishes new failure signals from old history", () => {
|
|
assert.equal(
|
|
findNewFailureSignal("Agent runner temporarily unavailable", "Agent runner temporarily unavailable"),
|
|
"",
|
|
);
|
|
assert.equal(
|
|
findNewFailureSignal("", "Agent runner temporarily unavailable"),
|
|
"Agent runner temporarily unavailable",
|
|
);
|
|
|
|
const result = classifyDebugChatResult({
|
|
beforeText: "",
|
|
afterText: "Agent runner temporarily unavailable",
|
|
expectedText: "OK",
|
|
prompt: "say OK",
|
|
latestExpectedLeaf: "",
|
|
latestFailureLeaf: "Agent runner temporarily unavailable",
|
|
});
|
|
|
|
assert.equal(result.status, "fail");
|
|
assert.match(result.reason, /known failure signal/);
|
|
|
|
const custom = classifyDebugChatResult({
|
|
beforeText: "",
|
|
afterText: "Bot: qa-plugin-smoke:mcp-ok-local-agent",
|
|
expectedText: "qa_mcp_echo:mcp-ok-local-agent",
|
|
prompt: "call mcp",
|
|
latestExpectedLeaf: "",
|
|
latestFailureLeaf: "Bot: qa-plugin-smoke:mcp-ok-local-agent",
|
|
failureSignals: ["qa-plugin-smoke:mcp-ok-local-agent"],
|
|
});
|
|
|
|
assert.equal(custom.status, "fail");
|
|
assert.equal(custom.failure_signal, "qa-plugin-smoke:mcp-ok-local-agent");
|
|
});
|
|
|
|
test("debug chat classifier lets new failure signals override stale expected history", () => {
|
|
const result = classifyDebugChatResult({
|
|
beforeText: "Bot: qa_mcp_echo:mcp-ok-local-agent",
|
|
afterText: [
|
|
"Bot: qa_mcp_echo:mcp-ok-local-agent",
|
|
"User: Call qa_mcp_echo",
|
|
"Bot: Agent runner temporarily unavailable.",
|
|
].join("\n"),
|
|
expectedText: "qa_mcp_echo:mcp-ok-local-agent",
|
|
prompt: "Call qa_mcp_echo",
|
|
latestExpectedLeaf: "Bot: qa_mcp_echo:mcp-ok-local-agent",
|
|
latestFailureLeaf: "Bot: Agent runner temporarily unavailable.",
|
|
});
|
|
|
|
assert.equal(result.status, "fail");
|
|
assert.equal(result.failure_signal, "Agent runner temporarily unavailable");
|
|
});
|
|
|
|
test("debug chat classifier does not pass on stale expected history without a new occurrence", () => {
|
|
const result = classifyDebugChatResult({
|
|
beforeText: "Bot: qa_mcp_echo:mcp-ok-local-agent",
|
|
afterText: [
|
|
"Bot: qa_mcp_echo:mcp-ok-local-agent",
|
|
"User: Call qa_mcp_echo",
|
|
].join("\n"),
|
|
expectedText: "qa_mcp_echo:mcp-ok-local-agent",
|
|
prompt: "Call qa_mcp_echo",
|
|
latestExpectedLeaf: "Bot: qa_mcp_echo:mcp-ok-local-agent",
|
|
latestFailureLeaf: "",
|
|
});
|
|
|
|
assert.equal(result.status, "fail");
|
|
assert.equal(result.final_count, 1);
|
|
assert.equal(result.min_expected_count, 2);
|
|
});
|
|
|
|
test("debug chat classifier accounts for prompt echo occurrences", () => {
|
|
assert.equal(minExpectedOccurrences("", "OK", "say OK"), 2);
|
|
const result = classifyDebugChatResult({
|
|
beforeText: "",
|
|
afterText: "User: say OK",
|
|
expectedText: "OK",
|
|
prompt: "say OK",
|
|
latestExpectedLeaf: "User: say OK",
|
|
latestFailureLeaf: "",
|
|
});
|
|
|
|
assert.equal(result.status, "fail");
|
|
assert.equal(result.min_expected_count, 2);
|
|
assert.equal(result.final_count, 1);
|
|
});
|
|
|
|
test("debug chat classifier requires new assistant evidence when message bubbles are available", () => {
|
|
const prompt = "If all steps succeed, final answer must be E2E_OK:skill";
|
|
const result = classifyDebugChatResult({
|
|
beforeText: "",
|
|
afterText: `User: ${prompt}`,
|
|
expectedText: "E2E_OK:skill",
|
|
prompt,
|
|
latestExpectedLeaf: prompt,
|
|
latestFailureLeaf: "",
|
|
beforeMessages: [],
|
|
afterMessages: [{ role: "user", text: prompt }],
|
|
latestAssistantText: "",
|
|
});
|
|
|
|
assert.equal(result.status, "fail");
|
|
assert.match(result.reason, /new assistant message/);
|
|
assert.equal(result.before_assistant_expected_count, 0);
|
|
assert.equal(result.after_assistant_expected_count, 0);
|
|
});
|
|
|
|
test("debug chat classifier passes when expected text appears in a new assistant message", () => {
|
|
const prompt = "Return only E2E_OK:skill";
|
|
const result = classifyDebugChatResult({
|
|
beforeText: "",
|
|
afterText: `User: ${prompt}\nBot: E2E_OK:skill`,
|
|
expectedText: "E2E_OK:skill",
|
|
prompt,
|
|
latestExpectedLeaf: "E2E_OK:skill",
|
|
latestFailureLeaf: "",
|
|
beforeMessages: [],
|
|
afterMessages: [
|
|
{ role: "user", text: prompt },
|
|
{ role: "assistant", text: "E2E_OK:skill" },
|
|
],
|
|
latestAssistantText: "E2E_OK:skill",
|
|
});
|
|
|
|
assert.equal(result.status, "pass");
|
|
assert.match(result.reason, /new assistant message/);
|
|
assert.equal(result.before_assistant_expected_count, 0);
|
|
assert.equal(result.after_assistant_expected_count, 1);
|
|
});
|
|
|
|
test("debug chat classifier allows a recovered failure when latest assistant is successful", () => {
|
|
const expectedText = "E2E_OK:skill";
|
|
const result = classifyDebugChatResult({
|
|
beforeText: "",
|
|
afterText: [
|
|
"Bot: Agent runner temporarily unavailable",
|
|
`Bot: recovered and completed ${expectedText}`,
|
|
].join("\n"),
|
|
expectedText,
|
|
prompt: "Modify the existing skill",
|
|
latestExpectedLeaf: `recovered and completed ${expectedText}`,
|
|
latestFailureLeaf: "Agent runner temporarily unavailable",
|
|
beforeMessages: [],
|
|
afterMessages: [
|
|
{ role: "assistant", text: "Agent runner temporarily unavailable" },
|
|
{ role: "assistant", text: `recovered and completed ${expectedText}` },
|
|
],
|
|
latestAssistantText: `recovered and completed ${expectedText}`,
|
|
});
|
|
|
|
assert.equal(result.status, "pass");
|
|
assert.equal(result.before_assistant_expected_count, 0);
|
|
assert.equal(result.after_assistant_expected_count, 1);
|
|
});
|
|
|
|
test("env doctor explains a missing backend listener with a startup hint", async () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-env-doctor-"));
|
|
try {
|
|
const skillsDir = join(tmp, "skills");
|
|
const repoDir = join(tmp, "LangBot");
|
|
const webDir = join(repoDir, "web");
|
|
const browserProfile = join(tmp, "browser-profile");
|
|
const chromium = join(tmp, "chromium");
|
|
mkdirSync(skillsDir, { recursive: true });
|
|
mkdirSync(webDir, { recursive: true });
|
|
mkdirSync(browserProfile, { recursive: true });
|
|
writeFileSync(chromium, "");
|
|
writeFileSync(
|
|
join(skillsDir, ".env"),
|
|
[
|
|
"LANGBOT_BACKEND_URL=http://127.0.0.1:59998",
|
|
"LANGBOT_FRONTEND_URL=http://127.0.0.1:59998",
|
|
"LANGBOT_DEV_FRONTEND_URL=http://127.0.0.1:59998",
|
|
`LANGBOT_REPO=${repoDir}`,
|
|
`LANGBOT_WEB_REPO=${webDir}`,
|
|
`LANGBOT_BROWSER_PROFILE=${browserProfile}`,
|
|
`LANGBOT_CHROMIUM_EXECUTABLE=${chromium}`,
|
|
"LANGBOT_PROXY_HTTP=http://127.0.0.1:7890",
|
|
"LANGBOT_PROXY_SOCKS=socks5://127.0.0.1:7890",
|
|
"LANGBOT_NO_PROXY=localhost,127.0.0.1,::1",
|
|
].join("\n"),
|
|
);
|
|
|
|
const result = await captureAsync(() => commandEnvDoctor({ root: tmp, args: ["env", "doctor"] }));
|
|
|
|
assert.equal(result.code, 1);
|
|
assert.match(result.output, /FAIL: LANGBOT_BACKEND_URL: no HTTP service reachable because 127\.0\.0\.1:59998 is not listening/);
|
|
assert.match(result.output, new RegExp(`WARN: LANGBOT_BACKEND_URL: start backend: cd ${repoDir.replace(/[.*+?^${}()|[\]\\]/g, "\\$&")} && uv run main.py`));
|
|
assert.match(result.output, new RegExp(`WARN: LANGBOT_FRONTEND_URL: start frontend: cd ${webDir.replace(/[.*+?^${}()|[\]\\]/g, "\\$&")} && pnpm dev`));
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("env doctor does not require proxy variables", async () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-env-doctor-no-proxy-"));
|
|
try {
|
|
const skillsDir = join(tmp, "skills");
|
|
const repoDir = join(tmp, "LangBot");
|
|
const webDir = join(repoDir, "web");
|
|
const browserProfile = join(tmp, "browser-profile");
|
|
const chromium = join(tmp, "chromium");
|
|
mkdirSync(skillsDir, { recursive: true });
|
|
mkdirSync(webDir, { recursive: true });
|
|
mkdirSync(browserProfile, { recursive: true });
|
|
writeFileSync(chromium, "");
|
|
writeFileSync(
|
|
join(skillsDir, ".env"),
|
|
[
|
|
"LANGBOT_BACKEND_URL=http://127.0.0.1:59997",
|
|
"LANGBOT_FRONTEND_URL=http://127.0.0.1:59997",
|
|
"LANGBOT_DEV_FRONTEND_URL=http://127.0.0.1:59997",
|
|
`LANGBOT_REPO=${repoDir}`,
|
|
`LANGBOT_WEB_REPO=${webDir}`,
|
|
`LANGBOT_BROWSER_PROFILE=${browserProfile}`,
|
|
`LANGBOT_CHROMIUM_EXECUTABLE=${chromium}`,
|
|
].join("\n"),
|
|
);
|
|
|
|
const result = await captureAsync(() => commandEnvDoctor({ root: tmp, args: ["env", "doctor"] }));
|
|
|
|
assert.equal(result.code, 1);
|
|
assert.doesNotMatch(result.output, /missing LANGBOT_PROXY|missing LANGBOT_NO_PROXY/);
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("env show redacts secret-like values by default", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-env-show-redact-"));
|
|
try {
|
|
mkdirSync(join(tmp, "skills"), { recursive: true });
|
|
writeFileSync(
|
|
join(tmp, "skills", ".env"),
|
|
[
|
|
"LANGBOT_FRONTEND_URL=http://127.0.0.1:3000",
|
|
"LANGBOT_API_KEY=sk-test-secret",
|
|
"LANGBOT_PROXY_HTTP=http://user:pass@127.0.0.1:7890",
|
|
].join("\n"),
|
|
);
|
|
|
|
const text = capture(() => commandEnvShow({ root: tmp, args: ["env", "show"] }));
|
|
assert.equal(text.code, 0);
|
|
assert.match(text.output, /LANGBOT_API_KEY=\[redacted\]/);
|
|
assert.match(text.output, /LANGBOT_PROXY_HTTP=http:\/\/\[redacted\]@127\.0\.0\.1:7890/);
|
|
assert.doesNotMatch(text.output, /sk-test-secret|user:pass/);
|
|
|
|
const json = capture(() => commandEnvShow({ root: tmp, args: ["env", "show", "--json"] }));
|
|
assert.equal(json.code, 0);
|
|
const parsed = JSON.parse(json.output);
|
|
assert.equal(parsed.LANGBOT_API_KEY, "[redacted]");
|
|
assert.equal(parsed.LANGBOT_PROXY_HTTP, "http://[redacted]@127.0.0.1:7890");
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("test plan renders agent-browser QA guidance", () => {
|
|
const result = capture(() => commandTestPlan(ctx(["test", "plan", "pipeline-debug-chat"])));
|
|
assert.equal(result.code, 0);
|
|
assert.match(result.output, /Mode: agent-browser/);
|
|
assert.match(result.output, /Use browser\/UI interaction as the primary QA path/);
|
|
assert.match(result.output, /API\/curl\/log checks are diagnostic only/);
|
|
assert.match(result.output, /## Browser Steps/);
|
|
assert.match(result.output, /## Success Signals/);
|
|
assert.match(result.output, /## Required Evidence/);
|
|
assert.match(result.output, /## Automation Readiness/);
|
|
assert.match(result.output, /## Fixture Readiness/);
|
|
assert.match(result.output, /## Manual Readiness/);
|
|
assert.match(result.output, /backend_log/);
|
|
});
|
|
|
|
test("test plan JSON is parseable and includes troubleshooting patterns", () => {
|
|
const result = capture(() => commandTestPlan(ctx(["test", "plan", "pipeline-debug-chat", "--json"])));
|
|
assert.equal(result.code, 0);
|
|
const plan = JSON.parse(result.output);
|
|
assert.equal(plan.id, "pipeline-debug-chat");
|
|
assert.equal(plan.mode, "agent-browser");
|
|
assert.ok(["ready", "missing"].includes(plan.automation_readiness.status));
|
|
assert.ok(plan.automation_readiness.defaulted.includes("LANGBOT_E2E_PROMPT"));
|
|
assert.ok(plan.automation_readiness.defaulted.includes("LANGBOT_E2E_EXPECTED_TEXT"));
|
|
assert.equal(plan.manual_readiness.status, "manual_check");
|
|
assert.ok(plan.success_patterns.includes("Streaming completed"));
|
|
assert.ok(plan.troubleshooting.some((entry: { id: string }) => entry.id === "plugin-runtime-timeout"));
|
|
});
|
|
|
|
test("test plan JSON exposes missing case-specific pipeline readiness", () => {
|
|
const result = capture(() => commandTestPlan(ctx(["test", "plan", "local-agent-basic-debug-chat", "--json"])));
|
|
assert.equal(result.code, 0);
|
|
const plan = JSON.parse(result.output);
|
|
assert.equal(plan.env_readiness.status, "ready");
|
|
assert.ok(["ready", "missing"].includes(plan.automation_readiness.status));
|
|
assert.ok(plan.automation_readiness.pipeline_env_required);
|
|
assert.ok(
|
|
plan.automation_readiness.missing.includes("LANGBOT_LOCAL_AGENT_PIPELINE_URL|LANGBOT_LOCAL_AGENT_PIPELINE_NAME")
|
|
|| plan.automation_readiness.configured.some((key: string) => key.startsWith("LANGBOT_LOCAL_AGENT_PIPELINE_")),
|
|
);
|
|
});
|
|
|
|
test("generic pipeline readiness accepts either URL or name target", () => {
|
|
const originalUrl = process.env.LANGBOT_PIPELINE_URL;
|
|
const originalName = process.env.LANGBOT_PIPELINE_NAME;
|
|
try {
|
|
withEnv({
|
|
LANGBOT_BROWSER_PROFILE: "/tmp/langbot-test-profile",
|
|
LANGBOT_CHROMIUM_EXECUTABLE: "/tmp/langbot-test-chromium",
|
|
}, () => {
|
|
process.env.LANGBOT_PIPELINE_URL = "http://127.0.0.1:3000/home/pipelines?id=only-url";
|
|
process.env.LANGBOT_PIPELINE_NAME = "";
|
|
|
|
const ready = capture(() => commandTestPlan(ctx(["test", "plan", "pipeline-debug-chat", "--json"])));
|
|
assert.equal(ready.code, 0);
|
|
const plan = JSON.parse(ready.output);
|
|
assert.equal(plan.env_readiness.status, "ready");
|
|
assert.equal(plan.automation_readiness.status, "ready");
|
|
assert.ok(plan.automation_readiness.required.includes("LANGBOT_PIPELINE_URL|LANGBOT_PIPELINE_NAME"));
|
|
});
|
|
|
|
process.env.LANGBOT_PIPELINE_URL = "";
|
|
process.env.LANGBOT_PIPELINE_NAME = "";
|
|
|
|
const missing = capture(() => commandTestPlan(ctx(["test", "plan", "pipeline-debug-chat", "--json"])));
|
|
assert.equal(missing.code, 0);
|
|
const missingPlan = JSON.parse(missing.output);
|
|
assert.equal(missingPlan.env_readiness.status, "missing");
|
|
assert.ok(missingPlan.env_readiness.missing.includes("LANGBOT_PIPELINE_URL|LANGBOT_PIPELINE_NAME"));
|
|
assert.equal(missingPlan.automation_readiness.status, "missing");
|
|
assert.ok(missingPlan.automation_readiness.missing.includes("LANGBOT_PIPELINE_URL|LANGBOT_PIPELINE_NAME"));
|
|
} finally {
|
|
if (originalUrl === undefined) delete process.env.LANGBOT_PIPELINE_URL;
|
|
else process.env.LANGBOT_PIPELINE_URL = originalUrl;
|
|
if (originalName === undefined) delete process.env.LANGBOT_PIPELINE_NAME;
|
|
else process.env.LANGBOT_PIPELINE_NAME = originalName;
|
|
}
|
|
});
|
|
|
|
test("test recommend maps AgentRunner ledger changes to focused probes", () => {
|
|
const result = capture(() => commandTestRecommend(ctx([
|
|
"test",
|
|
"recommend",
|
|
"--file",
|
|
"LangBot/src/langbot/pkg/agent/runner/run_ledger_store.py",
|
|
"--file",
|
|
"LangBot/tests/unit_tests/agent/test_run_ledger_store.py",
|
|
"--json",
|
|
])));
|
|
assert.equal(result.code, 0);
|
|
const report = JSON.parse(result.output);
|
|
const ids = report.recommendations.map((item: { id: string }) => item.id);
|
|
assert.ok(ids.includes("agent-runner-ledger-invariants"));
|
|
assert.ok(ids.includes("agent-runner-ledger-stress"));
|
|
assert.ok(ids.includes("agent-runner-ledger-contention"));
|
|
assert.ok(ids.includes("agent-runner-async-db-readiness"));
|
|
assert.ok(ids.includes("agent-runner-ledger-concurrency"));
|
|
assert.ok(report.commands.every((command: string) => !command.startsWith("bin/lbs test run ") || command.endsWith(" --dry-run")));
|
|
assert.ok(report.notes.some((note: string) => note.includes("Remove --dry-run")));
|
|
});
|
|
|
|
test("test recommend maps AgentRunner result changes to fixture contract", () => {
|
|
const result = capture(() => commandTestRecommend(ctx([
|
|
"test",
|
|
"recommend",
|
|
"--file",
|
|
"langbot-plugin-sdk/src/langbot_plugin/api/entities/builtin/agent_runner/result.py",
|
|
"--json",
|
|
])));
|
|
assert.equal(result.code, 0);
|
|
const report = JSON.parse(result.output);
|
|
const ids = report.recommendations.map((item: { id: string }) => item.id);
|
|
assert.ok(ids.includes("agent-runner-fixture-contract"));
|
|
assert.ok(ids.includes("agent-runner-behavior-matrix"));
|
|
assert.ok(!ids.includes("agent-runner-ledger-invariants"));
|
|
});
|
|
|
|
test("test recommend maps QA AgentRunner fixture changes to live install", () => {
|
|
const result = capture(() => commandTestRecommend(ctx([
|
|
"test",
|
|
"recommend",
|
|
"--file",
|
|
"langbot-skills/skills/langbot-testing/fixtures/plugins/qa-agent-runner/components/agent_runner/default.py",
|
|
"--json",
|
|
])));
|
|
assert.equal(result.code, 0);
|
|
const report = JSON.parse(result.output);
|
|
const ids = report.recommendations.map((item: { id: string }) => item.id);
|
|
assert.ok(ids.includes("agent-runner-fixture-contract"));
|
|
assert.ok(ids.includes("agent-runner-live-install"));
|
|
assert.ok(ids.includes("agent-runner-qa-debug-chat"));
|
|
});
|
|
|
|
test("test recommend maps QA plugin smoke fixture changes to live install", () => {
|
|
const result = capture(() => commandTestRecommend(ctx([
|
|
"test",
|
|
"recommend",
|
|
"--file",
|
|
"langbot-skills/skills/langbot-testing/fixtures/plugins/qa-plugin-smoke/main.py",
|
|
"--json",
|
|
])));
|
|
assert.equal(result.code, 0);
|
|
const report = JSON.parse(result.output);
|
|
const ids = report.recommendations.map((item: { id: string }) => item.id);
|
|
assert.ok(ids.includes("qa-plugin-smoke-live-install"));
|
|
});
|
|
|
|
test("test recommend keeps git status paths intact", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-recommend-git-"));
|
|
const originalRepos = {
|
|
LANGBOT_REPO: process.env.LANGBOT_REPO,
|
|
LANGBOT_PLUGIN_SDK_REPO: process.env.LANGBOT_PLUGIN_SDK_REPO,
|
|
LANGBOT_AGENT_RUNNER_REPO: process.env.LANGBOT_AGENT_RUNNER_REPO,
|
|
LANGBOT_LOCAL_AGENT_REPO: process.env.LANGBOT_LOCAL_AGENT_REPO,
|
|
};
|
|
try {
|
|
const repo = join(tmp, "LangBot");
|
|
mkdirSync(join(repo, "src", "langbot", "pkg", "agent", "runner"), { recursive: true });
|
|
spawnSync("git", ["init"], { cwd: repo });
|
|
spawnSync("git", ["config", "user.email", "qa@example.test"], { cwd: repo });
|
|
spawnSync("git", ["config", "user.name", "QA"], { cwd: repo });
|
|
writeFileSync(join(repo, "README.md"), "test\n");
|
|
writeFileSync(join(repo, "src", "langbot", "pkg", "agent", "runner", "run_ledger_store.py"), "# test\n");
|
|
spawnSync("git", ["add", "README.md", "src/langbot/pkg/agent/runner/run_ledger_store.py"], { cwd: repo });
|
|
spawnSync("git", ["commit", "-m", "init"], { cwd: repo });
|
|
writeFileSync(join(repo, "src", "langbot", "pkg", "agent", "runner", "run_ledger_store.py"), "# changed\n");
|
|
|
|
process.env.LANGBOT_REPO = repo;
|
|
process.env.LANGBOT_PLUGIN_SDK_REPO = join(tmp, "missing-sdk");
|
|
process.env.LANGBOT_AGENT_RUNNER_REPO = join(tmp, "missing-runner");
|
|
process.env.LANGBOT_LOCAL_AGENT_REPO = join(tmp, "missing-local");
|
|
const result = capture(() => commandTestRecommend({ root, args: ["test", "recommend", "--json"] }));
|
|
|
|
assert.equal(result.code, 0);
|
|
const report = JSON.parse(result.output);
|
|
assert.ok(report.changed_files.includes("LangBot/src/langbot/pkg/agent/runner/run_ledger_store.py"));
|
|
assert.ok(!report.changed_files.some((file: string) => file.includes("LangBot/rc/")));
|
|
} finally {
|
|
for (const [key, value] of Object.entries(originalRepos)) {
|
|
if (value === undefined) delete process.env[key];
|
|
else process.env[key] = value;
|
|
}
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("test start creates a run handoff with a bounded report command", () => {
|
|
const result = capture(() => commandTestStart(ctx(["test", "start", "pipeline-debug-chat"])));
|
|
assert.equal(result.code, 0);
|
|
assert.match(result.output, /^# Test Start: pipeline-debug-chat/m);
|
|
assert.match(result.output, /bin\/lbs test plan pipeline-debug-chat/);
|
|
assert.match(result.output, /bin\/lbs test run pipeline-debug-chat --run-id .+ --output reports\/evidence\/.+pipeline-debug-chat/);
|
|
assert.match(result.output, /bin\/lbs test report pipeline-debug-chat --since ".+" --console-log reports\/evidence\/.+\/console\.log --evidence-dir reports\/evidence\/.+ --output reports\/.+pipeline-debug-chat\.md/);
|
|
assert.match(result.output, /Streaming completed/);
|
|
});
|
|
|
|
test("test start JSON is parseable for agent orchestration", () => {
|
|
const result = capture(() => commandTestStart(ctx(["test", "start", "pipeline-debug-chat", "--json"])));
|
|
assert.equal(result.code, 0);
|
|
const start = JSON.parse(result.output);
|
|
assert.equal(start.case.id, "pipeline-debug-chat");
|
|
assert.match(start.run_id, /pipeline-debug-chat$/);
|
|
assert.match(start.started_at_local, /\d{4}-\d{2}-\d{2}T/);
|
|
assert.match(start.report_command, /--since/);
|
|
assert.match(start.result_command_template, /bin\/lbs test result pipeline-debug-chat/);
|
|
assert.match(start.automation.command, /bin\/lbs test run pipeline-debug-chat/);
|
|
assert.ok(start.success_patterns.includes("Streaming completed"));
|
|
assert.ok(start.evidence_required.includes("backend_log"));
|
|
});
|
|
|
|
test("test result writes a suite-readable result.json and enforces pass evidence", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-test-result-"));
|
|
try {
|
|
const evidenceDir = join(tmp, "pipeline-run");
|
|
const ok = capture(() => commandTestResult(ctx([
|
|
"test",
|
|
"result",
|
|
"pipeline-debug-chat",
|
|
"--result",
|
|
"pass",
|
|
"--reason",
|
|
"Debug Chat returned OK and logs were clean.",
|
|
"--evidence-dir",
|
|
evidenceDir,
|
|
"--started-at",
|
|
"2026-05-21T10:30:00.000+08:00",
|
|
"--evidence",
|
|
"ui,screenshot,console,backend_log",
|
|
"--json",
|
|
])));
|
|
|
|
assert.equal(ok.code, 0);
|
|
const record = JSON.parse(ok.output);
|
|
assert.equal(record.source, "final");
|
|
assert.equal(record.status, "pass");
|
|
assert.equal(record.evidence_status, "complete");
|
|
assert.deepEqual(record.evidence_missing, []);
|
|
assert.equal(JSON.parse(readFileSync(join(evidenceDir, "result.json"), "utf8")).case_id, "pipeline-debug-chat");
|
|
|
|
const missing = captureAll(() => commandTestResult(ctx([
|
|
"test",
|
|
"result",
|
|
"pipeline-debug-chat",
|
|
"--result",
|
|
"pass",
|
|
"--reason",
|
|
"Missing backend evidence should not be accepted as pass.",
|
|
"--evidence-dir",
|
|
join(tmp, "missing-evidence"),
|
|
"--evidence",
|
|
"ui",
|
|
])));
|
|
assert.equal(missing.code, 1);
|
|
assert.match(missing.error, /missing required evidence/);
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("test run dry-run exposes case automation script and evidence paths", () => {
|
|
const result = capture(() => commandTestRun(ctx([
|
|
"test",
|
|
"run",
|
|
"pipeline-debug-chat",
|
|
"--run-id",
|
|
"run-123",
|
|
"--output",
|
|
"reports/evidence/run-123",
|
|
"--dry-run",
|
|
])));
|
|
assert.equal(result.code, 0);
|
|
assert.match(result.output, /^# Test Automation: pipeline-debug-chat/m);
|
|
assert.match(result.output, /scripts\/e2e\/pipeline-debug-chat\.mjs/);
|
|
assert.match(result.output, /console_log: reports\/evidence\/run-123\/console\.log/);
|
|
assert.match(result.output, /automation_result_json: reports\/evidence\/run-123\/automation-result\.json/);
|
|
assert.match(result.output, /result_json: reports\/evidence\/run-123\/result\.json/);
|
|
assert.match(result.output, /LANGBOT_PIPELINE_URL/);
|
|
});
|
|
|
|
test("test run dry-run JSON is parseable for automation orchestration", () => {
|
|
const result = capture(() => commandTestRun(ctx([
|
|
"test",
|
|
"run",
|
|
"webui-login-state",
|
|
"--run-id",
|
|
"login-run",
|
|
"--dry-run",
|
|
"--json",
|
|
])));
|
|
assert.equal(result.code, 0);
|
|
const run = JSON.parse(result.output);
|
|
assert.equal(run.case.id, "webui-login-state");
|
|
assert.equal(run.run_id, "login-run");
|
|
assert.equal(run.automation.script, "scripts/e2e/webui-login-state.mjs");
|
|
assert.equal(run.automation.exists, true);
|
|
assert.match(run.automation.automation_result_json, /automation-result\.json$/);
|
|
assert.match(run.automation.result_json, /result\.json$/);
|
|
assert.match(run.automation.report_command, /--console-log/);
|
|
});
|
|
|
|
test("test run JSON executes automation unless dry-run is explicit", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-run-json-exec-"));
|
|
try {
|
|
const skillDir = join(tmp, "skills", "langbot-testing");
|
|
const casesDir = join(skillDir, "cases");
|
|
const scriptsDir = join(tmp, "scripts");
|
|
mkdirSync(casesDir, { recursive: true });
|
|
mkdirSync(scriptsDir, { recursive: true });
|
|
writeFileSync(join(skillDir, "SKILL.md"), "---\nname: langbot-testing\ndescription: Testing.\n---\n\n# Testing\n");
|
|
writeFileSync(join(tmp, "skills", ".env"), "");
|
|
writeFileSync(
|
|
join(casesDir, "json-exec.yaml"),
|
|
[
|
|
"id: json-exec",
|
|
"title: JSON Exec",
|
|
"mode: probe",
|
|
"area: qa",
|
|
"type: smoke",
|
|
"priority: p2",
|
|
"risk: low",
|
|
"ci_eligible: true",
|
|
"automation: scripts/write-marker.mjs",
|
|
].join("\n"),
|
|
);
|
|
writeFileSync(
|
|
join(scriptsDir, "write-marker.mjs"),
|
|
[
|
|
"import { writeFileSync } from 'node:fs';",
|
|
"import { join } from 'node:path';",
|
|
"writeFileSync(join(process.env.LBS_ROOT, 'json-ran.txt'), 'yes');",
|
|
].join("\n"),
|
|
);
|
|
|
|
const result = capture(() => commandTestRun({
|
|
root: tmp,
|
|
args: ["test", "run", "json-exec", "--run-id", "json-run", "--json"],
|
|
}));
|
|
|
|
assert.equal(result.code, 0);
|
|
assert.equal(readFileSync(join(tmp, "json-ran.txt"), "utf8"), "yes");
|
|
const payload = JSON.parse(result.output);
|
|
assert.equal(payload.exit_status, 0);
|
|
assert.equal(payload.automation_execution.status, "ok");
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("test run lets explicit environment override automation defaults", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-run-env-override-"));
|
|
const originalPatch = process.env.LANGBOT_E2E_RUNNER_CONFIG_PATCH_JSON;
|
|
try {
|
|
const skillDir = join(tmp, "skills", "langbot-testing");
|
|
const casesDir = join(skillDir, "cases");
|
|
const scriptsDir = join(tmp, "scripts");
|
|
mkdirSync(casesDir, { recursive: true });
|
|
mkdirSync(scriptsDir, { recursive: true });
|
|
writeFileSync(join(skillDir, "SKILL.md"), "---\nname: langbot-testing\ndescription: Testing.\n---\n\n# Testing\n");
|
|
writeFileSync(join(tmp, "skills", ".env"), "");
|
|
writeFileSync(
|
|
join(casesDir, "env-override.yaml"),
|
|
[
|
|
"id: env-override",
|
|
"title: Env Override",
|
|
"mode: agent-browser",
|
|
"area: pipeline",
|
|
"type: smoke",
|
|
"priority: p2",
|
|
"risk: low",
|
|
"ci_eligible: false",
|
|
"automation: scripts/write-env.mjs",
|
|
"automation_runner_config_patch_json: '{\"source\":\"default\"}'",
|
|
].join("\n"),
|
|
);
|
|
writeFileSync(
|
|
join(scriptsDir, "write-env.mjs"),
|
|
[
|
|
"import { writeFileSync } from 'node:fs';",
|
|
"import { join } from 'node:path';",
|
|
"writeFileSync(join(process.env.LBS_ROOT, 'env-out.json'), JSON.stringify({",
|
|
" patch: process.env.LANGBOT_E2E_RUNNER_CONFIG_PATCH_JSON,",
|
|
"}));",
|
|
].join("\n"),
|
|
);
|
|
|
|
process.env.LANGBOT_E2E_RUNNER_CONFIG_PATCH_JSON = '{"source":"explicit"}';
|
|
const result = capture(() => commandTestRun({
|
|
root: tmp,
|
|
args: ["test", "run", "env-override", "--run-id", "env-run"],
|
|
}));
|
|
|
|
assert.equal(result.code, 0);
|
|
const observed = JSON.parse(readFileSync(join(tmp, "env-out.json"), "utf8"));
|
|
assert.equal(observed.patch, '{"source":"explicit"}');
|
|
} finally {
|
|
if (originalPatch === undefined) delete process.env.LANGBOT_E2E_RUNNER_CONFIG_PATCH_JSON;
|
|
else process.env.LANGBOT_E2E_RUNNER_CONFIG_PATCH_JSON = originalPatch;
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("test run expands env references in automation defaults", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-run-env-expand-"));
|
|
try {
|
|
const skillDir = join(tmp, "skills", "langbot-testing");
|
|
const casesDir = join(skillDir, "cases");
|
|
const scriptsDir = join(tmp, "scripts");
|
|
mkdirSync(casesDir, { recursive: true });
|
|
mkdirSync(scriptsDir, { recursive: true });
|
|
writeFileSync(join(skillDir, "SKILL.md"), "---\nname: langbot-testing\ndescription: Testing.\n---\n\n# Testing\n");
|
|
writeFileSync(join(tmp, "skills", ".env"), "QA_KB_UUID=kb-from-env\nQA_MODEL_UUID=model-from-env\n");
|
|
writeFileSync(
|
|
join(casesDir, "env-expand.yaml"),
|
|
[
|
|
"id: env-expand",
|
|
"title: Env Expand",
|
|
"mode: agent-browser",
|
|
"area: pipeline",
|
|
"type: smoke",
|
|
"priority: p2",
|
|
"risk: low",
|
|
"ci_eligible: false",
|
|
"automation: scripts/write-expanded-env.mjs",
|
|
"automation_runner_config_patch_json: '{\"knowledge-bases\":[\"${QA_KB_UUID}\"],\"model\":{\"primary\":\"${QA_MODEL_UUID}\"}}'",
|
|
].join("\n"),
|
|
);
|
|
writeFileSync(
|
|
join(scriptsDir, "write-expanded-env.mjs"),
|
|
[
|
|
"import { writeFileSync } from 'node:fs';",
|
|
"import { join } from 'node:path';",
|
|
"writeFileSync(join(process.env.LBS_ROOT, 'expanded-env-out.json'), JSON.stringify({",
|
|
" patch: process.env.LANGBOT_E2E_RUNNER_CONFIG_PATCH_JSON,",
|
|
"}));",
|
|
].join("\n"),
|
|
);
|
|
|
|
const dryRun = capture(() => commandTestRun({
|
|
root: tmp,
|
|
args: ["test", "run", "env-expand", "--run-id", "env-expand-dry", "--dry-run", "--json"],
|
|
}));
|
|
assert.equal(dryRun.code, 0);
|
|
const plan = JSON.parse(dryRun.output);
|
|
assert.equal(
|
|
plan.automation.env_defaults.LANGBOT_E2E_RUNNER_CONFIG_PATCH_JSON,
|
|
'{"knowledge-bases":["kb-from-env"],"model":{"primary":"model-from-env"}}',
|
|
);
|
|
|
|
const run = capture(() => commandTestRun({
|
|
root: tmp,
|
|
args: ["test", "run", "env-expand", "--run-id", "env-expand-run"],
|
|
}));
|
|
assert.equal(run.code, 0);
|
|
const observed = JSON.parse(readFileSync(join(tmp, "expanded-env-out.json"), "utf8"));
|
|
assert.equal(observed.patch, '{"knowledge-bases":["kb-from-env"],"model":{"primary":"model-from-env"}}');
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("test run setup automation isolates evidence and reloads env", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-run-setup-automation-"));
|
|
try {
|
|
const skillDir = join(tmp, "skills", "langbot-testing");
|
|
const casesDir = join(skillDir, "cases");
|
|
const scriptsDir = join(tmp, "scripts");
|
|
mkdirSync(casesDir, { recursive: true });
|
|
mkdirSync(scriptsDir, { recursive: true });
|
|
writeFileSync(join(skillDir, "SKILL.md"), "---\nname: langbot-testing\ndescription: Testing.\n---\n\n# Testing\n");
|
|
writeFileSync(join(tmp, "skills", ".env"), "SETUP_VALUE=\n");
|
|
writeFileSync(
|
|
join(casesDir, "setup-main.yaml"),
|
|
[
|
|
"id: setup-main",
|
|
"title: Setup Main",
|
|
"mode: agent-browser",
|
|
"area: pipeline",
|
|
"type: smoke",
|
|
"priority: p2",
|
|
"risk: low",
|
|
"ci_eligible: false",
|
|
"env:",
|
|
" - SETUP_VALUE",
|
|
"setup_automation:",
|
|
" - \"node:scripts/write-setup-env.mjs --write-env\"",
|
|
"setup_provides_env:",
|
|
" - SETUP_VALUE",
|
|
"automation: scripts/read-setup-env.mjs",
|
|
].join("\n"),
|
|
);
|
|
writeFileSync(
|
|
join(casesDir, "setup-env-issue.yaml"),
|
|
[
|
|
"id: setup-env-issue",
|
|
"title: Setup Env Issue",
|
|
"mode: agent-browser",
|
|
"area: pipeline",
|
|
"type: smoke",
|
|
"priority: p2",
|
|
"risk: low",
|
|
"ci_eligible: false",
|
|
"setup_automation:",
|
|
" - \"node:scripts/write-setup-env-issue.mjs\"",
|
|
"automation: scripts/read-setup-env.mjs",
|
|
].join("\n"),
|
|
);
|
|
writeFileSync(
|
|
join(casesDir, "setup-fail-after-pass.yaml"),
|
|
[
|
|
"id: setup-fail-after-pass",
|
|
"title: Setup Fail After Pass",
|
|
"mode: agent-browser",
|
|
"area: pipeline",
|
|
"type: smoke",
|
|
"priority: p2",
|
|
"risk: low",
|
|
"ci_eligible: false",
|
|
"setup_automation:",
|
|
" - \"node:scripts/write-setup-pass-then-fail.mjs\"",
|
|
"automation: scripts/read-setup-env.mjs",
|
|
].join("\n"),
|
|
);
|
|
writeFileSync(
|
|
join(scriptsDir, "write-setup-env.mjs"),
|
|
[
|
|
"import { mkdirSync, writeFileSync } from 'node:fs';",
|
|
"import { dirname, join } from 'node:path';",
|
|
"const local = join(process.env.LBS_ROOT, 'skills', '.env.local');",
|
|
"writeFileSync(local, 'SETUP_VALUE=from-setup\\n');",
|
|
"mkdirSync(process.env.LBS_EVIDENCE_DIR, { recursive: true });",
|
|
"writeFileSync(join(process.env.LBS_EVIDENCE_DIR, 'automation-result.json'), JSON.stringify({ status: 'pass', stage: 'setup' }));",
|
|
"writeFileSync(join(process.env.LBS_EVIDENCE_DIR, 'result.json'), JSON.stringify({ status: 'pass', stage: 'setup' }));",
|
|
"writeFileSync(join(dirname(process.env.LBS_EVIDENCE_DIR), 'setup-ran.txt'), 'yes');",
|
|
].join("\n"),
|
|
);
|
|
writeFileSync(
|
|
join(scriptsDir, "read-setup-env.mjs"),
|
|
[
|
|
"import { mkdirSync, writeFileSync } from 'node:fs';",
|
|
"import { join } from 'node:path';",
|
|
"mkdirSync(process.env.LBS_EVIDENCE_DIR, { recursive: true });",
|
|
"writeFileSync(join(process.env.LBS_ROOT, 'main-observed.json'), JSON.stringify({ value: process.env.SETUP_VALUE }));",
|
|
"writeFileSync(join(process.env.LBS_EVIDENCE_DIR, 'automation-result.json'), JSON.stringify({ status: 'pass', stage: 'main' }));",
|
|
"writeFileSync(join(process.env.LBS_EVIDENCE_DIR, 'result.json'), JSON.stringify({ status: 'pass', stage: 'main' }));",
|
|
"if (process.env.SETUP_VALUE !== 'from-setup') process.exit(1);",
|
|
].join("\n"),
|
|
);
|
|
writeFileSync(
|
|
join(scriptsDir, "write-setup-env-issue.mjs"),
|
|
[
|
|
"import { mkdirSync, writeFileSync } from 'node:fs';",
|
|
"import { join } from 'node:path';",
|
|
"mkdirSync(process.env.LBS_EVIDENCE_DIR, { recursive: true });",
|
|
"writeFileSync(join(process.env.LBS_EVIDENCE_DIR, 'automation-result.json'), JSON.stringify({ status: 'env_issue', reason: 'setup env missing' }));",
|
|
"process.exit(2);",
|
|
].join("\n"),
|
|
);
|
|
writeFileSync(
|
|
join(scriptsDir, "write-setup-pass-then-fail.mjs"),
|
|
[
|
|
"import { mkdirSync, writeFileSync } from 'node:fs';",
|
|
"import { join } from 'node:path';",
|
|
"mkdirSync(process.env.LBS_EVIDENCE_DIR, { recursive: true });",
|
|
"writeFileSync(join(process.env.LBS_EVIDENCE_DIR, 'automation-result.json'), JSON.stringify({ status: 'pass', reason: 'stale pass before crash' }));",
|
|
"process.exit(1);",
|
|
].join("\n"),
|
|
);
|
|
|
|
const dryRun = capture(() => commandTestRun({
|
|
root: tmp,
|
|
args: ["test", "run", "setup-main", "--run-id", "setup-run", "--output", join(tmp, "evidence"), "--dry-run", "--json"],
|
|
}));
|
|
assert.equal(dryRun.code, 0);
|
|
const plan = JSON.parse(dryRun.output);
|
|
assert.equal(plan.setup_automation.length, 1);
|
|
assert.match(plan.setup_automation[0].evidence_dir, /setup\/01-write-setup-env$/);
|
|
assert.match(plan.setup_automation[0].command, /^node scripts\/write-setup-env\.mjs --write-env$/);
|
|
assert.equal(plan.setup_automation[0].dry_run_command, "");
|
|
assert.equal(existsSync(join(tmp, "skills", ".env.local")), false);
|
|
|
|
const run = capture(() => commandTestRun({
|
|
root: tmp,
|
|
args: ["test", "run", "setup-main", "--run-id", "setup-run", "--output", join(tmp, "evidence")],
|
|
}));
|
|
assert.equal(run.code, 0);
|
|
const observed = JSON.parse(readFileSync(join(tmp, "main-observed.json"), "utf8"));
|
|
assert.equal(observed.value, "from-setup");
|
|
const setupResult = JSON.parse(readFileSync(join(tmp, "evidence", "setup", "01-write-setup-env", "automation-result.json"), "utf8"));
|
|
const mainResult = JSON.parse(readFileSync(join(tmp, "evidence", "automation-result.json"), "utf8"));
|
|
assert.equal(setupResult.stage, "setup");
|
|
assert.equal(mainResult.stage, "main");
|
|
|
|
const envIssue = capture(() => commandTestRun({
|
|
root: tmp,
|
|
args: ["test", "run", "setup-env-issue", "--run-id", "setup-env-issue-run", "--output", join(tmp, "evidence-env-issue")],
|
|
}));
|
|
assert.equal(envIssue.code, 2);
|
|
const parentResult = JSON.parse(readFileSync(join(tmp, "evidence-env-issue", "automation-result.json"), "utf8"));
|
|
assert.equal(parentResult.status, "env_issue");
|
|
assert.equal(parentResult.reason, "setup env missing");
|
|
|
|
const failAfterPass = capture(() => commandTestRun({
|
|
root: tmp,
|
|
args: ["test", "run", "setup-fail-after-pass", "--run-id", "setup-fail-after-pass-run", "--output", join(tmp, "evidence-fail-after-pass")],
|
|
}));
|
|
assert.equal(failAfterPass.code, 1);
|
|
const failAfterPassResult = JSON.parse(readFileSync(join(tmp, "evidence-fail-after-pass", "automation-result.json"), "utf8"));
|
|
assert.equal(failAfterPassResult.status, "fail");
|
|
assert.equal(failAfterPassResult.reason, "stale pass before crash");
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("test run setup automation can execute another case outside this source repo", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-run-setup-case-"));
|
|
try {
|
|
const skillDir = join(tmp, "skills", "langbot-testing");
|
|
const casesDir = join(skillDir, "cases");
|
|
const scriptsDir = join(tmp, "scripts");
|
|
mkdirSync(casesDir, { recursive: true });
|
|
mkdirSync(scriptsDir, { recursive: true });
|
|
writeFileSync(join(skillDir, "SKILL.md"), "---\nname: langbot-testing\ndescription: Testing.\n---\n\n# Testing\n");
|
|
writeFileSync(join(tmp, "skills", ".env"), "SETUP_VALUE=\n");
|
|
writeFileSync(
|
|
join(casesDir, "setup-child.yaml"),
|
|
[
|
|
"id: setup-child",
|
|
"title: Setup Child",
|
|
"mode: probe",
|
|
"area: qa",
|
|
"type: smoke",
|
|
"priority: p2",
|
|
"risk: low",
|
|
"ci_eligible: true",
|
|
"automation: scripts/write-child-env.mjs",
|
|
].join("\n"),
|
|
);
|
|
writeFileSync(
|
|
join(casesDir, "setup-parent.yaml"),
|
|
[
|
|
"id: setup-parent",
|
|
"title: Setup Parent",
|
|
"mode: probe",
|
|
"area: qa",
|
|
"type: smoke",
|
|
"priority: p2",
|
|
"risk: low",
|
|
"ci_eligible: true",
|
|
"setup_automation:",
|
|
" - \"case:setup-child\"",
|
|
"setup_provides_env:",
|
|
" - SETUP_VALUE",
|
|
"automation: scripts/read-child-env.mjs",
|
|
].join("\n"),
|
|
);
|
|
writeFileSync(
|
|
join(scriptsDir, "write-child-env.mjs"),
|
|
[
|
|
"import { mkdirSync, writeFileSync } from 'node:fs';",
|
|
"import { join } from 'node:path';",
|
|
"writeFileSync(join(process.env.LBS_ROOT, 'skills', '.env.local'), 'SETUP_VALUE=from-child\\n');",
|
|
"mkdirSync(process.env.LBS_EVIDENCE_DIR, { recursive: true });",
|
|
"writeFileSync(join(process.env.LBS_EVIDENCE_DIR, 'automation-result.json'), JSON.stringify({ status: 'pass' }));",
|
|
"writeFileSync(join(process.env.LBS_EVIDENCE_DIR, 'result.json'), JSON.stringify({ status: 'pass' }));",
|
|
].join("\n"),
|
|
);
|
|
writeFileSync(
|
|
join(scriptsDir, "read-child-env.mjs"),
|
|
[
|
|
"import { mkdirSync, writeFileSync } from 'node:fs';",
|
|
"import { join } from 'node:path';",
|
|
"mkdirSync(process.env.LBS_EVIDENCE_DIR, { recursive: true });",
|
|
"writeFileSync(join(process.env.LBS_EVIDENCE_DIR, 'automation-result.json'), JSON.stringify({ status: 'pass', value: process.env.SETUP_VALUE }));",
|
|
"writeFileSync(join(process.env.LBS_EVIDENCE_DIR, 'result.json'), JSON.stringify({ status: 'pass', value: process.env.SETUP_VALUE }));",
|
|
"if (process.env.SETUP_VALUE !== 'from-child') process.exit(1);",
|
|
].join("\n"),
|
|
);
|
|
|
|
const run = capture(() => commandTestRun({
|
|
root: tmp,
|
|
args: ["test", "run", "setup-parent", "--run-id", "setup-parent-run", "--output", join(tmp, "evidence")],
|
|
}));
|
|
|
|
assert.equal(run.code, 0);
|
|
assert.ok(existsSync(join(tmp, "evidence", "setup", "01-setup-child", "result.json")));
|
|
const result = JSON.parse(readFileSync(join(tmp, "evidence", "automation-result.json"), "utf8"));
|
|
assert.equal(result.value, "from-child");
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("test run automation inherits parent process environment", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-run-env-inherit-"));
|
|
try {
|
|
const skillDir = join(tmp, "skills", "langbot-testing");
|
|
const casesDir = join(skillDir, "cases");
|
|
const scriptsDir = join(tmp, "scripts");
|
|
mkdirSync(casesDir, { recursive: true });
|
|
mkdirSync(scriptsDir, { recursive: true });
|
|
writeFileSync(join(skillDir, "SKILL.md"), "---\nname: langbot-testing\ndescription: Testing.\n---\n\n# Testing\n");
|
|
writeFileSync(join(tmp, "skills", ".env"), "");
|
|
writeFileSync(
|
|
join(casesDir, "env-inherit.yaml"),
|
|
[
|
|
"id: env-inherit",
|
|
"title: Env Inherit",
|
|
"mode: probe",
|
|
"area: qa",
|
|
"type: smoke",
|
|
"priority: p2",
|
|
"risk: low",
|
|
"ci_eligible: true",
|
|
"automation: scripts/read-path.mjs",
|
|
].join("\n"),
|
|
);
|
|
writeFileSync(
|
|
join(scriptsDir, "read-path.mjs"),
|
|
[
|
|
"import { mkdirSync, writeFileSync } from 'node:fs';",
|
|
"import { join } from 'node:path';",
|
|
"mkdirSync(process.env.LBS_EVIDENCE_DIR, { recursive: true });",
|
|
"writeFileSync(join(process.env.LBS_EVIDENCE_DIR, 'automation-result.json'), JSON.stringify({ status: process.env.PATH ? 'pass' : 'fail' }));",
|
|
"process.exit(process.env.PATH ? 0 : 1);",
|
|
].join("\n"),
|
|
);
|
|
|
|
const run = capture(() => commandTestRun({
|
|
root: tmp,
|
|
args: ["test", "run", "env-inherit", "--run-id", "env-inherit-run", "--output", join(tmp, "evidence")],
|
|
}));
|
|
|
|
assert.equal(run.code, 0);
|
|
const result = JSON.parse(readFileSync(join(tmp, "evidence", "automation-result.json"), "utf8"));
|
|
assert.equal(result.status, "pass");
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("test run dry-run marks missing setup case targets", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-run-setup-missing-case-"));
|
|
try {
|
|
const skillDir = join(tmp, "skills", "langbot-testing");
|
|
const casesDir = join(skillDir, "cases");
|
|
const scriptsDir = join(tmp, "scripts");
|
|
mkdirSync(casesDir, { recursive: true });
|
|
mkdirSync(scriptsDir, { recursive: true });
|
|
writeFileSync(join(skillDir, "SKILL.md"), "---\nname: langbot-testing\ndescription: Testing.\n---\n\n# Testing\n");
|
|
writeFileSync(join(tmp, "skills", ".env"), "");
|
|
writeFileSync(
|
|
join(casesDir, "setup-parent.yaml"),
|
|
[
|
|
"id: setup-parent",
|
|
"title: Setup Parent",
|
|
"mode: probe",
|
|
"area: qa",
|
|
"type: smoke",
|
|
"priority: p2",
|
|
"risk: low",
|
|
"ci_eligible: true",
|
|
"setup_automation:",
|
|
" - \"case:missing-child\"",
|
|
"automation: scripts/pass.mjs",
|
|
].join("\n"),
|
|
);
|
|
writeFileSync(join(scriptsDir, "pass.mjs"), "process.exit(0);\n");
|
|
|
|
const result = capture(() => commandTestRun({
|
|
root: tmp,
|
|
args: ["test", "run", "setup-parent", "--dry-run", "--json"],
|
|
}));
|
|
|
|
assert.equal(result.code, 0);
|
|
const run = JSON.parse(result.output);
|
|
assert.equal(run.setup_automation[0].entry, "case:missing-child");
|
|
assert.doesNotMatch(run.setup_automation[0].command, /--dry-run/);
|
|
assert.match(run.setup_automation[0].dry_run_command, /--dry-run/);
|
|
assert.equal(run.setup_automation[0].exists, false);
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("local-agent effective prompt case has runnable automation defaults", () => {
|
|
const result = capture(() => commandTestRun(ctx([
|
|
"test",
|
|
"run",
|
|
"local-agent-effective-prompt-debug-chat",
|
|
"--run-id",
|
|
"effective-run",
|
|
"--dry-run",
|
|
"--json",
|
|
])));
|
|
assert.equal(result.code, 0);
|
|
const run = JSON.parse(result.output);
|
|
assert.equal(run.automation.script, "scripts/e2e/pipeline-debug-chat.mjs");
|
|
assert.equal(run.automation.env_defaults.LANGBOT_E2E_PROMPT, "qa-effective-prompt");
|
|
assert.equal(run.automation.env_defaults.LANGBOT_E2E_EXPECTED_TEXT, "PROMPT_PREPROCESS_OK");
|
|
assert.equal(run.automation.env_defaults.LANGBOT_E2E_RESPONSE_TIMEOUT_MS, "180000");
|
|
assert.equal(run.automation.pipeline_env_required, true);
|
|
assert.ok(run.automation.env_aliases.some((alias: { target: string; source: string }) => (
|
|
alias.target === "LANGBOT_E2E_PIPELINE_URL" && alias.source === "LANGBOT_LOCAL_AGENT_PIPELINE_URL"
|
|
)));
|
|
});
|
|
|
|
test("local-agent basic case can setup the local-agent pipeline env", () => {
|
|
withEnv({
|
|
LANGBOT_BROWSER_PROFILE: "/tmp/langbot-test-profile",
|
|
LANGBOT_CHROMIUM_EXECUTABLE: "/tmp/langbot-test-chromium",
|
|
}, () => {
|
|
const result = capture(() => commandTestRun(ctx([
|
|
"test",
|
|
"run",
|
|
"local-agent-basic-debug-chat",
|
|
"--dry-run",
|
|
"--json",
|
|
])));
|
|
assert.equal(result.code, 0);
|
|
const run = JSON.parse(result.output);
|
|
assert.deepEqual(run.setup_automation.map((item: { entry: string }) => item.entry), [
|
|
"node:scripts/e2e/ensure-local-agent-pipeline.mjs --write-env",
|
|
]);
|
|
|
|
const planResult = capture(() => commandTestPlan(ctx(["test", "plan", "local-agent-basic-debug-chat", "--json"])));
|
|
assert.equal(planResult.code, 0);
|
|
const plan = JSON.parse(planResult.output);
|
|
assert.deepEqual(plan.setup_provides_env, [
|
|
"LANGBOT_LOCAL_AGENT_PIPELINE_URL",
|
|
"LANGBOT_LOCAL_AGENT_PIPELINE_NAME",
|
|
]);
|
|
assert.equal(plan.automation_readiness.status, "ready");
|
|
});
|
|
});
|
|
|
|
test("local-agent nonstreaming case disables stream output through automation defaults", () => {
|
|
const result = capture(() => commandTestRun(ctx([
|
|
"test",
|
|
"run",
|
|
"local-agent-nonstreaming-debug-chat",
|
|
"--dry-run",
|
|
"--json",
|
|
])));
|
|
assert.equal(result.code, 0);
|
|
const run = JSON.parse(result.output);
|
|
assert.equal(run.automation.script, "scripts/e2e/pipeline-debug-chat.mjs");
|
|
assert.equal(run.automation.env_defaults.LANGBOT_E2E_PROMPT, "Reply only NONSTREAM_OK.");
|
|
assert.equal(run.automation.env_defaults.LANGBOT_E2E_EXPECTED_TEXT, "NONSTREAM_OK");
|
|
assert.equal(run.automation.env_defaults.LANGBOT_E2E_STREAM_OUTPUT, "0");
|
|
assert.equal(run.automation.pipeline_env_required, true);
|
|
});
|
|
|
|
test("local-agent multimodal case exposes image fixture automation defaults", () => {
|
|
const result = capture(() => commandTestRun(ctx([
|
|
"test",
|
|
"run",
|
|
"local-agent-multimodal-debug-chat",
|
|
"--dry-run",
|
|
"--json",
|
|
])));
|
|
assert.equal(result.code, 0);
|
|
const run = JSON.parse(result.output);
|
|
assert.equal(run.automation.script, "scripts/e2e/pipeline-debug-chat.mjs");
|
|
assert.equal(run.automation.env_defaults.LANGBOT_E2E_EXPECTED_TEXT, "IMAGE_OK");
|
|
assert.match(run.automation.env_defaults.LANGBOT_E2E_IMAGE_BASE64_PATH, /red-square\.png\.base64$/);
|
|
assert.equal(run.automation.pipeline_env_required, true);
|
|
});
|
|
|
|
test("MCP stdio case passes case-specific failure signals to automation defaults", () => {
|
|
const result = capture(() => commandTestRun(ctx([
|
|
"test",
|
|
"run",
|
|
"mcp-stdio-tool-call",
|
|
"--dry-run",
|
|
"--json",
|
|
])));
|
|
assert.equal(result.code, 0);
|
|
const run = JSON.parse(result.output);
|
|
assert.match(run.automation.env_defaults.LANGBOT_E2E_FAILURE_SIGNALS, /qa-plugin-smoke:mcp-ok-local-agent/);
|
|
assert.match(run.automation.env_defaults.LANGBOT_E2E_FAILURE_SIGNALS, /model_not_found/);
|
|
});
|
|
|
|
test("MCP stdio tool-call case setups pipeline and registered MCP server", () => {
|
|
const result = capture(() => commandTestRun(ctx([
|
|
"test",
|
|
"run",
|
|
"mcp-stdio-tool-call",
|
|
"--dry-run",
|
|
"--json",
|
|
])));
|
|
assert.equal(result.code, 0);
|
|
const run = JSON.parse(result.output);
|
|
assert.deepEqual(run.setup_automation.map((item: { entry: string }) => item.entry), [
|
|
"node:scripts/e2e/ensure-local-agent-pipeline.mjs --write-env",
|
|
"case:mcp-stdio-register",
|
|
]);
|
|
|
|
const planResult = capture(() => commandTestPlan(ctx(["test", "plan", "mcp-stdio-tool-call", "--json"])));
|
|
assert.equal(planResult.code, 0);
|
|
const plan = JSON.parse(planResult.output);
|
|
assert.deepEqual(plan.setup_provides_env, [
|
|
"LANGBOT_LOCAL_AGENT_PIPELINE_URL",
|
|
"LANGBOT_LOCAL_AGENT_PIPELINE_NAME",
|
|
]);
|
|
assert.ok(!plan.preconditions.some((item: string) => item.includes("points to the local-agent pipeline")));
|
|
});
|
|
|
|
test("generic pipeline automation can still use the shared pipeline env", () => {
|
|
const result = capture(() => commandTestRun(ctx([
|
|
"test",
|
|
"run",
|
|
"pipeline-debug-chat",
|
|
"--dry-run",
|
|
"--json",
|
|
])));
|
|
assert.equal(result.code, 0);
|
|
const run = JSON.parse(result.output);
|
|
assert.equal(run.automation.pipeline_env_required, false);
|
|
assert.deepEqual(run.automation.env_aliases, []);
|
|
assert.ok(run.automation.required_env.includes("LANGBOT_PIPELINE_URL|LANGBOT_PIPELINE_NAME"));
|
|
});
|
|
|
|
test("AgentRunner live install case exposes package automation defaults", () => {
|
|
const result = capture(() => commandTestRun(ctx([
|
|
"test",
|
|
"run",
|
|
"agent-runner-live-install",
|
|
"--dry-run",
|
|
"--json",
|
|
])));
|
|
assert.equal(result.code, 0);
|
|
const run = JSON.parse(result.output);
|
|
assert.equal(
|
|
run.automation.env_defaults.LANGBOT_E2E_PLUGIN_PACKAGE,
|
|
"skills/langbot-testing/fixtures/plugins/qa-agent-runner/dist/qa-agent-runner-0.1.0.lbpkg",
|
|
);
|
|
assert.equal(run.automation.env_defaults.LANGBOT_E2E_EXPECTED_PLUGIN_ID, "qa/agent-runner");
|
|
assert.equal(run.automation.env_defaults.LANGBOT_E2E_EXPECTED_RUNNER_ID, "plugin:qa/agent-runner/default");
|
|
});
|
|
|
|
test("QA plugin live install checks the fixture package before installed state", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-install-qa-plugin-"));
|
|
try {
|
|
const result = spawnSync(
|
|
process.execPath,
|
|
[join(root, "scripts/e2e/install-qa-plugin-smoke.mjs")],
|
|
{
|
|
cwd: root,
|
|
env: {
|
|
...process.env,
|
|
LBS_RUN_ID: "missing-package",
|
|
LBS_EVIDENCE_DIR: join(tmp, "evidence"),
|
|
LANGBOT_BACKEND_URL: "http://127.0.0.1:59999",
|
|
LANGBOT_E2E_LOGIN_USER: "qa@example.test",
|
|
LANGBOT_E2E_PLUGIN_PACKAGE: join(tmp, "missing.lbpkg"),
|
|
},
|
|
encoding: "utf8",
|
|
},
|
|
);
|
|
assert.equal(result.status, 1);
|
|
const output = JSON.parse(result.stdout);
|
|
assert.match(output.reason, /missing\.lbpkg/);
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("AgentRunner QA Debug Chat case uses dedicated pipeline env", () => {
|
|
const result = capture(() => commandTestRun(ctx([
|
|
"test",
|
|
"run",
|
|
"agent-runner-qa-debug-chat",
|
|
"--dry-run",
|
|
"--json",
|
|
])));
|
|
assert.equal(result.code, 0);
|
|
const run = JSON.parse(result.output);
|
|
assert.equal(run.automation.script, "scripts/e2e/pipeline-debug-chat.mjs");
|
|
assert.equal(run.automation.pipeline_env_required, true);
|
|
assert.equal(run.automation.env_defaults.LANGBOT_E2E_EXPECTED_RUNNER_ID, "plugin:qa/agent-runner/default");
|
|
assert.deepEqual(
|
|
run.setup_automation.map((item: { entry: string }) => item.entry),
|
|
[
|
|
"case:agent-runner-live-install",
|
|
"node:scripts/e2e/ensure-qa-agent-runner-pipeline.mjs --write-env",
|
|
],
|
|
);
|
|
assert.ok(run.automation.env_aliases.some((alias: { target: string; source: string }) => (
|
|
alias.target === "LANGBOT_E2E_PIPELINE_URL" && alias.source === "LANGBOT_QA_AGENT_RUNNER_PIPELINE_URL"
|
|
)));
|
|
});
|
|
|
|
test("AgentRunner QA Debug Chat setup automation removes manual readiness", () => {
|
|
withEnv({
|
|
LANGBOT_BROWSER_PROFILE: "/tmp/langbot-test-profile",
|
|
LANGBOT_CHROMIUM_EXECUTABLE: "/tmp/langbot-test-chromium",
|
|
}, () => {
|
|
const planResult = capture(() => commandTestPlan(ctx(["test", "plan", "agent-runner-qa-debug-chat", "--json"])));
|
|
assert.equal(planResult.code, 0);
|
|
const plan = JSON.parse(planResult.output);
|
|
assert.equal(plan.manual_readiness.status, "not_required");
|
|
assert.deepEqual(plan.setup_provides_env, [
|
|
"LANGBOT_QA_AGENT_RUNNER_PIPELINE_URL",
|
|
"LANGBOT_QA_AGENT_RUNNER_PIPELINE_NAME",
|
|
]);
|
|
assert.equal(plan.automation_readiness.status, "ready");
|
|
|
|
const suiteResult = capture(() => commandSuitePlan(ctx(["suite", "plan", "agent-runner-release-gate", "--json"])));
|
|
assert.equal(suiteResult.code, 0);
|
|
const suite = JSON.parse(suiteResult.output);
|
|
assert.ok(!suite.readiness.manual_check_cases.includes("agent-runner-qa-debug-chat"));
|
|
});
|
|
});
|
|
|
|
test("ACP AgentRunner Debug Chat case setups the ACP pipeline env", () => {
|
|
const result = capture(() => commandTestRun(ctx([
|
|
"test",
|
|
"run",
|
|
"acp-agent-runner-debug-chat",
|
|
"--dry-run",
|
|
"--json",
|
|
])));
|
|
assert.equal(result.code, 0);
|
|
const run = JSON.parse(result.output);
|
|
assert.deepEqual(run.setup_automation.map((item: { entry: string }) => item.entry), [
|
|
"node:scripts/e2e/ensure-acp-agent-runner-pipeline.mjs --write-env",
|
|
]);
|
|
assert.ok(run.automation.env_aliases.some((alias: { target: string; source: string }) => (
|
|
alias.target === "LANGBOT_E2E_PIPELINE_URL" && alias.source === "LANGBOT_ACP_AGENT_RUNNER_PIPELINE_URL"
|
|
)));
|
|
|
|
const planResult = capture(() => commandTestPlan(ctx(["test", "plan", "acp-agent-runner-debug-chat", "--json"])));
|
|
assert.equal(planResult.code, 0);
|
|
const plan = JSON.parse(planResult.output);
|
|
assert.deepEqual(plan.setup_provides_env, [
|
|
"LANGBOT_ACP_AGENT_RUNNER_PIPELINE_URL",
|
|
"LANGBOT_ACP_AGENT_RUNNER_PIPELINE_NAME",
|
|
]);
|
|
assert.ok(!plan.preconditions.some((item: string) => item.includes("pipeline AI runner")));
|
|
});
|
|
|
|
test("local-agent plugin cases setup the QA plugin smoke fixture", () => {
|
|
const result = capture(() => commandTestRun(ctx([
|
|
"test",
|
|
"run",
|
|
"local-agent-plugin-tool-call-debug-chat",
|
|
"--dry-run",
|
|
"--json",
|
|
])));
|
|
assert.equal(result.code, 0);
|
|
const run = JSON.parse(result.output);
|
|
assert.deepEqual(run.setup_automation.map((item: { entry: string }) => item.entry), [
|
|
"node:scripts/e2e/ensure-local-agent-pipeline.mjs --write-env",
|
|
"case:qa-plugin-smoke-live-install",
|
|
]);
|
|
});
|
|
|
|
test("local-agent RAG case only requires the KB fixture env", () => {
|
|
const result = capture(() => commandTestRun(ctx([
|
|
"test",
|
|
"run",
|
|
"local-agent-rag-debug-chat",
|
|
"--dry-run",
|
|
"--json",
|
|
])));
|
|
assert.equal(result.code, 0);
|
|
const run = JSON.parse(result.output);
|
|
assert.ok(run.automation.required_env.includes("LANGBOT_LOCAL_AGENT_RAG_KB_UUID"));
|
|
assert.ok(!run.automation.required_env.includes("LANGBOT_LOCAL_AGENT_RAG_TEXT_MODEL_UUID"));
|
|
assert.equal(
|
|
run.automation.env_defaults.LANGBOT_E2E_RUNNER_CONFIG_PATCH_JSON,
|
|
JSON.stringify({
|
|
"knowledge-bases": [
|
|
loadEnv(root).LANGBOT_LOCAL_AGENT_RAG_KB_UUID || "",
|
|
],
|
|
}),
|
|
);
|
|
});
|
|
|
|
test("LangRAG retrieve readiness requires a KB UUID alternative", () => {
|
|
const result = capture(() => commandTestPlan(ctx(["test", "plan", "langrag-kb-retrieve", "--json"])));
|
|
assert.equal(result.code, 0);
|
|
const plan = JSON.parse(result.output);
|
|
assert.ok(plan.automation_readiness.required.includes("LANGBOT_LOCAL_AGENT_RAG_KB_UUID|LANGBOT_RAG_KB_UUID"));
|
|
});
|
|
|
|
test("local-agent RAG multimodal case setups the KB fixture env", () => {
|
|
const result = capture(() => commandTestRun(ctx([
|
|
"test",
|
|
"run",
|
|
"local-agent-rag-multimodal-debug-chat",
|
|
"--dry-run",
|
|
"--json",
|
|
])));
|
|
assert.equal(result.code, 0);
|
|
const run = JSON.parse(result.output);
|
|
assert.ok(run.automation.required_env.includes("LANGBOT_LOCAL_AGENT_RAG_KB_UUID"));
|
|
assert.equal(
|
|
run.automation.env_defaults.LANGBOT_E2E_RUNNER_CONFIG_PATCH_JSON,
|
|
JSON.stringify({
|
|
"knowledge-bases": [
|
|
loadEnv(root).LANGBOT_LOCAL_AGENT_RAG_KB_UUID || "",
|
|
],
|
|
}),
|
|
);
|
|
assert.deepEqual(run.setup_automation.map((item: { entry: string }) => item.entry), [
|
|
"node:scripts/e2e/ensure-local-agent-pipeline.mjs --write-env",
|
|
"node:scripts/e2e/ensure-langrag-sentinel-kb.mjs --write-env",
|
|
]);
|
|
});
|
|
|
|
test("test report renders a reusable evidence template", () => {
|
|
const result = capture(() => commandTestReport(ctx(["test", "report", "pipeline-debug-chat", "--no-auto-log"])));
|
|
assert.equal(result.code, 0);
|
|
assert.match(result.output, /^# Test Report: pipeline-debug-chat/m);
|
|
assert.match(result.output, /result: pass \| fail \| blocked \| env_issue \| flaky/);
|
|
assert.match(result.output, /## Log Guard/);
|
|
assert.match(result.output, /## Automation Result/);
|
|
assert.match(result.output, /## Required Evidence/);
|
|
assert.match(result.output, /no log files provided/);
|
|
});
|
|
|
|
test("validate rejects dangling case references and missing automation scripts", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-validate-strict-"));
|
|
try {
|
|
const schemasDir = join(tmp, "schemas");
|
|
const skillsDir = join(tmp, "skills");
|
|
const envSetupDir = join(skillsDir, "langbot-env-setup");
|
|
const testingDir = join(skillsDir, "langbot-testing");
|
|
mkdirSync(schemasDir, { recursive: true });
|
|
mkdirSync(join(testingDir, "cases"), { recursive: true });
|
|
mkdirSync(join(testingDir, "fixtures"), { recursive: true });
|
|
mkdirSync(join(testingDir, "suites"), { recursive: true });
|
|
mkdirSync(envSetupDir, { recursive: true });
|
|
for (const schemaName of ["case.schema.json", "suite.schema.json", "troubleshooting.schema.json", "skill-index.schema.json"]) {
|
|
writeFileSync(join(schemasDir, schemaName), "{}");
|
|
}
|
|
writeFileSync(join(envSetupDir, "SKILL.md"), "---\nname: langbot-env-setup\ndescription: Env setup.\n---\n\n# Env\n");
|
|
writeFileSync(join(testingDir, "SKILL.md"), "---\nname: langbot-testing\ndescription: Testing.\n---\n\n# Testing\n");
|
|
writeFileSync(
|
|
join(skillsDir, ".env"),
|
|
[
|
|
"LANGBOT_FRONTEND_URL=http://127.0.0.1:3000",
|
|
"LANGBOT_BACKEND_URL=http://127.0.0.1:5300",
|
|
"LANGBOT_DEV_FRONTEND_URL=http://127.0.0.1:3000",
|
|
"LANGBOT_REPO=/tmp/langbot",
|
|
"LANGBOT_WEB_REPO=/tmp/langbot/web",
|
|
"LANGBOT_BROWSER_PROFILE=/tmp/browser",
|
|
"LANGBOT_CHROMIUM_EXECUTABLE=/tmp/chromium",
|
|
"LANGBOT_PROXY_HTTP=http://127.0.0.1:7890",
|
|
"LANGBOT_PROXY_SOCKS=socks5://127.0.0.1:7890",
|
|
"LANGBOT_NO_PROXY=localhost,127.0.0.1,::1",
|
|
].join("\n"),
|
|
);
|
|
writeFileSync(
|
|
join(testingDir, "cases", "bad.yaml"),
|
|
[
|
|
"id: bad",
|
|
"title: Bad",
|
|
"mode: agent-browser",
|
|
"area: pipeline",
|
|
"type: smoke",
|
|
"priority: p9",
|
|
"risk: medium",
|
|
"ci_eligible: false",
|
|
"tags:",
|
|
" - smoke",
|
|
"skills:",
|
|
" - langbot-env-setup",
|
|
" - langbot-testing",
|
|
"env:",
|
|
" - LANGBOT_FRONTEND_URL",
|
|
"automation: scripts/e2e/missing.mjs",
|
|
"setup_provides_env:",
|
|
" - LANGBOT_PIPELINE_URL",
|
|
"steps:",
|
|
" - Open UI.",
|
|
"checks:",
|
|
" - UI works.",
|
|
"evidence_required:",
|
|
" - ui",
|
|
"troubleshooting:",
|
|
" - missing-trouble",
|
|
].join("\n"),
|
|
);
|
|
for (const [id, target] of [["cycle-a", "cycle-b"], ["cycle-b", "cycle-a"]]) {
|
|
writeFileSync(
|
|
join(testingDir, "cases", `${id}.yaml`),
|
|
[
|
|
`id: ${id}`,
|
|
`title: ${id}`,
|
|
"mode: probe",
|
|
"area: qa",
|
|
"type: smoke",
|
|
"priority: p2",
|
|
"risk: low",
|
|
"ci_eligible: true",
|
|
"tags:",
|
|
" - smoke",
|
|
"skills:",
|
|
" - langbot-testing",
|
|
"setup_automation:",
|
|
` - \"case:${target}\"`,
|
|
"steps:",
|
|
" - Run probe.",
|
|
"checks:",
|
|
" - Probe works.",
|
|
"evidence_required:",
|
|
" - filesystem",
|
|
].join("\n"),
|
|
);
|
|
}
|
|
writeFileSync(
|
|
join(testingDir, "suites", "bad-suite.yaml"),
|
|
[
|
|
"id: bad-suite",
|
|
"title: Bad Suite",
|
|
"description: Bad suite for strict validation.",
|
|
"type: release_gate",
|
|
"priority: p1",
|
|
"tags:",
|
|
" - gate",
|
|
"cases:",
|
|
" - missing-case",
|
|
].join("\n"),
|
|
);
|
|
writeFileSync(
|
|
join(testingDir, "fixtures", "fixtures.json"),
|
|
JSON.stringify([{ id: "bad-fixture", title: "Bad Fixture", path: "fixtures/missing.txt", related_cases: ["missing-case"] }]),
|
|
);
|
|
|
|
const result = captureAll(() => commandValidate(tmp));
|
|
|
|
assert.equal(result.code, 1);
|
|
assert.match(result.error, /priority/);
|
|
assert.match(result.error, /missing-trouble/);
|
|
assert.match(result.error, /missing-case/);
|
|
assert.match(result.error, /bad-fixture/);
|
|
assert.match(result.error, /automation script does not exist/);
|
|
assert.match(result.error, /setup_provides_env/);
|
|
assert.match(result.error, /setup_automation case cycle detected/);
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("test report JSON scans logs and redacts secrets", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-report-"));
|
|
try {
|
|
const logPath = join(tmp, "backend.log");
|
|
writeFileSync(
|
|
logPath,
|
|
[
|
|
"INFO request started",
|
|
"Action invoke_llm_stream call timed out",
|
|
"Traceback (most recent call last):",
|
|
"API_KEY=sk-test-secret",
|
|
].join("\n"),
|
|
);
|
|
|
|
const result = capture(() => commandTestReport(ctx(["test", "report", "pipeline-debug-chat", "--backend-log", logPath, "--json"])));
|
|
assert.equal(result.code, 0);
|
|
assert.doesNotMatch(result.output, /sk-test-secret/);
|
|
|
|
const report = JSON.parse(result.output);
|
|
assert.equal(report.log_guard.status, "fail");
|
|
assert.ok(report.log_guard.findings.some((finding: { kind: string }) => (
|
|
finding.kind === "case_failure_pattern"
|
|
)));
|
|
assert.ok(report.log_guard.findings.some((finding: { troubleshooting_id?: string }) => (
|
|
finding.troubleshooting_id === "plugin-runtime-timeout"
|
|
)));
|
|
assert.ok(report.log_guard.findings.some((finding: { kind: string }) => finding.kind === "python_traceback"));
|
|
|
|
const secretFinding = report.log_guard.findings.find((finding: { kind: string }) => finding.kind === "secret_leak");
|
|
assert.ok(secretFinding);
|
|
assert.match(secretFinding.excerpt, /\[redacted\]/);
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("test report does not treat invalid api key wording as a secret leak", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-report-api-key-wording-"));
|
|
try {
|
|
const logPath = join(tmp, "backend.log");
|
|
writeFileSync(
|
|
logPath,
|
|
"RequesterError: 模型请求失败: 无效的 api-key: Error code: 401 - invalid api key\n",
|
|
);
|
|
|
|
const result = capture(() => commandTestReport(ctx(["test", "report", "mcp-stdio-tool-call", "--backend-log", logPath, "--json"])));
|
|
assert.equal(result.code, 0);
|
|
assert.match(result.output, /api-key: Error code/);
|
|
|
|
const report = JSON.parse(result.output);
|
|
assert.ok(!report.log_guard.findings.some((finding: { kind: string }) => finding.kind === "secret_leak"));
|
|
assert.ok(report.log_guard.findings.some((finding: { troubleshooting_id?: string }) => (
|
|
finding.troubleshooting_id === "local-agent-model-route-unavailable"
|
|
)));
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("test report records declared success signals from logs", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-report-success-"));
|
|
try {
|
|
const logPath = join(tmp, "backend.log");
|
|
writeFileSync(
|
|
logPath,
|
|
[
|
|
"[05-21 10:31:00.000] websocket.py (1) - [INFO] : Processing request from person_websocket",
|
|
"[05-21 10:31:01.000] runner.py (2) - [INFO] : Conversation(0) Streaming completed",
|
|
].join("\n"),
|
|
);
|
|
|
|
const result = capture(() => commandTestReport(ctx([
|
|
"test",
|
|
"report",
|
|
"pipeline-debug-chat",
|
|
"--backend-log",
|
|
logPath,
|
|
"--json",
|
|
])));
|
|
assert.equal(result.code, 0);
|
|
const report = JSON.parse(result.output);
|
|
assert.equal(report.log_guard.status, "pass");
|
|
assert.equal(report.log_guard.success_signals.length, 2);
|
|
assert.ok(report.log_guard.success_signals.some((signal: { pattern: string }) => (
|
|
signal.pattern === "Streaming completed"
|
|
)));
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("test report warns when declared success signals are missing", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-report-missing-success-"));
|
|
try {
|
|
const logPath = join(tmp, "backend.log");
|
|
writeFileSync(logPath, "INFO request started\nINFO request ended\n");
|
|
|
|
const result = capture(() => commandTestReport(ctx([
|
|
"test",
|
|
"report",
|
|
"pipeline-debug-chat",
|
|
"--backend-log",
|
|
logPath,
|
|
"--json",
|
|
])));
|
|
assert.equal(result.code, 0);
|
|
const report = JSON.parse(result.output);
|
|
assert.equal(report.log_guard.status, "warning");
|
|
assert.ok(report.log_guard.findings.some((finding: { kind: string }) => (
|
|
finding.kind === "missing_success_signal"
|
|
)));
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("test report can limit log guard to tail lines", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-report-tail-"));
|
|
try {
|
|
const logPath = join(tmp, "backend.log");
|
|
writeFileSync(
|
|
logPath,
|
|
[
|
|
"ERROR old failure outside scan window",
|
|
"INFO middle",
|
|
"Action invoke_llm_stream call timed out",
|
|
"API_KEY=sk-tail-secret",
|
|
].join("\n"),
|
|
);
|
|
|
|
const result = capture(() => commandTestReport(ctx([
|
|
"test",
|
|
"report",
|
|
"pipeline-debug-chat",
|
|
"--backend-log",
|
|
logPath,
|
|
"--tail-lines",
|
|
"2",
|
|
"--json",
|
|
])));
|
|
assert.equal(result.code, 0);
|
|
const report = JSON.parse(result.output);
|
|
assert.equal(report.log_guard.scan.mode, "tail-lines");
|
|
assert.equal(report.log_guard.scan.tail_lines, 2);
|
|
assert.equal(report.log_guard.sources[0].line_count, 2);
|
|
assert.equal(report.log_guard.sources[0].start_line, 3);
|
|
assert.ok(report.log_guard.findings.some((finding: { troubleshooting_id?: string }) => (
|
|
finding.troubleshooting_id === "plugin-runtime-timeout"
|
|
)));
|
|
assert.ok(!report.log_guard.findings.some((finding: { kind: string; excerpt?: string }) => (
|
|
finding.kind === "error_log" && finding.excerpt?.includes("old failure")
|
|
)));
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("test report can limit log guard with since timestamp", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-report-since-"));
|
|
try {
|
|
const logPath = join(tmp, "backend.log");
|
|
writeFileSync(
|
|
logPath,
|
|
[
|
|
"[05-21 09:59:00.000] old.py (1) - [ERROR] : old failure outside scan window",
|
|
"[05-21 10:31:00.000] runner.py (2) - [ERROR] : Action invoke_llm_stream call timed out",
|
|
"Traceback continuation should stay with the matching timestamp block",
|
|
"[05-21 10:32:00.000] secrets.py (3) - [INFO] : API_KEY=sk-since-secret",
|
|
].join("\n"),
|
|
);
|
|
|
|
const result = capture(() => commandTestReport(ctx([
|
|
"test",
|
|
"report",
|
|
"pipeline-debug-chat",
|
|
"--backend-log",
|
|
logPath,
|
|
"--since",
|
|
"2026-05-21T10:30:00+08:00",
|
|
"--json",
|
|
])));
|
|
assert.equal(result.code, 0);
|
|
const report = JSON.parse(result.output);
|
|
assert.equal(report.log_guard.scan.mode, "since");
|
|
assert.equal(report.log_guard.sources[0].line_count, 3);
|
|
assert.equal(report.log_guard.sources[0].start_line, 2);
|
|
assert.equal(report.log_guard.sources[0].timestamped_line_count, 3);
|
|
assert.ok(report.log_guard.findings.some((finding: { line?: number; troubleshooting_id?: string }) => (
|
|
finding.line === 2 && finding.troubleshooting_id === "plugin-runtime-timeout"
|
|
)));
|
|
assert.ok(!report.log_guard.findings.some((finding: { excerpt?: string }) => finding.excerpt?.includes("old failure")));
|
|
assert.doesNotMatch(result.output, /sk-since-secret/);
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("test report can limit log guard with since and until timestamps", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-report-window-"));
|
|
try {
|
|
const logPath = join(tmp, "backend.log");
|
|
writeFileSync(
|
|
logPath,
|
|
[
|
|
"[05-21 10:29:59.000] old.py (1) - [ERROR] : old failure outside scan window",
|
|
"[05-21 10:31:00.000] runner.py (2) - [INFO] : Processing request from person_websocket",
|
|
"[05-21 10:31:01.000] runner.py (3) - [INFO] : Conversation(0) Streaming completed",
|
|
"[05-21 10:32:01.000] later.py (4) - [ERROR] : later failure outside scan window",
|
|
].join("\n"),
|
|
);
|
|
|
|
const result = capture(() => commandTestReport(ctx([
|
|
"test",
|
|
"report",
|
|
"pipeline-debug-chat",
|
|
"--backend-log",
|
|
logPath,
|
|
"--since",
|
|
"2026-05-21T10:30:00+08:00",
|
|
"--until",
|
|
"2026-05-21T10:32:00+08:00",
|
|
"--json",
|
|
])));
|
|
assert.equal(result.code, 0);
|
|
const report = JSON.parse(result.output);
|
|
assert.equal(report.log_guard.scan.mode, "since+until");
|
|
assert.equal(report.log_guard.sources[0].line_count, 2);
|
|
assert.equal(report.log_guard.sources[0].start_line, 2);
|
|
assert.equal(report.log_guard.sources[0].end_line, 3);
|
|
assert.equal(report.log_guard.status, "pass");
|
|
assert.ok(!report.log_guard.findings.some((finding: { excerpt?: string }) => finding.excerpt?.includes("old failure")));
|
|
assert.ok(!report.log_guard.findings.some((finding: { excerpt?: string }) => finding.excerpt?.includes("later failure")));
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("test report classifies model route failures as env_issue", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-report-env-issue-"));
|
|
try {
|
|
const logPath = join(tmp, "backend.log");
|
|
writeFileSync(
|
|
logPath,
|
|
"[05-21 10:31:00.000] runner.py (2) - [ERROR] : runner.llm_error model_not_found no available channel for model gpt-test\n",
|
|
);
|
|
|
|
const result = capture(() => commandTestReport(ctx([
|
|
"test",
|
|
"report",
|
|
"local-agent-plugin-tool-call-debug-chat",
|
|
"--backend-log",
|
|
logPath,
|
|
"--json",
|
|
])));
|
|
assert.equal(result.code, 0);
|
|
const report = JSON.parse(result.output);
|
|
assert.equal(report.log_guard.status, "env_issue");
|
|
assert.ok(report.log_guard.findings.some((finding: { severity?: string; troubleshooting_id?: string }) => (
|
|
finding.severity === "env_issue" && finding.troubleshooting_id === "local-agent-model-route-unavailable"
|
|
)));
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("test report infers scan window from automation result evidence", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-report-evidence-window-"));
|
|
try {
|
|
const evidenceDir = join(tmp, "evidence", "run-123");
|
|
mkdirSync(evidenceDir, { recursive: true });
|
|
const consoleLog = join(evidenceDir, "console.log");
|
|
writeFileSync(
|
|
consoleLog,
|
|
[
|
|
"[05-21 10:29:59.000] old.js (1) - [ERROR] : old failure outside scan window",
|
|
"[05-21 10:31:00.000] runner.js (2) - [INFO] : Processing request from person_websocket",
|
|
"[05-21 10:31:01.000] runner.js (3) - [INFO] : Conversation(0) Streaming completed",
|
|
"[05-21 10:32:01.000] later.js (4) - [ERROR] : later failure outside scan window",
|
|
].join("\n"),
|
|
);
|
|
writeFileSync(
|
|
join(evidenceDir, "automation-result.json"),
|
|
JSON.stringify({
|
|
source: "automation",
|
|
status: "pass",
|
|
reason: "UI sentinel appeared.",
|
|
started_at_local: "2026-05-21T10:30:00.000+08:00",
|
|
finished_at_local: "2026-05-21T10:32:00.000+08:00",
|
|
}),
|
|
);
|
|
|
|
const result = capture(() => commandTestReport(ctx([
|
|
"test",
|
|
"report",
|
|
"pipeline-debug-chat",
|
|
"--console-log",
|
|
consoleLog,
|
|
"--no-auto-log",
|
|
"--json",
|
|
])));
|
|
assert.equal(result.code, 0);
|
|
const report = JSON.parse(result.output);
|
|
assert.equal(report.log_guard.scan.mode, "since+until");
|
|
assert.equal(report.log_guard.scan.since, "2026-05-21T10:30:00.000+08:00");
|
|
assert.equal(report.log_guard.scan.until, "2026-05-21T10:32:00.000+08:00");
|
|
assert.equal(report.log_guard.sources[0].line_count, 2);
|
|
assert.equal(report.log_guard.status, "pass");
|
|
assert.equal(report.automation_result.status, "loaded");
|
|
assert.equal(report.automation_result.result, "pass");
|
|
assert.equal(report.automation_result.reason, "UI sentinel appeared.");
|
|
assert.ok(!report.log_guard.findings.some((finding: { excerpt?: string }) => finding.excerpt?.includes("old failure")));
|
|
assert.ok(!report.log_guard.findings.some((finding: { excerpt?: string }) => finding.excerpt?.includes("later failure")));
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("test report does not treat final result as automation evidence", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-report-final-result-"));
|
|
try {
|
|
const evidenceDir = join(tmp, "evidence", "run-final");
|
|
mkdirSync(evidenceDir, { recursive: true });
|
|
const consoleLog = join(evidenceDir, "console.log");
|
|
writeFileSync(consoleLog, "[05-21 10:31:00.000] ui.js (1) - [INFO] : opened\n");
|
|
writeFileSync(
|
|
join(evidenceDir, "result.json"),
|
|
JSON.stringify({
|
|
source: "final",
|
|
status: "pass",
|
|
reason: "Final manual decision.",
|
|
started_at_local: "2026-05-21T10:30:00.000+08:00",
|
|
finished_at_local: "2026-05-21T10:32:00.000+08:00",
|
|
evidence_collected: ["ui", "screenshot", "console"],
|
|
}),
|
|
);
|
|
|
|
const result = capture(() => commandTestReport(ctx([
|
|
"test",
|
|
"report",
|
|
"webui-login-state",
|
|
"--console-log",
|
|
consoleLog,
|
|
"--no-auto-log",
|
|
"--json",
|
|
])));
|
|
|
|
assert.equal(result.code, 0);
|
|
const report = JSON.parse(result.output);
|
|
assert.equal(report.automation_result.status, "not_provided");
|
|
assert.match(report.automation_result.reason, /only final result\.json is present/);
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("test report still scans untimestamped explicit console evidence within an inferred run window", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-report-untimestamped-console-"));
|
|
try {
|
|
const evidenceDir = join(tmp, "evidence", "run-untimestamped");
|
|
mkdirSync(evidenceDir, { recursive: true });
|
|
const consoleLog = join(evidenceDir, "console.log");
|
|
writeFileSync(consoleLog, "[error] Uncaught TypeError: Cannot read properties of undefined\n");
|
|
writeFileSync(
|
|
join(evidenceDir, "result.json"),
|
|
JSON.stringify({
|
|
status: "pass",
|
|
reason: "UI sentinel appeared.",
|
|
started_at_local: "2026-05-21T10:30:00.000+08:00",
|
|
finished_at_local: "2026-05-21T10:32:00.000+08:00",
|
|
}),
|
|
);
|
|
|
|
const result = capture(() => commandTestReport(ctx([
|
|
"test",
|
|
"report",
|
|
"webui-login-state",
|
|
"--console-log",
|
|
consoleLog,
|
|
"--no-auto-log",
|
|
"--json",
|
|
])));
|
|
|
|
assert.equal(result.code, 0);
|
|
const report = JSON.parse(result.output);
|
|
assert.equal(report.log_guard.scan.mode, "since+until");
|
|
assert.equal(report.log_guard.sources[0].timestamped_line_count, 0);
|
|
assert.ok(report.log_guard.sources[0].line_count >= 1);
|
|
assert.equal(report.log_guard.status, "fail");
|
|
assert.ok(report.log_guard.findings.some((finding: { kind: string }) => (
|
|
finding.kind === "frontend_uncaught_error"
|
|
)));
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("test report can write markdown to an output path", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-report-output-"));
|
|
try {
|
|
const output = join(tmp, "reports", "pipeline-debug-chat.md");
|
|
const result = capture(() => commandTestReport(ctx(["test", "report", "pipeline-debug-chat", "--output", output])));
|
|
assert.equal(result.code, 0);
|
|
assert.match(result.output, /pipeline-debug-chat\.md$/);
|
|
assert.match(readFileSync(output, "utf8"), /^# Test Report: pipeline-debug-chat/m);
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("log scan reuses case-aware log guard patterns", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-log-scan-"));
|
|
try {
|
|
const logPath = join(tmp, "backend.log");
|
|
writeFileSync(
|
|
logPath,
|
|
[
|
|
"[05-21 10:31:00.000] process.py (1) - [INFO] : Processing request from person_websocket",
|
|
"[05-21 10:31:01.000] chat.py (2) - [INFO] : Conversation(0) Streaming completed",
|
|
"[05-21 10:31:02.000] runner.py (3) - [ERROR] : Action invoke_llm_stream call timed out",
|
|
].join("\n"),
|
|
);
|
|
|
|
const result = capture(() => commandLogScan(ctx([
|
|
"log",
|
|
"scan",
|
|
"--backend-log",
|
|
logPath,
|
|
"--case",
|
|
"pipeline-debug-chat",
|
|
"--json",
|
|
])));
|
|
|
|
assert.equal(result.code, 0);
|
|
const report = JSON.parse(result.output);
|
|
assert.equal(report.status, "fail");
|
|
assert.ok(report.success_signals.some((signal: { pattern: string }) => signal.pattern === "Streaming completed"));
|
|
assert.ok(report.findings.some((finding: { kind: string }) => finding.kind === "case_failure_pattern"));
|
|
|
|
const strict = capture(() => commandLogScan(ctx([
|
|
"log",
|
|
"scan",
|
|
"--backend-log",
|
|
logPath,
|
|
"--case",
|
|
"pipeline-debug-chat",
|
|
"--strict",
|
|
"--json",
|
|
])));
|
|
assert.equal(strict.code, 1);
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("log guard start and stop bound a QA log window", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-log-guard-"));
|
|
try {
|
|
const logPath = join(tmp, "backend.log");
|
|
const outputDir = join(tmp, "guards");
|
|
writeFileSync(logPath, "INFO before guard\n");
|
|
|
|
const start = capture(() => commandLogGuard(ctx([
|
|
"log",
|
|
"guard",
|
|
"start",
|
|
"--run-id",
|
|
"qa-run",
|
|
"--output-dir",
|
|
outputDir,
|
|
"--backend-log",
|
|
logPath,
|
|
"--case",
|
|
"pipeline-debug-chat",
|
|
"--json",
|
|
])));
|
|
assert.equal(start.code, 0);
|
|
const session = JSON.parse(start.output);
|
|
assert.equal(session.run_id, "qa-run");
|
|
assert.ok(existsSync(join(outputDir, "qa-run.json")));
|
|
|
|
appendFileSync(logPath, "Traceback (most recent call last):\n");
|
|
const stop = capture(() => commandLogGuard(ctx([
|
|
"log",
|
|
"guard",
|
|
"stop",
|
|
"--run-id",
|
|
"qa-run",
|
|
"--output-dir",
|
|
outputDir,
|
|
"--json",
|
|
])));
|
|
|
|
assert.equal(stop.code, 1);
|
|
const report = JSON.parse(stop.output);
|
|
assert.equal(report.session.run_id, "qa-run");
|
|
assert.equal(report.result.status, "fail");
|
|
assert.ok(report.result.findings.some((finding: { kind: string }) => finding.kind === "python_traceback"));
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("log watch observes appended LangBot backend lines", async () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-log-watch-"));
|
|
try {
|
|
const logPath = join(tmp, "backend.log");
|
|
writeFileSync(logPath, "INFO existing line\n");
|
|
|
|
const watching = captureAsync(() => commandLogWatch(ctx([
|
|
"log",
|
|
"watch",
|
|
"--backend-log",
|
|
logPath,
|
|
"--duration-ms",
|
|
"220",
|
|
"--interval-ms",
|
|
"20",
|
|
"--strict",
|
|
"--json",
|
|
])));
|
|
setTimeout(() => {
|
|
appendFileSync(logPath, "Traceback (most recent call last):\n");
|
|
}, 50);
|
|
|
|
const result = await watching;
|
|
assert.equal(result.code, 1);
|
|
const summary = JSON.parse(result.output);
|
|
assert.equal(summary.mode, "watch");
|
|
assert.equal(summary.status, "fail");
|
|
assert.ok(summary.bytes_read > 0);
|
|
assert.ok(summary.findings.some((finding: { kind: string }) => finding.kind === "python_traceback"));
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|
|
|
|
test("trouble search finds structured troubleshooting entries", () => {
|
|
const result = capture(() => commandTroubleSearch(ctx(["trouble", "search", "proxy"])));
|
|
assert.equal(result.code, 0);
|
|
assert.match(result.output, /proxy-env-mismatch/);
|
|
});
|
|
|
|
test("env local overrides shared env defaults", () => {
|
|
const tmp = mkdtempSync(join(tmpdir(), "lbs-env-"));
|
|
try {
|
|
mkdirSync(join(tmp, "skills"));
|
|
writeFileSync(join(tmp, "skills", ".env"), "LANGBOT_REPO=/shared\nLANGBOT_BACKEND_URL=http://127.0.0.1:5300\n");
|
|
writeFileSync(join(tmp, "skills", ".env.local"), "LANGBOT_REPO=/local\n");
|
|
|
|
assert.deepEqual(loadEnv(tmp), {
|
|
LANGBOT_REPO: "/local",
|
|
LANGBOT_BACKEND_URL: "http://127.0.0.1:5300",
|
|
});
|
|
} finally {
|
|
rmSync(tmp, { recursive: true, force: true });
|
|
}
|
|
});
|