import assert from "node:assert/strict"; import { test } from "node:test"; import { appendFileSync, existsSync, mkdtempSync, mkdirSync, readFileSync, rmSync, writeFileSync } from "node:fs"; import { spawnSync } from "node:child_process"; import { tmpdir } from "node:os"; import { join } from "node:path"; import type { CommandContext } from "../src/types.ts"; import { commandCaseList, commandCaseNew, commandCaseShow } from "../src/commands/case.ts"; import { commandEnvDoctor, commandEnvShow } from "../src/commands/env.ts"; import { commandFixtureCheck, commandFixtureList } from "../src/commands/fixture.ts"; import { commandLogGuard, commandLogScan, commandLogWatch } from "../src/commands/log.ts"; import { commandSuiteList, commandSuiteNew, commandSuitePlan, commandSuiteReport, commandSuiteRun, commandSuiteShow, commandSuiteStart } from "../src/commands/suite.ts"; import { commandTestPlan, commandTestRecommend, commandTestReport, commandTestResult, commandTestRun, commandTestStart } from "../src/commands/test.ts"; import { commandTroubleSearch } from "../src/commands/trouble.ts"; import { commandValidate } from "../src/commands/validate.ts"; import { commandIndex } from "../src/commands/skill.ts"; import { loadEnv } from "../src/fs.ts"; import { repoRoot } from "../src/cli.ts"; import { classifyDebugChatResult, findNewFailureSignal, minExpectedOccurrences, } from "../scripts/e2e/lib/debug-chat.mjs"; const root = process.cwd(); test("repo root detects the skills tree before generated bin exists", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-root-no-bin-")); try { mkdirSync(join(tmp, "schemas"), { recursive: true }); mkdirSync(join(tmp, "skills", "langbot-testing"), { recursive: true }); writeFileSync(join(tmp, "skills.index.json"), "{}"); writeFileSync(join(tmp, "schemas", "case.schema.json"), "{}"); assert.equal(repoRoot(join(tmp, "skills", "langbot-testing")), tmp); } finally { rmSync(tmp, { recursive: true, force: true }); } }); function ctx(args: string[]): CommandContext { return { root, args }; } function capture(fn: () => number): { code: number; output: string } { const originalLog = console.log; const lines: string[] = []; console.log = (...args: unknown[]) => { lines.push(args.map(String).join(" ")); }; try { const code = fn(); return { code, output: lines.join("\n") }; } finally { console.log = originalLog; } } function captureAll(fn: () => number): { code: number; output: string; error: string } { const originalLog = console.log; const originalWrite = process.stderr.write; const lines: string[] = []; const errors: string[] = []; console.log = (...args: unknown[]) => { lines.push(args.map(String).join(" ")); }; process.stderr.write = ((chunk: string | Uint8Array) => { errors.push(String(chunk)); return true; }) as typeof process.stderr.write; try { const code = fn(); return { code, output: lines.join("\n"), error: errors.join("") }; } finally { console.log = originalLog; process.stderr.write = originalWrite; } } function suiteResult(caseId: string, runId: string, status = "pass", evidence = ["ui", "screenshot", "console", "backend_log"]): string { return JSON.stringify({ source: "final", case_id: caseId, run_id: `${runId}-${caseId}`, status, reason: `${caseId} ${status}`, started_at_local: "2026-05-21T10:30:00.000+08:00", finished_at_local: "2026-05-21T10:31:00.000+08:00", evidence_collected: evidence, }); } function withEnv(values: Record, fn: () => T): T { const previous = new Map(Object.keys(values).map((key) => [key, process.env[key]])); try { for (const [key, value] of Object.entries(values)) process.env[key] = value; return fn(); } finally { for (const [key, value] of previous) { if (value === undefined) delete process.env[key]; else process.env[key] = value; } } } async function captureAsync(fn: () => Promise): Promise<{ code: number; output: string }> { const originalLog = console.log; const lines: string[] = []; console.log = (...args: unknown[]) => { lines.push(args.map(String).join(" ")); }; try { const code = await fn(); return { code, output: lines.join("\n") }; } finally { console.log = originalLog; } } test("validate accepts the repository assets", () => { const result = capture(() => commandValidate(root)); assert.equal(result.code, 0); assert.match(result.output, /^OK/m); }); test("validate allows blank shared env values but requires declared keys", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-validate-env-template-")); try { const schemasDir = join(tmp, "schemas"); const skillsDir = join(tmp, "skills"); const testingDir = join(skillsDir, "langbot-testing"); mkdirSync(schemasDir, { recursive: true }); mkdirSync(testingDir, { recursive: true }); for (const schemaName of ["case.schema.json", "suite.schema.json", "troubleshooting.schema.json", "skill-index.schema.json"]) { writeFileSync(join(schemasDir, schemaName), "{}"); } writeFileSync(join(testingDir, "SKILL.md"), "---\nname: langbot-testing\ndescription: Testing.\n---\n\n# Testing\n"); const envText = [ "LANGBOT_FRONTEND_URL=http://127.0.0.1:3000", "LANGBOT_BACKEND_URL=http://127.0.0.1:5300", "LANGBOT_DEV_FRONTEND_URL=http://127.0.0.1:3000", "LANGBOT_REPO=", "LANGBOT_WEB_REPO=", "LANGBOT_BROWSER_PROFILE=", "LANGBOT_CHROMIUM_EXECUTABLE=", ].join("\n"); writeFileSync(join(skillsDir, ".env"), envText); writeFileSync(join(skillsDir, ".env.example"), envText); const result = capture(() => commandValidate(tmp)); assert.equal(result.code, 0); assert.match(result.output, /^OK/m); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("index includes case summaries for agent discovery", () => { const result = capture(() => commandIndex({ root, args: ["index"] })); assert.equal(result.code, 0); const index = JSON.parse(readFileSync(join(root, "skills.index.json"), "utf8")); const testing = index.skills.find((skill: { name: string }) => skill.name === "langbot-testing"); assert.ok(testing); assert.ok(testing.case_summaries.some((item: { id: string; priority: string; evidence_required: string[] }) => ( item.id === "pipeline-debug-chat" && item.priority === "p0" && item.evidence_required.includes("backend_log") ))); assert.ok(testing.case_summaries.some((item: { id: string; setup_automation: string[]; setup_provides_env: string[] }) => ( item.id === "agent-runner-qa-debug-chat" && item.setup_automation.includes("case:agent-runner-live-install") && item.setup_provides_env.includes("LANGBOT_QA_AGENT_RUNNER_PIPELINE_URL") ))); assert.ok(testing.suite_summaries.some((item: { id: string; cases: string[] }) => ( item.id === "core-smoke" && item.cases.includes("pipeline-debug-chat") ))); assert.ok(testing.fixtures.some((item: { id: string; related_cases: string[] }) => ( item.id === "mcp-stdio-echo-server" && item.related_cases.includes("mcp-stdio-tool-call") ))); }); test("index check detects stale index without writing", () => { const path = join(root, "skills.index.json"); const current = capture(() => commandIndex({ root, args: ["index"] })); assert.equal(current.code, 0); const fresh = readFileSync(path, "utf8"); try { const ok = capture(() => commandIndex({ root, args: ["index", "--check"] })); assert.equal(ok.code, 0); assert.match(ok.output, /^OK /); writeFileSync(path, "{}\n"); const stale = captureAll(() => commandIndex({ root, args: ["index", "--check"] })); assert.equal(stale.code, 1); assert.match(stale.error, /index is stale/); assert.equal(readFileSync(path, "utf8"), "{}\n"); } finally { writeFileSync(path, fresh); } }); test("case list exposes seeded QA cases", () => { const result = capture(() => commandCaseList(ctx(["case", "list"]))); assert.equal(result.code, 0); assert.match(result.output, /pipeline-debug-chat/); assert.match(result.output, /provider-deepseek/); assert.match(result.output, /webui-login-state/); }); test("case list JSON filters by reusable agent-selection metadata", () => { const result = capture(() => commandCaseList(ctx([ "case", "list", "--json", "--priority", "p0", "--automation", ]))); assert.equal(result.code, 0); const rows = JSON.parse(result.output); assert.ok(rows.length >= 2); assert.ok(rows.every((row: { priority: string }) => row.priority === "p0")); assert.ok(rows.every((row: { automation: string }) => row.automation)); assert.ok(rows.some((row: { id: string; evidence_required: string[]; readiness: string }) => ( row.id === "pipeline-debug-chat" && row.evidence_required.includes("backend_log") && row.readiness ))); }); test("case list distinguishes machine readiness from manual precondition checks", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-case-manual-readiness-")); try { const skillDir = join(tmp, "skills", "langbot-testing"); mkdirSync(join(skillDir, "cases"), { recursive: true }); writeFileSync( join(skillDir, "SKILL.md"), "---\nname: langbot-testing\ndescription: Testing.\n---\n\n# Testing\n", ); writeFileSync(join(tmp, "skills", ".env"), "LANGBOT_FRONTEND_URL=http://127.0.0.1:3000\n"); writeFileSync( join(skillDir, "cases", "manual-case.yaml"), [ "id: manual-case", "title: Manual Case", "mode: agent-browser", "area: pipeline", "type: smoke", "priority: p2", "risk: medium", "ci_eligible: false", "tags:", " - smoke", "skills:", " - langbot-testing", "env:", " - LANGBOT_FRONTEND_URL", "preconditions:", " - Confirm the target pipeline is safe to modify.", "steps:", " - Open the page.", "checks:", " - UI: Page opens.", "evidence_required:", " - ui", ].join("\n"), ); const machineReady = capture(() => commandCaseList({ root: tmp, args: ["case", "list", "--machine-ready"] })); assert.equal(machineReady.code, 0); assert.match(machineReady.output, /manual-case/); assert.match(machineReady.output, /manual-check/); const ready = capture(() => commandCaseList({ root: tmp, args: ["case", "list", "--ready"] })); assert.equal(ready.code, 0); assert.doesNotMatch(ready.output, /manual-case/); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("case show prints structured agent-browser case", () => { const result = capture(() => commandCaseShow(ctx(["case", "show", "pipeline-debug-chat"]))); assert.equal(result.code, 0); assert.match(result.output, /^id: pipeline-debug-chat/m); assert.match(result.output, /^mode: agent-browser/m); assert.match(result.output, /^checks:/m); }); test("case new writes required selection metadata", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-case-new-")); try { const skillDir = join(tmp, "skills", "langbot-testing"); mkdirSync(skillDir, { recursive: true }); writeFileSync( join(skillDir, "SKILL.md"), "---\nname: langbot-testing\ndescription: Testing.\n---\n\n# Testing\n", ); const result = capture(() => commandCaseNew({ root: tmp, args: ["case", "new", "new-case", "--title", "New Case"], })); assert.equal(result.code, 0); const text = readFileSync(join(skillDir, "cases", "new-case.yaml"), "utf8"); assert.match(text, /^priority: p2/m); assert.match(text, /^risk: medium/m); assert.match(text, /^ci_eligible: false/m); assert.match(text, /^evidence_required:/m); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("suite list and plan expose reusable case groups", () => { const list = capture(() => commandSuiteList(ctx(["suite", "list", "--json", "--priority", "p0"]))); assert.equal(list.code, 0); const suites = JSON.parse(list.output); assert.ok(suites.some((suite: { id: string; cases: string[] }) => ( suite.id === "core-smoke" && suite.cases.includes("webui-login-state") ))); const plan = capture(() => commandSuitePlan(ctx(["suite", "plan", "core-smoke", "--json"]))); assert.equal(plan.code, 0); const suitePlan = JSON.parse(plan.output); assert.equal(suitePlan.id, "core-smoke"); assert.ok(suitePlan.cases.some((item: { id: string; evidence_required: string[] }) => ( item.id === "pipeline-debug-chat" && item.evidence_required.includes("backend_log") ))); assert.ok(suitePlan.commands.some((item: { id: string; automation: string }) => ( item.id === "pipeline-debug-chat" && item.automation.includes("test run") ))); const localAgent = capture(() => commandSuitePlan(ctx(["suite", "plan", "local-agent-gate", "--json"]))); assert.equal(localAgent.code, 0); const localAgentPlan = JSON.parse(localAgent.output); assert.ok(["ready", "missing", "manual_check"].includes(localAgentPlan.readiness.status)); const basic = localAgentPlan.cases.find((item: { id: string }) => item.id === "local-agent-basic-debug-chat"); assert.equal(basic.automation_readiness.pipeline_env_required, true); }); test("suite show prints structured suite YAML", () => { const result = capture(() => commandSuiteShow(ctx(["suite", "show", "local-agent-gate"]))); assert.equal(result.code, 0); assert.match(result.output, /^id: local-agent-gate/m); assert.match(result.output, /^cases:/m); assert.match(result.output, /local-agent-effective-prompt-debug-chat/); }); test("suite start creates a run handoff with per-case evidence commands", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-suite-start-")); try { const evidenceRoot = join(tmp, "evidence"); const result = capture(() => commandSuiteStart(ctx([ "suite", "start", "core-smoke", "--run-id", "core-smoke-local", "--evidence-dir", evidenceRoot, "--json", ]))); assert.equal(result.code, 0); const start = JSON.parse(result.output); assert.equal(start.suite.id, "core-smoke"); assert.equal(start.run_id, "core-smoke-local"); assert.equal(start.evidence_root, evidenceRoot); assert.equal(start.manifest_path, join(evidenceRoot, "suite-start.json")); assert.equal(start.handoff_path, join(evidenceRoot, "suite-start.md")); assert.match(start.report_command, /bin\/lbs suite report core-smoke/); assert.ok(existsSync(join(evidenceRoot, "suite-start.json"))); assert.ok(existsSync(join(evidenceRoot, "suite-start.md"))); const pipeline = start.cases.find((item: { id: string }) => item.id === "pipeline-debug-chat"); assert.ok(pipeline); assert.ok(existsSync(join(evidenceRoot, "pipeline-debug-chat"))); assert.match(pipeline.automation_command, /bin\/lbs test run pipeline-debug-chat/); assert.match(pipeline.report_command, /--evidence-dir .+pipeline-debug-chat/); assert.match(pipeline.result_command_template, /bin\/lbs test result pipeline-debug-chat/); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("suite report aggregates case result JSON files", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-suite-report-")); try { const evidenceRoot = join(tmp, "suite-evidence"); const runId = "suite-report-run"; for (const [caseId, status] of [ ["webui-login-state", "pass"], ["pipeline-debug-chat", "pass"], ["local-agent-basic-debug-chat", "env_issue"], ]) { const dir = join(evidenceRoot, caseId); mkdirSync(dir, { recursive: true }); writeFileSync( join(dir, "result.json"), suiteResult(caseId, runId, status), ); } const result = capture(() => commandSuiteReport(ctx([ "suite", "report", "core-smoke", "--run-id", runId, "--evidence-dir", evidenceRoot, "--json", ]))); assert.equal(result.code, 0); const report = JSON.parse(result.output); assert.equal(report.status, "env_issue"); assert.equal(report.counts.pass, 2); assert.equal(report.counts.env_issue, 1); assert.ok(report.cases.some((item: { id: string; result: { status: string } }) => ( item.id === "local-agent-basic-debug-chat" && item.result.status === "env_issue" ))); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("suite report treats pass without required evidence as incomplete", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-suite-report-evidence-")); try { const evidenceRoot = join(tmp, "suite-evidence"); const runId = "suite-report-evidence"; for (const caseId of ["webui-login-state", "pipeline-debug-chat", "local-agent-basic-debug-chat"]) { const dir = join(evidenceRoot, caseId); mkdirSync(dir, { recursive: true }); writeFileSync( join(dir, "result.json"), suiteResult(caseId, runId, "pass", ["ui"]), ); } const result = capture(() => commandSuiteReport(ctx([ "suite", "report", "core-smoke", "--run-id", runId, "--evidence-dir", evidenceRoot, "--json", ]))); assert.equal(result.code, 0); const report = JSON.parse(result.output); assert.equal(report.status, "incomplete"); assert.ok(report.cases.some((item: { id: string; result: { evidence_missing: string[] } }) => ( item.id === "pipeline-debug-chat" && item.result.evidence_missing.includes("backend_log") ))); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("suite report marks missing case evidence as incomplete", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-suite-report-missing-")); try { const evidenceRoot = join(tmp, "suite-evidence"); const runId = "suite-report-missing"; mkdirSync(join(evidenceRoot, "webui-login-state"), { recursive: true }); writeFileSync(join(evidenceRoot, "webui-login-state", "result.json"), suiteResult("webui-login-state", runId, "pass")); const result = capture(() => commandSuiteReport(ctx([ "suite", "report", "core-smoke", "--run-id", runId, "--evidence-dir", evidenceRoot, "--json", ]))); assert.equal(result.code, 0); const report = JSON.parse(result.output); assert.equal(report.status, "incomplete"); assert.ok(report.cases.some((item: { id: string; result: { status: string } }) => ( item.id === "pipeline-debug-chat" && item.result.status === "missing" ))); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("suite report rejects result files from the wrong case or run", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-suite-report-mismatch-")); try { const evidenceRoot = join(tmp, "suite-evidence"); const runId = "suite-report-mismatch"; for (const caseId of ["webui-login-state", "pipeline-debug-chat", "local-agent-basic-debug-chat"]) { const dir = join(evidenceRoot, caseId); mkdirSync(dir, { recursive: true }); writeFileSync(join(dir, "result.json"), suiteResult(caseId, runId, "pass")); } writeFileSync(join(evidenceRoot, "pipeline-debug-chat", "result.json"), suiteResult("webui-login-state", runId, "pass")); writeFileSync(join(evidenceRoot, "local-agent-basic-debug-chat", "result.json"), suiteResult("local-agent-basic-debug-chat", "old-run", "pass")); const result = capture(() => commandSuiteReport(ctx([ "suite", "report", "core-smoke", "--run-id", runId, "--evidence-dir", evidenceRoot, "--json", ]))); assert.equal(result.code, 0); const report = JSON.parse(result.output); assert.equal(report.status, "fail"); assert.ok(report.cases.some((item: { id: string; result: { status: string; reason: string } }) => ( item.id === "pipeline-debug-chat" && item.result.status === "invalid" && item.result.reason.includes("case_id mismatch") ))); assert.ok(report.cases.some((item: { id: string; result: { status: string; reason: string } }) => ( item.id === "local-agent-basic-debug-chat" && item.result.status === "invalid" && item.result.reason.includes("run_id mismatch") ))); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("suite run executes automated cases and aggregates a verdict", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-suite-run-")); try { const skillDir = join(tmp, "skills", "langbot-testing"); const casesDir = join(skillDir, "cases"); const suitesDir = join(skillDir, "suites"); const scriptsDir = join(tmp, "scripts"); mkdirSync(casesDir, { recursive: true }); mkdirSync(suitesDir, { recursive: true }); mkdirSync(scriptsDir, { recursive: true }); writeFileSync(join(skillDir, "SKILL.md"), "---\nname: langbot-testing\ndescription: Testing.\n---\n\n# Testing\n"); writeFileSync(join(tmp, "skills", ".env"), ""); writeFileSync( join(casesDir, "one.yaml"), [ "id: one", "title: One", "mode: probe", "area: qa", "type: smoke", "priority: p2", "risk: low", "ci_eligible: true", "automation: scripts/pass.mjs", "evidence_required:", " - filesystem", ].join("\n"), ); writeFileSync( join(casesDir, "two.yaml"), [ "id: two", "title: Two", "mode: probe", "area: qa", "type: smoke", "priority: p2", "risk: low", "ci_eligible: true", "automation: scripts/pass.mjs", "evidence_required:", " - filesystem", ].join("\n"), ); writeFileSync( join(suitesDir, "mini.yaml"), [ "id: mini", "title: Mini", "description: Mini suite.", "type: smoke", "priority: p2", "tags:", " - qa", "cases:", " - one", " - two", ].join("\n"), ); writeFileSync( join(scriptsDir, "pass.mjs"), [ "import { mkdirSync, writeFileSync } from 'node:fs';", "import { join } from 'node:path';", "mkdirSync(process.env.LBS_EVIDENCE_DIR, { recursive: true });", "writeFileSync(join(process.env.LBS_EVIDENCE_DIR, 'result.json'), JSON.stringify({", " case_id: process.env.LBS_CASE_ID,", " run_id: process.env.LBS_RUN_ID,", " status: 'pass',", " reason: `${process.env.LBS_CASE_ID} pass`,", " evidence_collected: ['filesystem']", "}));", "writeFileSync(join(process.env.LBS_EVIDENCE_DIR, 'automation-result.json'), JSON.stringify({ status: 'pass' }));", ].join("\n"), ); const result = capture(() => commandSuiteRun({ root: tmp, args: ["suite", "run", "mini", "--run-id", "mini-run", "--evidence-dir", join(tmp, "evidence"), "--json"], })); assert.equal(result.code, 0); const payload = JSON.parse(result.output); assert.equal(payload.report.status, "pass"); assert.equal(payload.report.counts.pass, 2); assert.deepEqual(payload.executions.map((item: { status: string }) => item.status), ["ok", "ok"]); assert.ok(existsSync(join(tmp, "evidence", "one", "result.json"))); assert.ok(existsSync(join(tmp, "evidence", "two", "result.json"))); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("suite run JSON captures failed case output", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-suite-run-fail-")); try { const skillDir = join(tmp, "skills", "langbot-testing"); const casesDir = join(skillDir, "cases"); const suitesDir = join(skillDir, "suites"); const scriptsDir = join(tmp, "scripts"); mkdirSync(casesDir, { recursive: true }); mkdirSync(suitesDir, { recursive: true }); mkdirSync(scriptsDir, { recursive: true }); writeFileSync(join(skillDir, "SKILL.md"), "---\nname: langbot-testing\ndescription: Testing.\n---\n\n# Testing\n"); writeFileSync(join(tmp, "skills", ".env"), ""); writeFileSync( join(casesDir, "fail-case.yaml"), [ "id: fail-case", "title: Fail Case", "mode: probe", "area: qa", "type: smoke", "priority: p2", "risk: low", "ci_eligible: true", "automation: scripts/fail.mjs", ].join("\n"), ); writeFileSync( join(suitesDir, "mini.yaml"), [ "id: mini", "title: Mini", "description: Mini suite.", "type: smoke", "priority: p2", "tags:", " - qa", "cases:", " - fail-case", ].join("\n"), ); writeFileSync(join(scriptsDir, "fail.mjs"), "console.error('child failure detail'); process.exit(1);\n"); const result = capture(() => commandSuiteRun({ root: tmp, args: ["suite", "run", "mini", "--run-id", "mini-run", "--evidence-dir", join(tmp, "evidence"), "--json"], })); assert.equal(result.code, 1); const payload = JSON.parse(result.output); assert.equal(payload.executions[0].status, "nonzero"); assert.match(payload.executions[0].stderr, /child failure detail/); assert.equal(payload.report.status, "fail"); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("suite run failure cannot be masked by stale pass result", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-suite-run-stale-pass-")); try { const skillDir = join(tmp, "skills", "langbot-testing"); const casesDir = join(skillDir, "cases"); const suitesDir = join(skillDir, "suites"); const scriptsDir = join(tmp, "scripts"); const evidenceDir = join(tmp, "evidence"); mkdirSync(casesDir, { recursive: true }); mkdirSync(suitesDir, { recursive: true }); mkdirSync(scriptsDir, { recursive: true }); mkdirSync(join(evidenceDir, "fail-case"), { recursive: true }); writeFileSync(join(skillDir, "SKILL.md"), "---\nname: langbot-testing\ndescription: Testing.\n---\n\n# Testing\n"); writeFileSync(join(tmp, "skills", ".env"), ""); writeFileSync( join(casesDir, "fail-case.yaml"), [ "id: fail-case", "title: Fail Case", "mode: probe", "area: qa", "type: smoke", "priority: p2", "risk: low", "ci_eligible: true", "automation: scripts/fail.mjs", "evidence_required:", " - filesystem", ].join("\n"), ); writeFileSync( join(suitesDir, "mini.yaml"), [ "id: mini", "title: Mini", "description: Mini suite.", "type: smoke", "priority: p2", "tags:", " - qa", "cases:", " - fail-case", ].join("\n"), ); writeFileSync(join(scriptsDir, "fail.mjs"), "process.exit(1);\n"); writeFileSync(join(evidenceDir, "fail-case", "result.json"), JSON.stringify({ case_id: "fail-case", run_id: "stale-run-fail-case", status: "pass", evidence_collected: ["filesystem"], })); const result = capture(() => commandSuiteRun({ root: tmp, args: ["suite", "run", "mini", "--run-id", "stale-run", "--evidence-dir", evidenceDir, "--json"], })); assert.equal(result.code, 1); const payload = JSON.parse(result.output); assert.equal(payload.executions[0].status, "nonzero"); assert.equal(payload.report.status, "fail"); assert.equal(payload.report.execution_status, "fail"); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("suite run dry-run plans automation without creating evidence", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-suite-run-dry-")); try { const skillDir = join(tmp, "skills", "langbot-testing"); const casesDir = join(skillDir, "cases"); const suitesDir = join(skillDir, "suites"); const scriptsDir = join(tmp, "scripts"); mkdirSync(casesDir, { recursive: true }); mkdirSync(suitesDir, { recursive: true }); mkdirSync(scriptsDir, { recursive: true }); writeFileSync(join(skillDir, "SKILL.md"), "---\nname: langbot-testing\ndescription: Testing.\n---\n\n# Testing\n"); writeFileSync(join(tmp, "skills", ".env"), ""); writeFileSync( join(casesDir, "dry-case.yaml"), [ "id: dry-case", "title: Dry Case", "mode: probe", "area: qa", "type: smoke", "priority: p2", "risk: low", "ci_eligible: true", "automation: scripts/fail-if-run.mjs", ].join("\n"), ); writeFileSync( join(suitesDir, "dry-suite.yaml"), [ "id: dry-suite", "title: Dry Suite", "description: Dry run suite.", "type: smoke", "priority: p2", "tags:", " - qa", "cases:", " - dry-case", ].join("\n"), ); writeFileSync(join(scriptsDir, "fail-if-run.mjs"), "process.exit(9);\n"); const evidenceDir = join(tmp, "evidence"); const result = capture(() => commandSuiteRun({ root: tmp, args: ["suite", "run", "dry-suite", "--run-id", "dry-run", "--evidence-dir", evidenceDir, "--dry-run", "--json"], })); assert.equal(result.code, 0); const payload = JSON.parse(result.output); assert.equal(payload.executions[0].status, "planned"); assert.match(payload.executions[0].command, /test run dry-case/); assert.equal(payload.report.status, "incomplete"); assert.equal(existsSync(evidenceDir), false); assert.equal(existsSync(join(tmp, "reports", "dry-run.md")), false); const markdown = capture(() => commandSuiteRun({ root: tmp, args: ["suite", "run", "dry-suite", "--run-id", "dry-run-markdown", "--evidence-dir", join(tmp, "evidence-md"), "--dry-run"], })); assert.equal(markdown.code, 0); assert.match(markdown.output, /# Suite Report: dry-suite/); assert.equal(existsSync(join(tmp, "reports", "dry-run-markdown.md")), false); assert.equal(existsSync(join(tmp, "evidence-md")), false); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("suite run skips manual-check cases unless explicitly included", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-suite-run-manual-")); try { const skillDir = join(tmp, "skills", "langbot-testing"); const casesDir = join(skillDir, "cases"); const suitesDir = join(skillDir, "suites"); const scriptsDir = join(tmp, "scripts"); mkdirSync(casesDir, { recursive: true }); mkdirSync(suitesDir, { recursive: true }); mkdirSync(scriptsDir, { recursive: true }); writeFileSync(join(skillDir, "SKILL.md"), "---\nname: langbot-testing\ndescription: Testing.\n---\n\n# Testing\n"); writeFileSync(join(tmp, "skills", ".env"), ""); writeFileSync( join(casesDir, "manual-case.yaml"), [ "id: manual-case", "title: Manual Case", "mode: probe", "area: qa", "type: smoke", "priority: p2", "risk: low", "ci_eligible: true", "preconditions:", " - Confirm this case is safe to run.", "automation: scripts/pass.mjs", "evidence_required:", " - filesystem", ].join("\n"), ); writeFileSync( join(suitesDir, "manual-suite.yaml"), [ "id: manual-suite", "title: Manual Suite", "description: Manual check suite.", "type: smoke", "priority: p2", "tags:", " - qa", "cases:", " - manual-case", ].join("\n"), ); writeFileSync( join(scriptsDir, "pass.mjs"), [ "import { mkdirSync, writeFileSync } from 'node:fs';", "import { join } from 'node:path';", "mkdirSync(process.env.LBS_EVIDENCE_DIR, { recursive: true });", "writeFileSync(join(process.env.LBS_EVIDENCE_DIR, 'result.json'), JSON.stringify({ case_id: process.env.LBS_CASE_ID, run_id: process.env.LBS_RUN_ID, status: 'pass', evidence_collected: ['filesystem'] }));", ].join("\n"), ); const skipped = capture(() => commandSuiteRun({ root: tmp, args: ["suite", "run", "manual-suite", "--run-id", "manual-run", "--evidence-dir", join(tmp, "evidence"), "--json"], })); assert.equal(skipped.code, 1); const skippedPayload = JSON.parse(skipped.output); assert.equal(skippedPayload.executions[0].status, "skipped"); assert.match(skippedPayload.executions[0].reason, /manual_check/); assert.equal(existsSync(join(tmp, "evidence", "manual-case", "result.json")), false); const included = capture(() => commandSuiteRun({ root: tmp, args: ["suite", "run", "manual-suite", "--run-id", "manual-run-included", "--evidence-dir", join(tmp, "evidence-included"), "--include-manual-check", "--json"], })); assert.equal(included.code, 0); const includedPayload = JSON.parse(included.output); assert.equal(includedPayload.executions[0].status, "ok"); assert.equal(includedPayload.report.status, "pass"); assert.ok(existsSync(join(tmp, "evidence-included", "manual-case", "result.json"))); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("suite run skips cases with missing machine readiness unless explicitly included", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-suite-run-readiness-")); try { const skillDir = join(tmp, "skills", "langbot-testing"); const casesDir = join(skillDir, "cases"); const suitesDir = join(skillDir, "suites"); const fixturesDir = join(skillDir, "fixtures"); const scriptsDir = join(tmp, "scripts"); mkdirSync(casesDir, { recursive: true }); mkdirSync(suitesDir, { recursive: true }); mkdirSync(fixturesDir, { recursive: true }); mkdirSync(scriptsDir, { recursive: true }); writeFileSync(join(skillDir, "SKILL.md"), "---\nname: langbot-testing\ndescription: Testing.\n---\n\n# Testing\n"); writeFileSync(join(tmp, "skills", ".env"), ""); writeFileSync( join(casesDir, "not-ready-case.yaml"), [ "id: not-ready-case", "title: Not Ready Case", "mode: probe", "area: qa", "type: smoke", "priority: p2", "risk: low", "ci_eligible: true", "env:", " - LBS_TEST_SUITE_RUN_MISSING_ENV", "automation_env:", " - LBS_TEST_SUITE_RUN_MISSING_AUTOMATION_ENV", "automation: scripts/pass.mjs", "evidence_required:", " - filesystem", ].join("\n"), ); writeFileSync( join(fixturesDir, "fixtures.json"), `${JSON.stringify([{ id: "missing-fixture", title: "Missing fixture", kind: "file", path: "fixtures/missing.txt", related_cases: ["not-ready-case"], checks: ["exists"], }], null, 2)}\n`, ); writeFileSync( join(suitesDir, "readiness-suite.yaml"), [ "id: readiness-suite", "title: Readiness Suite", "description: Readiness suite.", "type: smoke", "priority: p2", "tags:", " - qa", "cases:", " - not-ready-case", ].join("\n"), ); writeFileSync( join(scriptsDir, "pass.mjs"), [ "import { mkdirSync, writeFileSync } from 'node:fs';", "import { join } from 'node:path';", "mkdirSync(process.env.LBS_EVIDENCE_DIR, { recursive: true });", "writeFileSync(join(process.env.LBS_EVIDENCE_DIR, 'result.json'), JSON.stringify({ case_id: process.env.LBS_CASE_ID, run_id: process.env.LBS_RUN_ID, status: 'pass', evidence_collected: ['filesystem'] }));", ].join("\n"), ); const skipped = capture(() => commandSuiteRun({ root: tmp, args: ["suite", "run", "readiness-suite", "--run-id", "readiness-run", "--evidence-dir", join(tmp, "evidence"), "--json"], })); assert.equal(skipped.code, 1); const skippedPayload = JSON.parse(skipped.output); assert.equal(skippedPayload.executions[0].status, "skipped"); assert.match(skippedPayload.executions[0].reason, /readiness missing/); assert.match(skippedPayload.executions[0].reason, /LBS_TEST_SUITE_RUN_MISSING_ENV/); assert.match(skippedPayload.executions[0].reason, /LBS_TEST_SUITE_RUN_MISSING_AUTOMATION_ENV/); assert.match(skippedPayload.executions[0].reason, /missing-fixture/); assert.equal(existsSync(join(tmp, "evidence", "not-ready-case", "result.json")), false); const included = capture(() => commandSuiteRun({ root: tmp, args: ["suite", "run", "readiness-suite", "--run-id", "readiness-run-included", "--evidence-dir", join(tmp, "evidence-included"), "--include-not-ready", "--json"], })); assert.equal(included.code, 0); const includedPayload = JSON.parse(included.output); assert.equal(includedPayload.executions[0].status, "ok"); assert.equal(includedPayload.report.status, "pass"); assert.ok(existsSync(join(tmp, "evidence-included", "not-ready-case", "result.json"))); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("suite new writes a reusable suite skeleton", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-suite-new-")); try { const skillDir = join(tmp, "skills", "langbot-testing"); mkdirSync(skillDir, { recursive: true }); writeFileSync( join(skillDir, "SKILL.md"), "---\nname: langbot-testing\ndescription: Testing.\n---\n\n# Testing\n", ); const result = capture(() => commandSuiteNew({ root: tmp, args: ["suite", "new", "new-suite", "--title", "New Suite"], })); assert.equal(result.code, 0); const text = readFileSync(join(skillDir, "suites", "new-suite.yaml"), "utf8"); assert.match(text, /^description:/m); assert.match(text, /^priority: p2/m); assert.match(text, /^cases:/m); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("fixture list and check expose reusable fixture readiness", () => { const list = capture(() => commandFixtureList(ctx(["fixture", "list", "langbot-testing", "--json"]))); assert.equal(list.code, 0); const fixtures = JSON.parse(list.output); assert.ok(fixtures.some((item: { id: string; exists: boolean }) => ( item.id === "mcp-stdio-echo-server" && item.exists === true ))); const check = capture(() => commandFixtureCheck(ctx(["fixture", "check", "langbot-testing", "--json"]))); assert.equal(check.code, 0); const report = JSON.parse(check.output); assert.equal(report.status, "pass"); assert.ok(report.fixtures.some((item: { id: string }) => item.id === "qa-plugin-smoke-package")); }); test("fixture check reports missing manifest paths", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-fixture-check-")); try { const skillDir = join(tmp, "skills", "langbot-testing"); mkdirSync(join(skillDir, "fixtures"), { recursive: true }); writeFileSync( join(skillDir, "SKILL.md"), "---\nname: langbot-testing\ndescription: Testing.\n---\n\n# Testing\n", ); writeFileSync( join(skillDir, "fixtures", "fixtures.json"), JSON.stringify([{ id: "missing-fixture", title: "Missing Fixture", path: "fixtures/missing.txt" }]), ); const result = capture(() => commandFixtureCheck({ root: tmp, args: ["fixture", "check", "langbot-testing", "--json"] })); assert.equal(result.code, 1); const report = JSON.parse(result.output); assert.equal(report.status, "fail"); assert.ok(report.findings.some((finding: { id?: string }) => finding.id === "missing-fixture")); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("fixture check verifies QA AgentRunner source shape", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-fixture-check-")); try { const skillDir = join(tmp, "skills", "langbot-testing"); const fixtureDir = join(skillDir, "fixtures", "plugins", "qa-agent-runner"); mkdirSync(join(fixtureDir, "components", "agent_runner"), { recursive: true }); writeFileSync( join(skillDir, "SKILL.md"), "---\nname: langbot-testing\ndescription: Testing.\n---\n\n# Testing\n", ); writeFileSync( join(skillDir, "fixtures", "fixtures.json"), JSON.stringify([{ id: "qa-agent-runner-source", title: "QA AgentRunner", path: "fixtures/plugins/qa-agent-runner/manifest.yaml", checks: ["exists", "qa_agent_runner_source"], }]), ); writeFileSync(join(fixtureDir, "manifest.yaml"), "spec:\n components:\n AgentRunner: {}\nexecution:\n python:\n attr: QAAgentRunnerPlugin\n"); const result = capture(() => commandFixtureCheck({ root: tmp, args: ["fixture", "check", "langbot-testing", "--json"] })); assert.equal(result.code, 1); const report = JSON.parse(result.output); assert.ok(report.findings.some((finding: { kind?: string; path?: string }) => ( finding.kind === "fixture_check_missing_file" && finding.path?.endsWith("components/agent_runner/default.py") ))); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("fixture check accepts complete QA AgentRunner source shape", () => { const result = capture(() => commandFixtureCheck(ctx(["fixture", "check", "langbot-testing", "--json"]))); assert.equal(result.code, 0); const report = JSON.parse(result.output); assert.ok(report.fixtures.some((item: { id: string; checks: string[] }) => ( item.id === "qa-agent-runner-source" && item.checks.includes("qa_agent_runner_source") ))); }); test("fixture check rejects invalid plugin package files", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-fixture-check-")); try { const skillDir = join(tmp, "skills", "langbot-testing"); mkdirSync(join(skillDir, "fixtures"), { recursive: true }); writeFileSync( join(skillDir, "SKILL.md"), "---\nname: langbot-testing\ndescription: Testing.\n---\n\n# Testing\n", ); writeFileSync(join(skillDir, "fixtures", "bad.lbpkg"), "not a zip"); writeFileSync( join(skillDir, "fixtures", "fixtures.json"), JSON.stringify([{ id: "bad-package", title: "Bad Package", path: "fixtures/bad.lbpkg", checks: ["exists", "zip_package"], }]), ); const result = capture(() => commandFixtureCheck({ root: tmp, args: ["fixture", "check", "langbot-testing", "--json"] })); assert.equal(result.code, 1); const report = JSON.parse(result.output); assert.ok(report.findings.some((finding: { kind?: string; id?: string }) => ( finding.kind === "fixture_check_invalid_zip" && finding.id === "bad-package" ))); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("debug chat classifier prefers latest response leaf over body counts", () => { const result = classifyDebugChatResult({ beforeText: "OK from an older chat", afterText: "OK from an older chat\nUser: say OK\nBot: OK", expectedText: "OK", prompt: "say OK", latestExpectedLeaf: "Bot: OK", latestFailureLeaf: "", }); assert.equal(result.status, "pass"); assert.match(result.reason, /latest visible response leaf/); }); test("debug chat classifier distinguishes new failure signals from old history", () => { assert.equal( findNewFailureSignal("Agent runner temporarily unavailable", "Agent runner temporarily unavailable"), "", ); assert.equal( findNewFailureSignal("", "Agent runner temporarily unavailable"), "Agent runner temporarily unavailable", ); const result = classifyDebugChatResult({ beforeText: "", afterText: "Agent runner temporarily unavailable", expectedText: "OK", prompt: "say OK", latestExpectedLeaf: "", latestFailureLeaf: "Agent runner temporarily unavailable", }); assert.equal(result.status, "fail"); assert.match(result.reason, /known failure signal/); const custom = classifyDebugChatResult({ beforeText: "", afterText: "Bot: qa-plugin-smoke:mcp-ok-local-agent", expectedText: "qa_mcp_echo:mcp-ok-local-agent", prompt: "call mcp", latestExpectedLeaf: "", latestFailureLeaf: "Bot: qa-plugin-smoke:mcp-ok-local-agent", failureSignals: ["qa-plugin-smoke:mcp-ok-local-agent"], }); assert.equal(custom.status, "fail"); assert.equal(custom.failure_signal, "qa-plugin-smoke:mcp-ok-local-agent"); }); test("debug chat classifier lets new failure signals override stale expected history", () => { const result = classifyDebugChatResult({ beforeText: "Bot: qa_mcp_echo:mcp-ok-local-agent", afterText: [ "Bot: qa_mcp_echo:mcp-ok-local-agent", "User: Call qa_mcp_echo", "Bot: Agent runner temporarily unavailable.", ].join("\n"), expectedText: "qa_mcp_echo:mcp-ok-local-agent", prompt: "Call qa_mcp_echo", latestExpectedLeaf: "Bot: qa_mcp_echo:mcp-ok-local-agent", latestFailureLeaf: "Bot: Agent runner temporarily unavailable.", }); assert.equal(result.status, "fail"); assert.equal(result.failure_signal, "Agent runner temporarily unavailable"); }); test("debug chat classifier does not pass on stale expected history without a new occurrence", () => { const result = classifyDebugChatResult({ beforeText: "Bot: qa_mcp_echo:mcp-ok-local-agent", afterText: [ "Bot: qa_mcp_echo:mcp-ok-local-agent", "User: Call qa_mcp_echo", ].join("\n"), expectedText: "qa_mcp_echo:mcp-ok-local-agent", prompt: "Call qa_mcp_echo", latestExpectedLeaf: "Bot: qa_mcp_echo:mcp-ok-local-agent", latestFailureLeaf: "", }); assert.equal(result.status, "fail"); assert.equal(result.final_count, 1); assert.equal(result.min_expected_count, 2); }); test("debug chat classifier accounts for prompt echo occurrences", () => { assert.equal(minExpectedOccurrences("", "OK", "say OK"), 2); const result = classifyDebugChatResult({ beforeText: "", afterText: "User: say OK", expectedText: "OK", prompt: "say OK", latestExpectedLeaf: "User: say OK", latestFailureLeaf: "", }); assert.equal(result.status, "fail"); assert.equal(result.min_expected_count, 2); assert.equal(result.final_count, 1); }); test("debug chat classifier requires new assistant evidence when message bubbles are available", () => { const prompt = "If all steps succeed, final answer must be E2E_OK:skill"; const result = classifyDebugChatResult({ beforeText: "", afterText: `User: ${prompt}`, expectedText: "E2E_OK:skill", prompt, latestExpectedLeaf: prompt, latestFailureLeaf: "", beforeMessages: [], afterMessages: [{ role: "user", text: prompt }], latestAssistantText: "", }); assert.equal(result.status, "fail"); assert.match(result.reason, /new assistant message/); assert.equal(result.before_assistant_expected_count, 0); assert.equal(result.after_assistant_expected_count, 0); }); test("debug chat classifier passes when expected text appears in a new assistant message", () => { const prompt = "Return only E2E_OK:skill"; const result = classifyDebugChatResult({ beforeText: "", afterText: `User: ${prompt}\nBot: E2E_OK:skill`, expectedText: "E2E_OK:skill", prompt, latestExpectedLeaf: "E2E_OK:skill", latestFailureLeaf: "", beforeMessages: [], afterMessages: [ { role: "user", text: prompt }, { role: "assistant", text: "E2E_OK:skill" }, ], latestAssistantText: "E2E_OK:skill", }); assert.equal(result.status, "pass"); assert.match(result.reason, /new assistant message/); assert.equal(result.before_assistant_expected_count, 0); assert.equal(result.after_assistant_expected_count, 1); }); test("debug chat classifier allows a recovered failure when latest assistant is successful", () => { const expectedText = "E2E_OK:skill"; const result = classifyDebugChatResult({ beforeText: "", afterText: [ "Bot: Agent runner temporarily unavailable", `Bot: recovered and completed ${expectedText}`, ].join("\n"), expectedText, prompt: "Modify the existing skill", latestExpectedLeaf: `recovered and completed ${expectedText}`, latestFailureLeaf: "Agent runner temporarily unavailable", beforeMessages: [], afterMessages: [ { role: "assistant", text: "Agent runner temporarily unavailable" }, { role: "assistant", text: `recovered and completed ${expectedText}` }, ], latestAssistantText: `recovered and completed ${expectedText}`, }); assert.equal(result.status, "pass"); assert.equal(result.before_assistant_expected_count, 0); assert.equal(result.after_assistant_expected_count, 1); }); test("env doctor explains a missing backend listener with a startup hint", async () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-env-doctor-")); try { const skillsDir = join(tmp, "skills"); const repoDir = join(tmp, "LangBot"); const webDir = join(repoDir, "web"); const browserProfile = join(tmp, "browser-profile"); const chromium = join(tmp, "chromium"); mkdirSync(skillsDir, { recursive: true }); mkdirSync(webDir, { recursive: true }); mkdirSync(browserProfile, { recursive: true }); writeFileSync(chromium, ""); writeFileSync( join(skillsDir, ".env"), [ "LANGBOT_BACKEND_URL=http://127.0.0.1:59998", "LANGBOT_FRONTEND_URL=http://127.0.0.1:59998", "LANGBOT_DEV_FRONTEND_URL=http://127.0.0.1:59998", `LANGBOT_REPO=${repoDir}`, `LANGBOT_WEB_REPO=${webDir}`, `LANGBOT_BROWSER_PROFILE=${browserProfile}`, `LANGBOT_CHROMIUM_EXECUTABLE=${chromium}`, "LANGBOT_PROXY_HTTP=http://127.0.0.1:7890", "LANGBOT_PROXY_SOCKS=socks5://127.0.0.1:7890", "LANGBOT_NO_PROXY=localhost,127.0.0.1,::1", ].join("\n"), ); const result = await captureAsync(() => commandEnvDoctor({ root: tmp, args: ["env", "doctor"] })); assert.equal(result.code, 1); assert.match(result.output, /FAIL: LANGBOT_BACKEND_URL: no HTTP service reachable because 127\.0\.0\.1:59998 is not listening/); assert.match(result.output, new RegExp(`WARN: LANGBOT_BACKEND_URL: start backend: cd ${repoDir.replace(/[.*+?^${}()|[\]\\]/g, "\\$&")} && uv run main.py`)); assert.match(result.output, new RegExp(`WARN: LANGBOT_FRONTEND_URL: start frontend: cd ${webDir.replace(/[.*+?^${}()|[\]\\]/g, "\\$&")} && pnpm dev`)); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("env doctor does not require proxy variables", async () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-env-doctor-no-proxy-")); try { const skillsDir = join(tmp, "skills"); const repoDir = join(tmp, "LangBot"); const webDir = join(repoDir, "web"); const browserProfile = join(tmp, "browser-profile"); const chromium = join(tmp, "chromium"); mkdirSync(skillsDir, { recursive: true }); mkdirSync(webDir, { recursive: true }); mkdirSync(browserProfile, { recursive: true }); writeFileSync(chromium, ""); writeFileSync( join(skillsDir, ".env"), [ "LANGBOT_BACKEND_URL=http://127.0.0.1:59997", "LANGBOT_FRONTEND_URL=http://127.0.0.1:59997", "LANGBOT_DEV_FRONTEND_URL=http://127.0.0.1:59997", `LANGBOT_REPO=${repoDir}`, `LANGBOT_WEB_REPO=${webDir}`, `LANGBOT_BROWSER_PROFILE=${browserProfile}`, `LANGBOT_CHROMIUM_EXECUTABLE=${chromium}`, ].join("\n"), ); const result = await captureAsync(() => commandEnvDoctor({ root: tmp, args: ["env", "doctor"] })); assert.equal(result.code, 1); assert.doesNotMatch(result.output, /missing LANGBOT_PROXY|missing LANGBOT_NO_PROXY/); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("env show redacts secret-like values by default", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-env-show-redact-")); try { mkdirSync(join(tmp, "skills"), { recursive: true }); writeFileSync( join(tmp, "skills", ".env"), [ "LANGBOT_FRONTEND_URL=http://127.0.0.1:3000", "LANGBOT_API_KEY=sk-test-secret", "LANGBOT_PROXY_HTTP=http://user:pass@127.0.0.1:7890", ].join("\n"), ); const text = capture(() => commandEnvShow({ root: tmp, args: ["env", "show"] })); assert.equal(text.code, 0); assert.match(text.output, /LANGBOT_API_KEY=\[redacted\]/); assert.match(text.output, /LANGBOT_PROXY_HTTP=http:\/\/\[redacted\]@127\.0\.0\.1:7890/); assert.doesNotMatch(text.output, /sk-test-secret|user:pass/); const json = capture(() => commandEnvShow({ root: tmp, args: ["env", "show", "--json"] })); assert.equal(json.code, 0); const parsed = JSON.parse(json.output); assert.equal(parsed.LANGBOT_API_KEY, "[redacted]"); assert.equal(parsed.LANGBOT_PROXY_HTTP, "http://[redacted]@127.0.0.1:7890"); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("test plan renders agent-browser QA guidance", () => { const result = capture(() => commandTestPlan(ctx(["test", "plan", "pipeline-debug-chat"]))); assert.equal(result.code, 0); assert.match(result.output, /Mode: agent-browser/); assert.match(result.output, /Use browser\/UI interaction as the primary QA path/); assert.match(result.output, /API\/curl\/log checks are diagnostic only/); assert.match(result.output, /## Browser Steps/); assert.match(result.output, /## Success Signals/); assert.match(result.output, /## Required Evidence/); assert.match(result.output, /## Automation Readiness/); assert.match(result.output, /## Fixture Readiness/); assert.match(result.output, /## Manual Readiness/); assert.match(result.output, /backend_log/); }); test("test plan JSON is parseable and includes troubleshooting patterns", () => { const result = capture(() => commandTestPlan(ctx(["test", "plan", "pipeline-debug-chat", "--json"]))); assert.equal(result.code, 0); const plan = JSON.parse(result.output); assert.equal(plan.id, "pipeline-debug-chat"); assert.equal(plan.mode, "agent-browser"); assert.ok(["ready", "missing"].includes(plan.automation_readiness.status)); assert.ok(plan.automation_readiness.defaulted.includes("LANGBOT_E2E_PROMPT")); assert.ok(plan.automation_readiness.defaulted.includes("LANGBOT_E2E_EXPECTED_TEXT")); assert.equal(plan.manual_readiness.status, "manual_check"); assert.ok(plan.success_patterns.includes("Streaming completed")); assert.ok(plan.troubleshooting.some((entry: { id: string }) => entry.id === "plugin-runtime-timeout")); }); test("test plan JSON exposes missing case-specific pipeline readiness", () => { const result = capture(() => commandTestPlan(ctx(["test", "plan", "local-agent-basic-debug-chat", "--json"]))); assert.equal(result.code, 0); const plan = JSON.parse(result.output); assert.equal(plan.env_readiness.status, "ready"); assert.ok(["ready", "missing"].includes(plan.automation_readiness.status)); assert.ok(plan.automation_readiness.pipeline_env_required); assert.ok( plan.automation_readiness.missing.includes("LANGBOT_LOCAL_AGENT_PIPELINE_URL|LANGBOT_LOCAL_AGENT_PIPELINE_NAME") || plan.automation_readiness.configured.some((key: string) => key.startsWith("LANGBOT_LOCAL_AGENT_PIPELINE_")), ); }); test("generic pipeline readiness accepts either URL or name target", () => { const originalUrl = process.env.LANGBOT_PIPELINE_URL; const originalName = process.env.LANGBOT_PIPELINE_NAME; try { withEnv({ LANGBOT_BROWSER_PROFILE: "/tmp/langbot-test-profile", LANGBOT_CHROMIUM_EXECUTABLE: "/tmp/langbot-test-chromium", }, () => { process.env.LANGBOT_PIPELINE_URL = "http://127.0.0.1:3000/home/pipelines?id=only-url"; process.env.LANGBOT_PIPELINE_NAME = ""; const ready = capture(() => commandTestPlan(ctx(["test", "plan", "pipeline-debug-chat", "--json"]))); assert.equal(ready.code, 0); const plan = JSON.parse(ready.output); assert.equal(plan.env_readiness.status, "ready"); assert.equal(plan.automation_readiness.status, "ready"); assert.ok(plan.automation_readiness.required.includes("LANGBOT_PIPELINE_URL|LANGBOT_PIPELINE_NAME")); }); process.env.LANGBOT_PIPELINE_URL = ""; process.env.LANGBOT_PIPELINE_NAME = ""; const missing = capture(() => commandTestPlan(ctx(["test", "plan", "pipeline-debug-chat", "--json"]))); assert.equal(missing.code, 0); const missingPlan = JSON.parse(missing.output); assert.equal(missingPlan.env_readiness.status, "missing"); assert.ok(missingPlan.env_readiness.missing.includes("LANGBOT_PIPELINE_URL|LANGBOT_PIPELINE_NAME")); assert.equal(missingPlan.automation_readiness.status, "missing"); assert.ok(missingPlan.automation_readiness.missing.includes("LANGBOT_PIPELINE_URL|LANGBOT_PIPELINE_NAME")); } finally { if (originalUrl === undefined) delete process.env.LANGBOT_PIPELINE_URL; else process.env.LANGBOT_PIPELINE_URL = originalUrl; if (originalName === undefined) delete process.env.LANGBOT_PIPELINE_NAME; else process.env.LANGBOT_PIPELINE_NAME = originalName; } }); test("test recommend maps AgentRunner ledger changes to focused probes", () => { const result = capture(() => commandTestRecommend(ctx([ "test", "recommend", "--file", "LangBot/src/langbot/pkg/agent/runner/run_ledger_store.py", "--file", "LangBot/tests/unit_tests/agent/test_run_ledger_store.py", "--json", ]))); assert.equal(result.code, 0); const report = JSON.parse(result.output); const ids = report.recommendations.map((item: { id: string }) => item.id); assert.ok(ids.includes("agent-runner-ledger-invariants")); assert.ok(ids.includes("agent-runner-ledger-stress")); assert.ok(ids.includes("agent-runner-ledger-contention")); assert.ok(ids.includes("agent-runner-async-db-readiness")); assert.ok(ids.includes("agent-runner-ledger-concurrency")); assert.ok(report.commands.every((command: string) => !command.startsWith("bin/lbs test run ") || command.endsWith(" --dry-run"))); assert.ok(report.notes.some((note: string) => note.includes("Remove --dry-run"))); }); test("test recommend maps AgentRunner result changes to fixture contract", () => { const result = capture(() => commandTestRecommend(ctx([ "test", "recommend", "--file", "langbot-plugin-sdk/src/langbot_plugin/api/entities/builtin/agent_runner/result.py", "--json", ]))); assert.equal(result.code, 0); const report = JSON.parse(result.output); const ids = report.recommendations.map((item: { id: string }) => item.id); assert.ok(ids.includes("agent-runner-fixture-contract")); assert.ok(ids.includes("agent-runner-behavior-matrix")); assert.ok(!ids.includes("agent-runner-ledger-invariants")); }); test("test recommend maps QA AgentRunner fixture changes to live install", () => { const result = capture(() => commandTestRecommend(ctx([ "test", "recommend", "--file", "langbot-skills/skills/langbot-testing/fixtures/plugins/qa-agent-runner/components/agent_runner/default.py", "--json", ]))); assert.equal(result.code, 0); const report = JSON.parse(result.output); const ids = report.recommendations.map((item: { id: string }) => item.id); assert.ok(ids.includes("agent-runner-fixture-contract")); assert.ok(ids.includes("agent-runner-live-install")); assert.ok(ids.includes("agent-runner-qa-debug-chat")); }); test("test recommend maps QA plugin smoke fixture changes to live install", () => { const result = capture(() => commandTestRecommend(ctx([ "test", "recommend", "--file", "langbot-skills/skills/langbot-testing/fixtures/plugins/qa-plugin-smoke/main.py", "--json", ]))); assert.equal(result.code, 0); const report = JSON.parse(result.output); const ids = report.recommendations.map((item: { id: string }) => item.id); assert.ok(ids.includes("qa-plugin-smoke-live-install")); }); test("test recommend keeps git status paths intact", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-recommend-git-")); const originalRepos = { LANGBOT_REPO: process.env.LANGBOT_REPO, LANGBOT_PLUGIN_SDK_REPO: process.env.LANGBOT_PLUGIN_SDK_REPO, LANGBOT_AGENT_RUNNER_REPO: process.env.LANGBOT_AGENT_RUNNER_REPO, LANGBOT_LOCAL_AGENT_REPO: process.env.LANGBOT_LOCAL_AGENT_REPO, }; try { const repo = join(tmp, "LangBot"); mkdirSync(join(repo, "src", "langbot", "pkg", "agent", "runner"), { recursive: true }); spawnSync("git", ["init"], { cwd: repo }); spawnSync("git", ["config", "user.email", "qa@example.test"], { cwd: repo }); spawnSync("git", ["config", "user.name", "QA"], { cwd: repo }); writeFileSync(join(repo, "README.md"), "test\n"); writeFileSync(join(repo, "src", "langbot", "pkg", "agent", "runner", "run_ledger_store.py"), "# test\n"); spawnSync("git", ["add", "README.md", "src/langbot/pkg/agent/runner/run_ledger_store.py"], { cwd: repo }); spawnSync("git", ["commit", "-m", "init"], { cwd: repo }); writeFileSync(join(repo, "src", "langbot", "pkg", "agent", "runner", "run_ledger_store.py"), "# changed\n"); process.env.LANGBOT_REPO = repo; process.env.LANGBOT_PLUGIN_SDK_REPO = join(tmp, "missing-sdk"); process.env.LANGBOT_AGENT_RUNNER_REPO = join(tmp, "missing-runner"); process.env.LANGBOT_LOCAL_AGENT_REPO = join(tmp, "missing-local"); const result = capture(() => commandTestRecommend({ root, args: ["test", "recommend", "--json"] })); assert.equal(result.code, 0); const report = JSON.parse(result.output); assert.ok(report.changed_files.includes("LangBot/src/langbot/pkg/agent/runner/run_ledger_store.py")); assert.ok(!report.changed_files.some((file: string) => file.includes("LangBot/rc/"))); } finally { for (const [key, value] of Object.entries(originalRepos)) { if (value === undefined) delete process.env[key]; else process.env[key] = value; } rmSync(tmp, { recursive: true, force: true }); } }); test("test start creates a run handoff with a bounded report command", () => { const result = capture(() => commandTestStart(ctx(["test", "start", "pipeline-debug-chat"]))); assert.equal(result.code, 0); assert.match(result.output, /^# Test Start: pipeline-debug-chat/m); assert.match(result.output, /bin\/lbs test plan pipeline-debug-chat/); assert.match(result.output, /bin\/lbs test run pipeline-debug-chat --run-id .+ --output reports\/evidence\/.+pipeline-debug-chat/); assert.match(result.output, /bin\/lbs test report pipeline-debug-chat --since ".+" --console-log reports\/evidence\/.+\/console\.log --evidence-dir reports\/evidence\/.+ --output reports\/.+pipeline-debug-chat\.md/); assert.match(result.output, /Streaming completed/); }); test("test start JSON is parseable for agent orchestration", () => { const result = capture(() => commandTestStart(ctx(["test", "start", "pipeline-debug-chat", "--json"]))); assert.equal(result.code, 0); const start = JSON.parse(result.output); assert.equal(start.case.id, "pipeline-debug-chat"); assert.match(start.run_id, /pipeline-debug-chat$/); assert.match(start.started_at_local, /\d{4}-\d{2}-\d{2}T/); assert.match(start.report_command, /--since/); assert.match(start.result_command_template, /bin\/lbs test result pipeline-debug-chat/); assert.match(start.automation.command, /bin\/lbs test run pipeline-debug-chat/); assert.ok(start.success_patterns.includes("Streaming completed")); assert.ok(start.evidence_required.includes("backend_log")); }); test("test result writes a suite-readable result.json and enforces pass evidence", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-test-result-")); try { const evidenceDir = join(tmp, "pipeline-run"); const ok = capture(() => commandTestResult(ctx([ "test", "result", "pipeline-debug-chat", "--result", "pass", "--reason", "Debug Chat returned OK and logs were clean.", "--evidence-dir", evidenceDir, "--started-at", "2026-05-21T10:30:00.000+08:00", "--evidence", "ui,screenshot,console,backend_log", "--json", ]))); assert.equal(ok.code, 0); const record = JSON.parse(ok.output); assert.equal(record.source, "final"); assert.equal(record.status, "pass"); assert.equal(record.evidence_status, "complete"); assert.deepEqual(record.evidence_missing, []); assert.equal(JSON.parse(readFileSync(join(evidenceDir, "result.json"), "utf8")).case_id, "pipeline-debug-chat"); const missing = captureAll(() => commandTestResult(ctx([ "test", "result", "pipeline-debug-chat", "--result", "pass", "--reason", "Missing backend evidence should not be accepted as pass.", "--evidence-dir", join(tmp, "missing-evidence"), "--evidence", "ui", ]))); assert.equal(missing.code, 1); assert.match(missing.error, /missing required evidence/); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("test run dry-run exposes case automation script and evidence paths", () => { const result = capture(() => commandTestRun(ctx([ "test", "run", "pipeline-debug-chat", "--run-id", "run-123", "--output", "reports/evidence/run-123", "--dry-run", ]))); assert.equal(result.code, 0); assert.match(result.output, /^# Test Automation: pipeline-debug-chat/m); assert.match(result.output, /scripts\/e2e\/pipeline-debug-chat\.mjs/); assert.match(result.output, /console_log: reports\/evidence\/run-123\/console\.log/); assert.match(result.output, /automation_result_json: reports\/evidence\/run-123\/automation-result\.json/); assert.match(result.output, /result_json: reports\/evidence\/run-123\/result\.json/); assert.match(result.output, /LANGBOT_PIPELINE_URL/); }); test("test run dry-run JSON is parseable for automation orchestration", () => { const result = capture(() => commandTestRun(ctx([ "test", "run", "webui-login-state", "--run-id", "login-run", "--dry-run", "--json", ]))); assert.equal(result.code, 0); const run = JSON.parse(result.output); assert.equal(run.case.id, "webui-login-state"); assert.equal(run.run_id, "login-run"); assert.equal(run.automation.script, "scripts/e2e/webui-login-state.mjs"); assert.equal(run.automation.exists, true); assert.match(run.automation.automation_result_json, /automation-result\.json$/); assert.match(run.automation.result_json, /result\.json$/); assert.match(run.automation.report_command, /--console-log/); }); test("test run JSON executes automation unless dry-run is explicit", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-run-json-exec-")); try { const skillDir = join(tmp, "skills", "langbot-testing"); const casesDir = join(skillDir, "cases"); const scriptsDir = join(tmp, "scripts"); mkdirSync(casesDir, { recursive: true }); mkdirSync(scriptsDir, { recursive: true }); writeFileSync(join(skillDir, "SKILL.md"), "---\nname: langbot-testing\ndescription: Testing.\n---\n\n# Testing\n"); writeFileSync(join(tmp, "skills", ".env"), ""); writeFileSync( join(casesDir, "json-exec.yaml"), [ "id: json-exec", "title: JSON Exec", "mode: probe", "area: qa", "type: smoke", "priority: p2", "risk: low", "ci_eligible: true", "automation: scripts/write-marker.mjs", ].join("\n"), ); writeFileSync( join(scriptsDir, "write-marker.mjs"), [ "import { writeFileSync } from 'node:fs';", "import { join } from 'node:path';", "writeFileSync(join(process.env.LBS_ROOT, 'json-ran.txt'), 'yes');", ].join("\n"), ); const result = capture(() => commandTestRun({ root: tmp, args: ["test", "run", "json-exec", "--run-id", "json-run", "--json"], })); assert.equal(result.code, 0); assert.equal(readFileSync(join(tmp, "json-ran.txt"), "utf8"), "yes"); const payload = JSON.parse(result.output); assert.equal(payload.exit_status, 0); assert.equal(payload.automation_execution.status, "ok"); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("test run lets explicit environment override automation defaults", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-run-env-override-")); const originalPatch = process.env.LANGBOT_E2E_RUNNER_CONFIG_PATCH_JSON; try { const skillDir = join(tmp, "skills", "langbot-testing"); const casesDir = join(skillDir, "cases"); const scriptsDir = join(tmp, "scripts"); mkdirSync(casesDir, { recursive: true }); mkdirSync(scriptsDir, { recursive: true }); writeFileSync(join(skillDir, "SKILL.md"), "---\nname: langbot-testing\ndescription: Testing.\n---\n\n# Testing\n"); writeFileSync(join(tmp, "skills", ".env"), ""); writeFileSync( join(casesDir, "env-override.yaml"), [ "id: env-override", "title: Env Override", "mode: agent-browser", "area: pipeline", "type: smoke", "priority: p2", "risk: low", "ci_eligible: false", "automation: scripts/write-env.mjs", "automation_runner_config_patch_json: '{\"source\":\"default\"}'", ].join("\n"), ); writeFileSync( join(scriptsDir, "write-env.mjs"), [ "import { writeFileSync } from 'node:fs';", "import { join } from 'node:path';", "writeFileSync(join(process.env.LBS_ROOT, 'env-out.json'), JSON.stringify({", " patch: process.env.LANGBOT_E2E_RUNNER_CONFIG_PATCH_JSON,", "}));", ].join("\n"), ); process.env.LANGBOT_E2E_RUNNER_CONFIG_PATCH_JSON = '{"source":"explicit"}'; const result = capture(() => commandTestRun({ root: tmp, args: ["test", "run", "env-override", "--run-id", "env-run"], })); assert.equal(result.code, 0); const observed = JSON.parse(readFileSync(join(tmp, "env-out.json"), "utf8")); assert.equal(observed.patch, '{"source":"explicit"}'); } finally { if (originalPatch === undefined) delete process.env.LANGBOT_E2E_RUNNER_CONFIG_PATCH_JSON; else process.env.LANGBOT_E2E_RUNNER_CONFIG_PATCH_JSON = originalPatch; rmSync(tmp, { recursive: true, force: true }); } }); test("test run expands env references in automation defaults", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-run-env-expand-")); try { const skillDir = join(tmp, "skills", "langbot-testing"); const casesDir = join(skillDir, "cases"); const scriptsDir = join(tmp, "scripts"); mkdirSync(casesDir, { recursive: true }); mkdirSync(scriptsDir, { recursive: true }); writeFileSync(join(skillDir, "SKILL.md"), "---\nname: langbot-testing\ndescription: Testing.\n---\n\n# Testing\n"); writeFileSync(join(tmp, "skills", ".env"), "QA_KB_UUID=kb-from-env\nQA_MODEL_UUID=model-from-env\n"); writeFileSync( join(casesDir, "env-expand.yaml"), [ "id: env-expand", "title: Env Expand", "mode: agent-browser", "area: pipeline", "type: smoke", "priority: p2", "risk: low", "ci_eligible: false", "automation: scripts/write-expanded-env.mjs", "automation_runner_config_patch_json: '{\"knowledge-bases\":[\"${QA_KB_UUID}\"],\"model\":{\"primary\":\"${QA_MODEL_UUID}\"}}'", ].join("\n"), ); writeFileSync( join(scriptsDir, "write-expanded-env.mjs"), [ "import { writeFileSync } from 'node:fs';", "import { join } from 'node:path';", "writeFileSync(join(process.env.LBS_ROOT, 'expanded-env-out.json'), JSON.stringify({", " patch: process.env.LANGBOT_E2E_RUNNER_CONFIG_PATCH_JSON,", "}));", ].join("\n"), ); const dryRun = capture(() => commandTestRun({ root: tmp, args: ["test", "run", "env-expand", "--run-id", "env-expand-dry", "--dry-run", "--json"], })); assert.equal(dryRun.code, 0); const plan = JSON.parse(dryRun.output); assert.equal( plan.automation.env_defaults.LANGBOT_E2E_RUNNER_CONFIG_PATCH_JSON, '{"knowledge-bases":["kb-from-env"],"model":{"primary":"model-from-env"}}', ); const run = capture(() => commandTestRun({ root: tmp, args: ["test", "run", "env-expand", "--run-id", "env-expand-run"], })); assert.equal(run.code, 0); const observed = JSON.parse(readFileSync(join(tmp, "expanded-env-out.json"), "utf8")); assert.equal(observed.patch, '{"knowledge-bases":["kb-from-env"],"model":{"primary":"model-from-env"}}'); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("test run setup automation isolates evidence and reloads env", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-run-setup-automation-")); try { const skillDir = join(tmp, "skills", "langbot-testing"); const casesDir = join(skillDir, "cases"); const scriptsDir = join(tmp, "scripts"); mkdirSync(casesDir, { recursive: true }); mkdirSync(scriptsDir, { recursive: true }); writeFileSync(join(skillDir, "SKILL.md"), "---\nname: langbot-testing\ndescription: Testing.\n---\n\n# Testing\n"); writeFileSync(join(tmp, "skills", ".env"), "SETUP_VALUE=\n"); writeFileSync( join(casesDir, "setup-main.yaml"), [ "id: setup-main", "title: Setup Main", "mode: agent-browser", "area: pipeline", "type: smoke", "priority: p2", "risk: low", "ci_eligible: false", "env:", " - SETUP_VALUE", "setup_automation:", " - \"node:scripts/write-setup-env.mjs --write-env\"", "setup_provides_env:", " - SETUP_VALUE", "automation: scripts/read-setup-env.mjs", ].join("\n"), ); writeFileSync( join(casesDir, "setup-env-issue.yaml"), [ "id: setup-env-issue", "title: Setup Env Issue", "mode: agent-browser", "area: pipeline", "type: smoke", "priority: p2", "risk: low", "ci_eligible: false", "setup_automation:", " - \"node:scripts/write-setup-env-issue.mjs\"", "automation: scripts/read-setup-env.mjs", ].join("\n"), ); writeFileSync( join(casesDir, "setup-fail-after-pass.yaml"), [ "id: setup-fail-after-pass", "title: Setup Fail After Pass", "mode: agent-browser", "area: pipeline", "type: smoke", "priority: p2", "risk: low", "ci_eligible: false", "setup_automation:", " - \"node:scripts/write-setup-pass-then-fail.mjs\"", "automation: scripts/read-setup-env.mjs", ].join("\n"), ); writeFileSync( join(scriptsDir, "write-setup-env.mjs"), [ "import { mkdirSync, writeFileSync } from 'node:fs';", "import { dirname, join } from 'node:path';", "const local = join(process.env.LBS_ROOT, 'skills', '.env.local');", "writeFileSync(local, 'SETUP_VALUE=from-setup\\n');", "mkdirSync(process.env.LBS_EVIDENCE_DIR, { recursive: true });", "writeFileSync(join(process.env.LBS_EVIDENCE_DIR, 'automation-result.json'), JSON.stringify({ status: 'pass', stage: 'setup' }));", "writeFileSync(join(process.env.LBS_EVIDENCE_DIR, 'result.json'), JSON.stringify({ status: 'pass', stage: 'setup' }));", "writeFileSync(join(dirname(process.env.LBS_EVIDENCE_DIR), 'setup-ran.txt'), 'yes');", ].join("\n"), ); writeFileSync( join(scriptsDir, "read-setup-env.mjs"), [ "import { mkdirSync, writeFileSync } from 'node:fs';", "import { join } from 'node:path';", "mkdirSync(process.env.LBS_EVIDENCE_DIR, { recursive: true });", "writeFileSync(join(process.env.LBS_ROOT, 'main-observed.json'), JSON.stringify({ value: process.env.SETUP_VALUE }));", "writeFileSync(join(process.env.LBS_EVIDENCE_DIR, 'automation-result.json'), JSON.stringify({ status: 'pass', stage: 'main' }));", "writeFileSync(join(process.env.LBS_EVIDENCE_DIR, 'result.json'), JSON.stringify({ status: 'pass', stage: 'main' }));", "if (process.env.SETUP_VALUE !== 'from-setup') process.exit(1);", ].join("\n"), ); writeFileSync( join(scriptsDir, "write-setup-env-issue.mjs"), [ "import { mkdirSync, writeFileSync } from 'node:fs';", "import { join } from 'node:path';", "mkdirSync(process.env.LBS_EVIDENCE_DIR, { recursive: true });", "writeFileSync(join(process.env.LBS_EVIDENCE_DIR, 'automation-result.json'), JSON.stringify({ status: 'env_issue', reason: 'setup env missing' }));", "process.exit(2);", ].join("\n"), ); writeFileSync( join(scriptsDir, "write-setup-pass-then-fail.mjs"), [ "import { mkdirSync, writeFileSync } from 'node:fs';", "import { join } from 'node:path';", "mkdirSync(process.env.LBS_EVIDENCE_DIR, { recursive: true });", "writeFileSync(join(process.env.LBS_EVIDENCE_DIR, 'automation-result.json'), JSON.stringify({ status: 'pass', reason: 'stale pass before crash' }));", "process.exit(1);", ].join("\n"), ); const dryRun = capture(() => commandTestRun({ root: tmp, args: ["test", "run", "setup-main", "--run-id", "setup-run", "--output", join(tmp, "evidence"), "--dry-run", "--json"], })); assert.equal(dryRun.code, 0); const plan = JSON.parse(dryRun.output); assert.equal(plan.setup_automation.length, 1); assert.match(plan.setup_automation[0].evidence_dir, /setup\/01-write-setup-env$/); assert.match(plan.setup_automation[0].command, /^node scripts\/write-setup-env\.mjs --write-env$/); assert.equal(plan.setup_automation[0].dry_run_command, ""); assert.equal(existsSync(join(tmp, "skills", ".env.local")), false); const run = capture(() => commandTestRun({ root: tmp, args: ["test", "run", "setup-main", "--run-id", "setup-run", "--output", join(tmp, "evidence")], })); assert.equal(run.code, 0); const observed = JSON.parse(readFileSync(join(tmp, "main-observed.json"), "utf8")); assert.equal(observed.value, "from-setup"); const setupResult = JSON.parse(readFileSync(join(tmp, "evidence", "setup", "01-write-setup-env", "automation-result.json"), "utf8")); const mainResult = JSON.parse(readFileSync(join(tmp, "evidence", "automation-result.json"), "utf8")); assert.equal(setupResult.stage, "setup"); assert.equal(mainResult.stage, "main"); const envIssue = capture(() => commandTestRun({ root: tmp, args: ["test", "run", "setup-env-issue", "--run-id", "setup-env-issue-run", "--output", join(tmp, "evidence-env-issue")], })); assert.equal(envIssue.code, 2); const parentResult = JSON.parse(readFileSync(join(tmp, "evidence-env-issue", "automation-result.json"), "utf8")); assert.equal(parentResult.status, "env_issue"); assert.equal(parentResult.reason, "setup env missing"); const failAfterPass = capture(() => commandTestRun({ root: tmp, args: ["test", "run", "setup-fail-after-pass", "--run-id", "setup-fail-after-pass-run", "--output", join(tmp, "evidence-fail-after-pass")], })); assert.equal(failAfterPass.code, 1); const failAfterPassResult = JSON.parse(readFileSync(join(tmp, "evidence-fail-after-pass", "automation-result.json"), "utf8")); assert.equal(failAfterPassResult.status, "fail"); assert.equal(failAfterPassResult.reason, "stale pass before crash"); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("test run setup automation can execute another case outside this source repo", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-run-setup-case-")); try { const skillDir = join(tmp, "skills", "langbot-testing"); const casesDir = join(skillDir, "cases"); const scriptsDir = join(tmp, "scripts"); mkdirSync(casesDir, { recursive: true }); mkdirSync(scriptsDir, { recursive: true }); writeFileSync(join(skillDir, "SKILL.md"), "---\nname: langbot-testing\ndescription: Testing.\n---\n\n# Testing\n"); writeFileSync(join(tmp, "skills", ".env"), "SETUP_VALUE=\n"); writeFileSync( join(casesDir, "setup-child.yaml"), [ "id: setup-child", "title: Setup Child", "mode: probe", "area: qa", "type: smoke", "priority: p2", "risk: low", "ci_eligible: true", "automation: scripts/write-child-env.mjs", ].join("\n"), ); writeFileSync( join(casesDir, "setup-parent.yaml"), [ "id: setup-parent", "title: Setup Parent", "mode: probe", "area: qa", "type: smoke", "priority: p2", "risk: low", "ci_eligible: true", "setup_automation:", " - \"case:setup-child\"", "setup_provides_env:", " - SETUP_VALUE", "automation: scripts/read-child-env.mjs", ].join("\n"), ); writeFileSync( join(scriptsDir, "write-child-env.mjs"), [ "import { mkdirSync, writeFileSync } from 'node:fs';", "import { join } from 'node:path';", "writeFileSync(join(process.env.LBS_ROOT, 'skills', '.env.local'), 'SETUP_VALUE=from-child\\n');", "mkdirSync(process.env.LBS_EVIDENCE_DIR, { recursive: true });", "writeFileSync(join(process.env.LBS_EVIDENCE_DIR, 'automation-result.json'), JSON.stringify({ status: 'pass' }));", "writeFileSync(join(process.env.LBS_EVIDENCE_DIR, 'result.json'), JSON.stringify({ status: 'pass' }));", ].join("\n"), ); writeFileSync( join(scriptsDir, "read-child-env.mjs"), [ "import { mkdirSync, writeFileSync } from 'node:fs';", "import { join } from 'node:path';", "mkdirSync(process.env.LBS_EVIDENCE_DIR, { recursive: true });", "writeFileSync(join(process.env.LBS_EVIDENCE_DIR, 'automation-result.json'), JSON.stringify({ status: 'pass', value: process.env.SETUP_VALUE }));", "writeFileSync(join(process.env.LBS_EVIDENCE_DIR, 'result.json'), JSON.stringify({ status: 'pass', value: process.env.SETUP_VALUE }));", "if (process.env.SETUP_VALUE !== 'from-child') process.exit(1);", ].join("\n"), ); const run = capture(() => commandTestRun({ root: tmp, args: ["test", "run", "setup-parent", "--run-id", "setup-parent-run", "--output", join(tmp, "evidence")], })); assert.equal(run.code, 0); assert.ok(existsSync(join(tmp, "evidence", "setup", "01-setup-child", "result.json"))); const result = JSON.parse(readFileSync(join(tmp, "evidence", "automation-result.json"), "utf8")); assert.equal(result.value, "from-child"); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("test run automation inherits parent process environment", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-run-env-inherit-")); try { const skillDir = join(tmp, "skills", "langbot-testing"); const casesDir = join(skillDir, "cases"); const scriptsDir = join(tmp, "scripts"); mkdirSync(casesDir, { recursive: true }); mkdirSync(scriptsDir, { recursive: true }); writeFileSync(join(skillDir, "SKILL.md"), "---\nname: langbot-testing\ndescription: Testing.\n---\n\n# Testing\n"); writeFileSync(join(tmp, "skills", ".env"), ""); writeFileSync( join(casesDir, "env-inherit.yaml"), [ "id: env-inherit", "title: Env Inherit", "mode: probe", "area: qa", "type: smoke", "priority: p2", "risk: low", "ci_eligible: true", "automation: scripts/read-path.mjs", ].join("\n"), ); writeFileSync( join(scriptsDir, "read-path.mjs"), [ "import { mkdirSync, writeFileSync } from 'node:fs';", "import { join } from 'node:path';", "mkdirSync(process.env.LBS_EVIDENCE_DIR, { recursive: true });", "writeFileSync(join(process.env.LBS_EVIDENCE_DIR, 'automation-result.json'), JSON.stringify({ status: process.env.PATH ? 'pass' : 'fail' }));", "process.exit(process.env.PATH ? 0 : 1);", ].join("\n"), ); const run = capture(() => commandTestRun({ root: tmp, args: ["test", "run", "env-inherit", "--run-id", "env-inherit-run", "--output", join(tmp, "evidence")], })); assert.equal(run.code, 0); const result = JSON.parse(readFileSync(join(tmp, "evidence", "automation-result.json"), "utf8")); assert.equal(result.status, "pass"); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("test run dry-run marks missing setup case targets", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-run-setup-missing-case-")); try { const skillDir = join(tmp, "skills", "langbot-testing"); const casesDir = join(skillDir, "cases"); const scriptsDir = join(tmp, "scripts"); mkdirSync(casesDir, { recursive: true }); mkdirSync(scriptsDir, { recursive: true }); writeFileSync(join(skillDir, "SKILL.md"), "---\nname: langbot-testing\ndescription: Testing.\n---\n\n# Testing\n"); writeFileSync(join(tmp, "skills", ".env"), ""); writeFileSync( join(casesDir, "setup-parent.yaml"), [ "id: setup-parent", "title: Setup Parent", "mode: probe", "area: qa", "type: smoke", "priority: p2", "risk: low", "ci_eligible: true", "setup_automation:", " - \"case:missing-child\"", "automation: scripts/pass.mjs", ].join("\n"), ); writeFileSync(join(scriptsDir, "pass.mjs"), "process.exit(0);\n"); const result = capture(() => commandTestRun({ root: tmp, args: ["test", "run", "setup-parent", "--dry-run", "--json"], })); assert.equal(result.code, 0); const run = JSON.parse(result.output); assert.equal(run.setup_automation[0].entry, "case:missing-child"); assert.doesNotMatch(run.setup_automation[0].command, /--dry-run/); assert.match(run.setup_automation[0].dry_run_command, /--dry-run/); assert.equal(run.setup_automation[0].exists, false); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("local-agent effective prompt case has runnable automation defaults", () => { const result = capture(() => commandTestRun(ctx([ "test", "run", "local-agent-effective-prompt-debug-chat", "--run-id", "effective-run", "--dry-run", "--json", ]))); assert.equal(result.code, 0); const run = JSON.parse(result.output); assert.equal(run.automation.script, "scripts/e2e/pipeline-debug-chat.mjs"); assert.equal(run.automation.env_defaults.LANGBOT_E2E_PROMPT, "qa-effective-prompt"); assert.equal(run.automation.env_defaults.LANGBOT_E2E_EXPECTED_TEXT, "PROMPT_PREPROCESS_OK"); assert.equal(run.automation.env_defaults.LANGBOT_E2E_RESPONSE_TIMEOUT_MS, "180000"); assert.equal(run.automation.pipeline_env_required, true); assert.ok(run.automation.env_aliases.some((alias: { target: string; source: string }) => ( alias.target === "LANGBOT_E2E_PIPELINE_URL" && alias.source === "LANGBOT_LOCAL_AGENT_PIPELINE_URL" ))); }); test("local-agent basic case can setup the local-agent pipeline env", () => { withEnv({ LANGBOT_BROWSER_PROFILE: "/tmp/langbot-test-profile", LANGBOT_CHROMIUM_EXECUTABLE: "/tmp/langbot-test-chromium", }, () => { const result = capture(() => commandTestRun(ctx([ "test", "run", "local-agent-basic-debug-chat", "--dry-run", "--json", ]))); assert.equal(result.code, 0); const run = JSON.parse(result.output); assert.deepEqual(run.setup_automation.map((item: { entry: string }) => item.entry), [ "node:scripts/e2e/ensure-local-agent-pipeline.mjs --write-env", ]); const planResult = capture(() => commandTestPlan(ctx(["test", "plan", "local-agent-basic-debug-chat", "--json"]))); assert.equal(planResult.code, 0); const plan = JSON.parse(planResult.output); assert.deepEqual(plan.setup_provides_env, [ "LANGBOT_LOCAL_AGENT_PIPELINE_URL", "LANGBOT_LOCAL_AGENT_PIPELINE_NAME", ]); assert.equal(plan.automation_readiness.status, "ready"); }); }); test("local-agent nonstreaming case disables stream output through automation defaults", () => { const result = capture(() => commandTestRun(ctx([ "test", "run", "local-agent-nonstreaming-debug-chat", "--dry-run", "--json", ]))); assert.equal(result.code, 0); const run = JSON.parse(result.output); assert.equal(run.automation.script, "scripts/e2e/pipeline-debug-chat.mjs"); assert.equal(run.automation.env_defaults.LANGBOT_E2E_PROMPT, "Reply only NONSTREAM_OK."); assert.equal(run.automation.env_defaults.LANGBOT_E2E_EXPECTED_TEXT, "NONSTREAM_OK"); assert.equal(run.automation.env_defaults.LANGBOT_E2E_STREAM_OUTPUT, "0"); assert.equal(run.automation.pipeline_env_required, true); }); test("local-agent multimodal case exposes image fixture automation defaults", () => { const result = capture(() => commandTestRun(ctx([ "test", "run", "local-agent-multimodal-debug-chat", "--dry-run", "--json", ]))); assert.equal(result.code, 0); const run = JSON.parse(result.output); assert.equal(run.automation.script, "scripts/e2e/pipeline-debug-chat.mjs"); assert.equal(run.automation.env_defaults.LANGBOT_E2E_EXPECTED_TEXT, "IMAGE_OK"); assert.match(run.automation.env_defaults.LANGBOT_E2E_IMAGE_BASE64_PATH, /red-square\.png\.base64$/); assert.equal(run.automation.pipeline_env_required, true); }); test("MCP stdio case passes case-specific failure signals to automation defaults", () => { const result = capture(() => commandTestRun(ctx([ "test", "run", "mcp-stdio-tool-call", "--dry-run", "--json", ]))); assert.equal(result.code, 0); const run = JSON.parse(result.output); assert.match(run.automation.env_defaults.LANGBOT_E2E_FAILURE_SIGNALS, /qa-plugin-smoke:mcp-ok-local-agent/); assert.match(run.automation.env_defaults.LANGBOT_E2E_FAILURE_SIGNALS, /model_not_found/); }); test("MCP stdio tool-call case setups pipeline and registered MCP server", () => { const result = capture(() => commandTestRun(ctx([ "test", "run", "mcp-stdio-tool-call", "--dry-run", "--json", ]))); assert.equal(result.code, 0); const run = JSON.parse(result.output); assert.deepEqual(run.setup_automation.map((item: { entry: string }) => item.entry), [ "node:scripts/e2e/ensure-local-agent-pipeline.mjs --write-env", "case:mcp-stdio-register", ]); const planResult = capture(() => commandTestPlan(ctx(["test", "plan", "mcp-stdio-tool-call", "--json"]))); assert.equal(planResult.code, 0); const plan = JSON.parse(planResult.output); assert.deepEqual(plan.setup_provides_env, [ "LANGBOT_LOCAL_AGENT_PIPELINE_URL", "LANGBOT_LOCAL_AGENT_PIPELINE_NAME", ]); assert.ok(!plan.preconditions.some((item: string) => item.includes("points to the local-agent pipeline"))); }); test("generic pipeline automation can still use the shared pipeline env", () => { const result = capture(() => commandTestRun(ctx([ "test", "run", "pipeline-debug-chat", "--dry-run", "--json", ]))); assert.equal(result.code, 0); const run = JSON.parse(result.output); assert.equal(run.automation.pipeline_env_required, false); assert.deepEqual(run.automation.env_aliases, []); assert.ok(run.automation.required_env.includes("LANGBOT_PIPELINE_URL|LANGBOT_PIPELINE_NAME")); }); test("AgentRunner live install case exposes package automation defaults", () => { const result = capture(() => commandTestRun(ctx([ "test", "run", "agent-runner-live-install", "--dry-run", "--json", ]))); assert.equal(result.code, 0); const run = JSON.parse(result.output); assert.equal( run.automation.env_defaults.LANGBOT_E2E_PLUGIN_PACKAGE, "skills/langbot-testing/fixtures/plugins/qa-agent-runner/dist/qa-agent-runner-0.1.0.lbpkg", ); assert.equal(run.automation.env_defaults.LANGBOT_E2E_EXPECTED_PLUGIN_ID, "qa/agent-runner"); assert.equal(run.automation.env_defaults.LANGBOT_E2E_EXPECTED_RUNNER_ID, "plugin:qa/agent-runner/default"); }); test("QA plugin live install checks the fixture package before installed state", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-install-qa-plugin-")); try { const result = spawnSync( process.execPath, [join(root, "scripts/e2e/install-qa-plugin-smoke.mjs")], { cwd: root, env: { ...process.env, LBS_RUN_ID: "missing-package", LBS_EVIDENCE_DIR: join(tmp, "evidence"), LANGBOT_BACKEND_URL: "http://127.0.0.1:59999", LANGBOT_E2E_LOGIN_USER: "qa@example.test", LANGBOT_E2E_PLUGIN_PACKAGE: join(tmp, "missing.lbpkg"), }, encoding: "utf8", }, ); assert.equal(result.status, 1); const output = JSON.parse(result.stdout); assert.match(output.reason, /missing\.lbpkg/); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("AgentRunner QA Debug Chat case uses dedicated pipeline env", () => { const result = capture(() => commandTestRun(ctx([ "test", "run", "agent-runner-qa-debug-chat", "--dry-run", "--json", ]))); assert.equal(result.code, 0); const run = JSON.parse(result.output); assert.equal(run.automation.script, "scripts/e2e/pipeline-debug-chat.mjs"); assert.equal(run.automation.pipeline_env_required, true); assert.equal(run.automation.env_defaults.LANGBOT_E2E_EXPECTED_RUNNER_ID, "plugin:qa/agent-runner/default"); assert.deepEqual( run.setup_automation.map((item: { entry: string }) => item.entry), [ "case:agent-runner-live-install", "node:scripts/e2e/ensure-qa-agent-runner-pipeline.mjs --write-env", ], ); assert.ok(run.automation.env_aliases.some((alias: { target: string; source: string }) => ( alias.target === "LANGBOT_E2E_PIPELINE_URL" && alias.source === "LANGBOT_QA_AGENT_RUNNER_PIPELINE_URL" ))); }); test("AgentRunner QA Debug Chat setup automation removes manual readiness", () => { withEnv({ LANGBOT_BROWSER_PROFILE: "/tmp/langbot-test-profile", LANGBOT_CHROMIUM_EXECUTABLE: "/tmp/langbot-test-chromium", }, () => { const planResult = capture(() => commandTestPlan(ctx(["test", "plan", "agent-runner-qa-debug-chat", "--json"]))); assert.equal(planResult.code, 0); const plan = JSON.parse(planResult.output); assert.equal(plan.manual_readiness.status, "not_required"); assert.deepEqual(plan.setup_provides_env, [ "LANGBOT_QA_AGENT_RUNNER_PIPELINE_URL", "LANGBOT_QA_AGENT_RUNNER_PIPELINE_NAME", ]); assert.equal(plan.automation_readiness.status, "ready"); const suiteResult = capture(() => commandSuitePlan(ctx(["suite", "plan", "agent-runner-release-gate", "--json"]))); assert.equal(suiteResult.code, 0); const suite = JSON.parse(suiteResult.output); assert.ok(!suite.readiness.manual_check_cases.includes("agent-runner-qa-debug-chat")); }); }); test("ACP AgentRunner Debug Chat case setups the ACP pipeline env", () => { const result = capture(() => commandTestRun(ctx([ "test", "run", "acp-agent-runner-debug-chat", "--dry-run", "--json", ]))); assert.equal(result.code, 0); const run = JSON.parse(result.output); assert.deepEqual(run.setup_automation.map((item: { entry: string }) => item.entry), [ "node:scripts/e2e/ensure-acp-agent-runner-pipeline.mjs --write-env", ]); assert.ok(run.automation.env_aliases.some((alias: { target: string; source: string }) => ( alias.target === "LANGBOT_E2E_PIPELINE_URL" && alias.source === "LANGBOT_ACP_AGENT_RUNNER_PIPELINE_URL" ))); const planResult = capture(() => commandTestPlan(ctx(["test", "plan", "acp-agent-runner-debug-chat", "--json"]))); assert.equal(planResult.code, 0); const plan = JSON.parse(planResult.output); assert.deepEqual(plan.setup_provides_env, [ "LANGBOT_ACP_AGENT_RUNNER_PIPELINE_URL", "LANGBOT_ACP_AGENT_RUNNER_PIPELINE_NAME", ]); assert.ok(!plan.preconditions.some((item: string) => item.includes("pipeline AI runner"))); }); test("local-agent plugin cases setup the QA plugin smoke fixture", () => { const result = capture(() => commandTestRun(ctx([ "test", "run", "local-agent-plugin-tool-call-debug-chat", "--dry-run", "--json", ]))); assert.equal(result.code, 0); const run = JSON.parse(result.output); assert.deepEqual(run.setup_automation.map((item: { entry: string }) => item.entry), [ "node:scripts/e2e/ensure-local-agent-pipeline.mjs --write-env", "case:qa-plugin-smoke-live-install", ]); }); test("local-agent RAG case only requires the KB fixture env", () => { const result = capture(() => commandTestRun(ctx([ "test", "run", "local-agent-rag-debug-chat", "--dry-run", "--json", ]))); assert.equal(result.code, 0); const run = JSON.parse(result.output); assert.ok(run.automation.required_env.includes("LANGBOT_LOCAL_AGENT_RAG_KB_UUID")); assert.ok(!run.automation.required_env.includes("LANGBOT_LOCAL_AGENT_RAG_TEXT_MODEL_UUID")); assert.equal( run.automation.env_defaults.LANGBOT_E2E_RUNNER_CONFIG_PATCH_JSON, JSON.stringify({ "knowledge-bases": [ loadEnv(root).LANGBOT_LOCAL_AGENT_RAG_KB_UUID || "", ], }), ); }); test("LangRAG retrieve readiness requires a KB UUID alternative", () => { const result = capture(() => commandTestPlan(ctx(["test", "plan", "langrag-kb-retrieve", "--json"]))); assert.equal(result.code, 0); const plan = JSON.parse(result.output); assert.ok(plan.automation_readiness.required.includes("LANGBOT_LOCAL_AGENT_RAG_KB_UUID|LANGBOT_RAG_KB_UUID")); }); test("local-agent RAG multimodal case setups the KB fixture env", () => { const result = capture(() => commandTestRun(ctx([ "test", "run", "local-agent-rag-multimodal-debug-chat", "--dry-run", "--json", ]))); assert.equal(result.code, 0); const run = JSON.parse(result.output); assert.ok(run.automation.required_env.includes("LANGBOT_LOCAL_AGENT_RAG_KB_UUID")); assert.equal( run.automation.env_defaults.LANGBOT_E2E_RUNNER_CONFIG_PATCH_JSON, JSON.stringify({ "knowledge-bases": [ loadEnv(root).LANGBOT_LOCAL_AGENT_RAG_KB_UUID || "", ], }), ); assert.deepEqual(run.setup_automation.map((item: { entry: string }) => item.entry), [ "node:scripts/e2e/ensure-local-agent-pipeline.mjs --write-env", "node:scripts/e2e/ensure-langrag-sentinel-kb.mjs --write-env", ]); }); test("test report renders a reusable evidence template", () => { const result = capture(() => commandTestReport(ctx(["test", "report", "pipeline-debug-chat", "--no-auto-log"]))); assert.equal(result.code, 0); assert.match(result.output, /^# Test Report: pipeline-debug-chat/m); assert.match(result.output, /result: pass \| fail \| blocked \| env_issue \| flaky/); assert.match(result.output, /## Log Guard/); assert.match(result.output, /## Automation Result/); assert.match(result.output, /## Required Evidence/); assert.match(result.output, /no log files provided/); }); test("validate rejects dangling case references and missing automation scripts", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-validate-strict-")); try { const schemasDir = join(tmp, "schemas"); const skillsDir = join(tmp, "skills"); const envSetupDir = join(skillsDir, "langbot-env-setup"); const testingDir = join(skillsDir, "langbot-testing"); mkdirSync(schemasDir, { recursive: true }); mkdirSync(join(testingDir, "cases"), { recursive: true }); mkdirSync(join(testingDir, "fixtures"), { recursive: true }); mkdirSync(join(testingDir, "suites"), { recursive: true }); mkdirSync(envSetupDir, { recursive: true }); for (const schemaName of ["case.schema.json", "suite.schema.json", "troubleshooting.schema.json", "skill-index.schema.json"]) { writeFileSync(join(schemasDir, schemaName), "{}"); } writeFileSync(join(envSetupDir, "SKILL.md"), "---\nname: langbot-env-setup\ndescription: Env setup.\n---\n\n# Env\n"); writeFileSync(join(testingDir, "SKILL.md"), "---\nname: langbot-testing\ndescription: Testing.\n---\n\n# Testing\n"); writeFileSync( join(skillsDir, ".env"), [ "LANGBOT_FRONTEND_URL=http://127.0.0.1:3000", "LANGBOT_BACKEND_URL=http://127.0.0.1:5300", "LANGBOT_DEV_FRONTEND_URL=http://127.0.0.1:3000", "LANGBOT_REPO=/tmp/langbot", "LANGBOT_WEB_REPO=/tmp/langbot/web", "LANGBOT_BROWSER_PROFILE=/tmp/browser", "LANGBOT_CHROMIUM_EXECUTABLE=/tmp/chromium", "LANGBOT_PROXY_HTTP=http://127.0.0.1:7890", "LANGBOT_PROXY_SOCKS=socks5://127.0.0.1:7890", "LANGBOT_NO_PROXY=localhost,127.0.0.1,::1", ].join("\n"), ); writeFileSync( join(testingDir, "cases", "bad.yaml"), [ "id: bad", "title: Bad", "mode: agent-browser", "area: pipeline", "type: smoke", "priority: p9", "risk: medium", "ci_eligible: false", "tags:", " - smoke", "skills:", " - langbot-env-setup", " - langbot-testing", "env:", " - LANGBOT_FRONTEND_URL", "automation: scripts/e2e/missing.mjs", "setup_provides_env:", " - LANGBOT_PIPELINE_URL", "steps:", " - Open UI.", "checks:", " - UI works.", "evidence_required:", " - ui", "troubleshooting:", " - missing-trouble", ].join("\n"), ); for (const [id, target] of [["cycle-a", "cycle-b"], ["cycle-b", "cycle-a"]]) { writeFileSync( join(testingDir, "cases", `${id}.yaml`), [ `id: ${id}`, `title: ${id}`, "mode: probe", "area: qa", "type: smoke", "priority: p2", "risk: low", "ci_eligible: true", "tags:", " - smoke", "skills:", " - langbot-testing", "setup_automation:", ` - \"case:${target}\"`, "steps:", " - Run probe.", "checks:", " - Probe works.", "evidence_required:", " - filesystem", ].join("\n"), ); } writeFileSync( join(testingDir, "suites", "bad-suite.yaml"), [ "id: bad-suite", "title: Bad Suite", "description: Bad suite for strict validation.", "type: release_gate", "priority: p1", "tags:", " - gate", "cases:", " - missing-case", ].join("\n"), ); writeFileSync( join(testingDir, "fixtures", "fixtures.json"), JSON.stringify([{ id: "bad-fixture", title: "Bad Fixture", path: "fixtures/missing.txt", related_cases: ["missing-case"] }]), ); const result = captureAll(() => commandValidate(tmp)); assert.equal(result.code, 1); assert.match(result.error, /priority/); assert.match(result.error, /missing-trouble/); assert.match(result.error, /missing-case/); assert.match(result.error, /bad-fixture/); assert.match(result.error, /automation script does not exist/); assert.match(result.error, /setup_provides_env/); assert.match(result.error, /setup_automation case cycle detected/); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("test report JSON scans logs and redacts secrets", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-report-")); try { const logPath = join(tmp, "backend.log"); writeFileSync( logPath, [ "INFO request started", "Action invoke_llm_stream call timed out", "Traceback (most recent call last):", "API_KEY=sk-test-secret", ].join("\n"), ); const result = capture(() => commandTestReport(ctx(["test", "report", "pipeline-debug-chat", "--backend-log", logPath, "--json"]))); assert.equal(result.code, 0); assert.doesNotMatch(result.output, /sk-test-secret/); const report = JSON.parse(result.output); assert.equal(report.log_guard.status, "fail"); assert.ok(report.log_guard.findings.some((finding: { kind: string }) => ( finding.kind === "case_failure_pattern" ))); assert.ok(report.log_guard.findings.some((finding: { troubleshooting_id?: string }) => ( finding.troubleshooting_id === "plugin-runtime-timeout" ))); assert.ok(report.log_guard.findings.some((finding: { kind: string }) => finding.kind === "python_traceback")); const secretFinding = report.log_guard.findings.find((finding: { kind: string }) => finding.kind === "secret_leak"); assert.ok(secretFinding); assert.match(secretFinding.excerpt, /\[redacted\]/); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("test report does not treat invalid api key wording as a secret leak", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-report-api-key-wording-")); try { const logPath = join(tmp, "backend.log"); writeFileSync( logPath, "RequesterError: 模型请求失败: 无效的 api-key: Error code: 401 - invalid api key\n", ); const result = capture(() => commandTestReport(ctx(["test", "report", "mcp-stdio-tool-call", "--backend-log", logPath, "--json"]))); assert.equal(result.code, 0); assert.match(result.output, /api-key: Error code/); const report = JSON.parse(result.output); assert.ok(!report.log_guard.findings.some((finding: { kind: string }) => finding.kind === "secret_leak")); assert.ok(report.log_guard.findings.some((finding: { troubleshooting_id?: string }) => ( finding.troubleshooting_id === "local-agent-model-route-unavailable" ))); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("test report records declared success signals from logs", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-report-success-")); try { const logPath = join(tmp, "backend.log"); writeFileSync( logPath, [ "[05-21 10:31:00.000] websocket.py (1) - [INFO] : Processing request from person_websocket", "[05-21 10:31:01.000] runner.py (2) - [INFO] : Conversation(0) Streaming completed", ].join("\n"), ); const result = capture(() => commandTestReport(ctx([ "test", "report", "pipeline-debug-chat", "--backend-log", logPath, "--json", ]))); assert.equal(result.code, 0); const report = JSON.parse(result.output); assert.equal(report.log_guard.status, "pass"); assert.equal(report.log_guard.success_signals.length, 2); assert.ok(report.log_guard.success_signals.some((signal: { pattern: string }) => ( signal.pattern === "Streaming completed" ))); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("test report warns when declared success signals are missing", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-report-missing-success-")); try { const logPath = join(tmp, "backend.log"); writeFileSync(logPath, "INFO request started\nINFO request ended\n"); const result = capture(() => commandTestReport(ctx([ "test", "report", "pipeline-debug-chat", "--backend-log", logPath, "--json", ]))); assert.equal(result.code, 0); const report = JSON.parse(result.output); assert.equal(report.log_guard.status, "warning"); assert.ok(report.log_guard.findings.some((finding: { kind: string }) => ( finding.kind === "missing_success_signal" ))); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("test report can limit log guard to tail lines", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-report-tail-")); try { const logPath = join(tmp, "backend.log"); writeFileSync( logPath, [ "ERROR old failure outside scan window", "INFO middle", "Action invoke_llm_stream call timed out", "API_KEY=sk-tail-secret", ].join("\n"), ); const result = capture(() => commandTestReport(ctx([ "test", "report", "pipeline-debug-chat", "--backend-log", logPath, "--tail-lines", "2", "--json", ]))); assert.equal(result.code, 0); const report = JSON.parse(result.output); assert.equal(report.log_guard.scan.mode, "tail-lines"); assert.equal(report.log_guard.scan.tail_lines, 2); assert.equal(report.log_guard.sources[0].line_count, 2); assert.equal(report.log_guard.sources[0].start_line, 3); assert.ok(report.log_guard.findings.some((finding: { troubleshooting_id?: string }) => ( finding.troubleshooting_id === "plugin-runtime-timeout" ))); assert.ok(!report.log_guard.findings.some((finding: { kind: string; excerpt?: string }) => ( finding.kind === "error_log" && finding.excerpt?.includes("old failure") ))); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("test report can limit log guard with since timestamp", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-report-since-")); try { const logPath = join(tmp, "backend.log"); writeFileSync( logPath, [ "[05-21 09:59:00.000] old.py (1) - [ERROR] : old failure outside scan window", "[05-21 10:31:00.000] runner.py (2) - [ERROR] : Action invoke_llm_stream call timed out", "Traceback continuation should stay with the matching timestamp block", "[05-21 10:32:00.000] secrets.py (3) - [INFO] : API_KEY=sk-since-secret", ].join("\n"), ); const result = capture(() => commandTestReport(ctx([ "test", "report", "pipeline-debug-chat", "--backend-log", logPath, "--since", "2026-05-21T10:30:00+08:00", "--json", ]))); assert.equal(result.code, 0); const report = JSON.parse(result.output); assert.equal(report.log_guard.scan.mode, "since"); assert.equal(report.log_guard.sources[0].line_count, 3); assert.equal(report.log_guard.sources[0].start_line, 2); assert.equal(report.log_guard.sources[0].timestamped_line_count, 3); assert.ok(report.log_guard.findings.some((finding: { line?: number; troubleshooting_id?: string }) => ( finding.line === 2 && finding.troubleshooting_id === "plugin-runtime-timeout" ))); assert.ok(!report.log_guard.findings.some((finding: { excerpt?: string }) => finding.excerpt?.includes("old failure"))); assert.doesNotMatch(result.output, /sk-since-secret/); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("test report can limit log guard with since and until timestamps", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-report-window-")); try { const logPath = join(tmp, "backend.log"); writeFileSync( logPath, [ "[05-21 10:29:59.000] old.py (1) - [ERROR] : old failure outside scan window", "[05-21 10:31:00.000] runner.py (2) - [INFO] : Processing request from person_websocket", "[05-21 10:31:01.000] runner.py (3) - [INFO] : Conversation(0) Streaming completed", "[05-21 10:32:01.000] later.py (4) - [ERROR] : later failure outside scan window", ].join("\n"), ); const result = capture(() => commandTestReport(ctx([ "test", "report", "pipeline-debug-chat", "--backend-log", logPath, "--since", "2026-05-21T10:30:00+08:00", "--until", "2026-05-21T10:32:00+08:00", "--json", ]))); assert.equal(result.code, 0); const report = JSON.parse(result.output); assert.equal(report.log_guard.scan.mode, "since+until"); assert.equal(report.log_guard.sources[0].line_count, 2); assert.equal(report.log_guard.sources[0].start_line, 2); assert.equal(report.log_guard.sources[0].end_line, 3); assert.equal(report.log_guard.status, "pass"); assert.ok(!report.log_guard.findings.some((finding: { excerpt?: string }) => finding.excerpt?.includes("old failure"))); assert.ok(!report.log_guard.findings.some((finding: { excerpt?: string }) => finding.excerpt?.includes("later failure"))); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("test report classifies model route failures as env_issue", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-report-env-issue-")); try { const logPath = join(tmp, "backend.log"); writeFileSync( logPath, "[05-21 10:31:00.000] runner.py (2) - [ERROR] : runner.llm_error model_not_found no available channel for model gpt-test\n", ); const result = capture(() => commandTestReport(ctx([ "test", "report", "local-agent-plugin-tool-call-debug-chat", "--backend-log", logPath, "--json", ]))); assert.equal(result.code, 0); const report = JSON.parse(result.output); assert.equal(report.log_guard.status, "env_issue"); assert.ok(report.log_guard.findings.some((finding: { severity?: string; troubleshooting_id?: string }) => ( finding.severity === "env_issue" && finding.troubleshooting_id === "local-agent-model-route-unavailable" ))); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("test report infers scan window from automation result evidence", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-report-evidence-window-")); try { const evidenceDir = join(tmp, "evidence", "run-123"); mkdirSync(evidenceDir, { recursive: true }); const consoleLog = join(evidenceDir, "console.log"); writeFileSync( consoleLog, [ "[05-21 10:29:59.000] old.js (1) - [ERROR] : old failure outside scan window", "[05-21 10:31:00.000] runner.js (2) - [INFO] : Processing request from person_websocket", "[05-21 10:31:01.000] runner.js (3) - [INFO] : Conversation(0) Streaming completed", "[05-21 10:32:01.000] later.js (4) - [ERROR] : later failure outside scan window", ].join("\n"), ); writeFileSync( join(evidenceDir, "automation-result.json"), JSON.stringify({ source: "automation", status: "pass", reason: "UI sentinel appeared.", started_at_local: "2026-05-21T10:30:00.000+08:00", finished_at_local: "2026-05-21T10:32:00.000+08:00", }), ); const result = capture(() => commandTestReport(ctx([ "test", "report", "pipeline-debug-chat", "--console-log", consoleLog, "--no-auto-log", "--json", ]))); assert.equal(result.code, 0); const report = JSON.parse(result.output); assert.equal(report.log_guard.scan.mode, "since+until"); assert.equal(report.log_guard.scan.since, "2026-05-21T10:30:00.000+08:00"); assert.equal(report.log_guard.scan.until, "2026-05-21T10:32:00.000+08:00"); assert.equal(report.log_guard.sources[0].line_count, 2); assert.equal(report.log_guard.status, "pass"); assert.equal(report.automation_result.status, "loaded"); assert.equal(report.automation_result.result, "pass"); assert.equal(report.automation_result.reason, "UI sentinel appeared."); assert.ok(!report.log_guard.findings.some((finding: { excerpt?: string }) => finding.excerpt?.includes("old failure"))); assert.ok(!report.log_guard.findings.some((finding: { excerpt?: string }) => finding.excerpt?.includes("later failure"))); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("test report does not treat final result as automation evidence", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-report-final-result-")); try { const evidenceDir = join(tmp, "evidence", "run-final"); mkdirSync(evidenceDir, { recursive: true }); const consoleLog = join(evidenceDir, "console.log"); writeFileSync(consoleLog, "[05-21 10:31:00.000] ui.js (1) - [INFO] : opened\n"); writeFileSync( join(evidenceDir, "result.json"), JSON.stringify({ source: "final", status: "pass", reason: "Final manual decision.", started_at_local: "2026-05-21T10:30:00.000+08:00", finished_at_local: "2026-05-21T10:32:00.000+08:00", evidence_collected: ["ui", "screenshot", "console"], }), ); const result = capture(() => commandTestReport(ctx([ "test", "report", "webui-login-state", "--console-log", consoleLog, "--no-auto-log", "--json", ]))); assert.equal(result.code, 0); const report = JSON.parse(result.output); assert.equal(report.automation_result.status, "not_provided"); assert.match(report.automation_result.reason, /only final result\.json is present/); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("test report still scans untimestamped explicit console evidence within an inferred run window", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-report-untimestamped-console-")); try { const evidenceDir = join(tmp, "evidence", "run-untimestamped"); mkdirSync(evidenceDir, { recursive: true }); const consoleLog = join(evidenceDir, "console.log"); writeFileSync(consoleLog, "[error] Uncaught TypeError: Cannot read properties of undefined\n"); writeFileSync( join(evidenceDir, "result.json"), JSON.stringify({ status: "pass", reason: "UI sentinel appeared.", started_at_local: "2026-05-21T10:30:00.000+08:00", finished_at_local: "2026-05-21T10:32:00.000+08:00", }), ); const result = capture(() => commandTestReport(ctx([ "test", "report", "webui-login-state", "--console-log", consoleLog, "--no-auto-log", "--json", ]))); assert.equal(result.code, 0); const report = JSON.parse(result.output); assert.equal(report.log_guard.scan.mode, "since+until"); assert.equal(report.log_guard.sources[0].timestamped_line_count, 0); assert.ok(report.log_guard.sources[0].line_count >= 1); assert.equal(report.log_guard.status, "fail"); assert.ok(report.log_guard.findings.some((finding: { kind: string }) => ( finding.kind === "frontend_uncaught_error" ))); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("test report can write markdown to an output path", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-report-output-")); try { const output = join(tmp, "reports", "pipeline-debug-chat.md"); const result = capture(() => commandTestReport(ctx(["test", "report", "pipeline-debug-chat", "--output", output]))); assert.equal(result.code, 0); assert.match(result.output, /pipeline-debug-chat\.md$/); assert.match(readFileSync(output, "utf8"), /^# Test Report: pipeline-debug-chat/m); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("log scan reuses case-aware log guard patterns", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-log-scan-")); try { const logPath = join(tmp, "backend.log"); writeFileSync( logPath, [ "[05-21 10:31:00.000] process.py (1) - [INFO] : Processing request from person_websocket", "[05-21 10:31:01.000] chat.py (2) - [INFO] : Conversation(0) Streaming completed", "[05-21 10:31:02.000] runner.py (3) - [ERROR] : Action invoke_llm_stream call timed out", ].join("\n"), ); const result = capture(() => commandLogScan(ctx([ "log", "scan", "--backend-log", logPath, "--case", "pipeline-debug-chat", "--json", ]))); assert.equal(result.code, 0); const report = JSON.parse(result.output); assert.equal(report.status, "fail"); assert.ok(report.success_signals.some((signal: { pattern: string }) => signal.pattern === "Streaming completed")); assert.ok(report.findings.some((finding: { kind: string }) => finding.kind === "case_failure_pattern")); const strict = capture(() => commandLogScan(ctx([ "log", "scan", "--backend-log", logPath, "--case", "pipeline-debug-chat", "--strict", "--json", ]))); assert.equal(strict.code, 1); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("log guard start and stop bound a QA log window", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-log-guard-")); try { const logPath = join(tmp, "backend.log"); const outputDir = join(tmp, "guards"); writeFileSync(logPath, "INFO before guard\n"); const start = capture(() => commandLogGuard(ctx([ "log", "guard", "start", "--run-id", "qa-run", "--output-dir", outputDir, "--backend-log", logPath, "--case", "pipeline-debug-chat", "--json", ]))); assert.equal(start.code, 0); const session = JSON.parse(start.output); assert.equal(session.run_id, "qa-run"); assert.ok(existsSync(join(outputDir, "qa-run.json"))); appendFileSync(logPath, "Traceback (most recent call last):\n"); const stop = capture(() => commandLogGuard(ctx([ "log", "guard", "stop", "--run-id", "qa-run", "--output-dir", outputDir, "--json", ]))); assert.equal(stop.code, 1); const report = JSON.parse(stop.output); assert.equal(report.session.run_id, "qa-run"); assert.equal(report.result.status, "fail"); assert.ok(report.result.findings.some((finding: { kind: string }) => finding.kind === "python_traceback")); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("log watch observes appended LangBot backend lines", async () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-log-watch-")); try { const logPath = join(tmp, "backend.log"); writeFileSync(logPath, "INFO existing line\n"); const watching = captureAsync(() => commandLogWatch(ctx([ "log", "watch", "--backend-log", logPath, "--duration-ms", "220", "--interval-ms", "20", "--strict", "--json", ]))); setTimeout(() => { appendFileSync(logPath, "Traceback (most recent call last):\n"); }, 50); const result = await watching; assert.equal(result.code, 1); const summary = JSON.parse(result.output); assert.equal(summary.mode, "watch"); assert.equal(summary.status, "fail"); assert.ok(summary.bytes_read > 0); assert.ok(summary.findings.some((finding: { kind: string }) => finding.kind === "python_traceback")); } finally { rmSync(tmp, { recursive: true, force: true }); } }); test("trouble search finds structured troubleshooting entries", () => { const result = capture(() => commandTroubleSearch(ctx(["trouble", "search", "proxy"]))); assert.equal(result.code, 0); assert.match(result.output, /proxy-env-mismatch/); }); test("env local overrides shared env defaults", () => { const tmp = mkdtempSync(join(tmpdir(), "lbs-env-")); try { mkdirSync(join(tmp, "skills")); writeFileSync(join(tmp, "skills", ".env"), "LANGBOT_REPO=/shared\nLANGBOT_BACKEND_URL=http://127.0.0.1:5300\n"); writeFileSync(join(tmp, "skills", ".env.local"), "LANGBOT_REPO=/local\n"); assert.deepEqual(loadEnv(tmp), { LANGBOT_REPO: "/local", LANGBOT_BACKEND_URL: "http://127.0.0.1:5300", }); } finally { rmSync(tmp, { recursive: true, force: true }); } });