Require real behavior proof for external PRs (#77622)

* ci: require real behavior proof for external PRs

* fix: tighten real behavior proof heuristics

* fix: reject test-only real behavior proof labels

---------

Co-authored-by: Peter Steinberger <steipete@gmail.com>
This commit is contained in:
pashpashpash
2026-05-04 21:45:30 -07:00
committed by GitHub
parent d02fbc6116
commit 70f34bf177
10 changed files with 671 additions and 11 deletions

View File

@@ -37,6 +37,28 @@ function pr(title: string, body = blankTemplateBody) {
};
}
function realBehaviorProofBody(evidence: string, overrides: Record<string, string> = {}) {
const fields = {
behavior: "Gateway status now reports the Discord channel as ready.",
environment: "macOS 15.4, Node 24, local OpenClaw gateway, redacted Discord token.",
steps: "pnpm openclaw gateway restart and pnpm openclaw gateway status",
evidence,
observedResult: "The gateway stayed connected and Discord reported ready.",
notTested: "No known gaps.",
...overrides,
};
return [
"## Real behavior proof",
"",
`- Behavior or issue addressed: ${fields.behavior}`,
`- Real environment tested: ${fields.environment}`,
`- Exact steps or command run after this patch: ${fields.steps}`,
`- Evidence after fix: ${fields.evidence}`,
`- Observed result after fix: ${fields.observedResult}`,
`- What was not tested: ${fields.notTested}`,
].join("\n");
}
function file(filename: string, status = "modified") {
return {
filename,
@@ -236,6 +258,44 @@ describe("barnacle-auto-response", () => {
);
});
it("labels external PRs that are missing real behavior proof", () => {
const labels = classifyPullRequestCandidateLabels(pr("Fix gateway startup"), [
file("src/gateway/server.ts"),
]);
expect(labels).toContain(candidateLabels.needsRealBehaviorProof);
expect(labels).not.toContain(candidateLabels.mockOnlyProof);
});
it("labels external PRs whose proof is only tests or mocks", () => {
const labels = classifyPullRequestCandidateLabels(
pr(
"Fix gateway startup",
realBehaviorProofBody("pnpm test passed with Vitest mocks.", {
steps: "pnpm test",
observedResult: "CI passes.",
}),
),
[file("src/gateway/server.ts")],
);
expect(labels).toContain(candidateLabels.mockOnlyProof);
expect(labels).not.toContain(candidateLabels.needsRealBehaviorProof);
});
it("does not label external PRs that include real behavior proof", () => {
const labels = classifyPullRequestCandidateLabels(
pr(
"Fix gateway startup",
realBehaviorProofBody("![after](https://github.com/user-attachments/assets/gateway-ready)"),
),
[file("src/gateway/server.ts")],
);
expect(labels).not.toContain(candidateLabels.needsRealBehaviorProof);
expect(labels).not.toContain(candidateLabels.mockOnlyProof);
});
it("uses linked issues as context and suppresses low-signal docs labels", () => {
const labels = classifyPullRequestCandidateLabels(
pr("Update docs", `${blankTemplateBody}\n\nRelated #12345`),
@@ -577,6 +637,43 @@ describe("barnacle-auto-response", () => {
expect(calls.update).toEqual([]);
});
it("adds proof labels to external PRs without auto-closing by default", async () => {
const { calls, github } = barnacleGithub([file("src/gateway/server.ts")]);
await runBarnacleAutoResponse({
github,
context: barnacleContext({}),
core: {
info: () => undefined,
},
});
expect(calls.addLabels).toContainEqual(
expect.objectContaining({
labels: expect.arrayContaining([candidateLabels.needsRealBehaviorProof]),
}),
);
expect(calls.createComment).toEqual([]);
expect(calls.update).toEqual([]);
});
it("removes stale proof labels when override is present", async () => {
const { calls, github } = barnacleGithub([file("src/gateway/server.ts")]);
await runBarnacleAutoResponse({
github,
context: barnacleContext({}, [candidateLabels.needsRealBehaviorProof, "proof: override"]),
core: {
info: () => undefined,
},
});
expect(calls.removeLabel).toContainEqual(
expect.objectContaining({ name: candidateLabels.needsRealBehaviorProof }),
);
expect(calls.update).toEqual([]);
});
it("actions manually applied candidate labels", async () => {
const { calls, github } = barnacleGithub([file("extensions/example/openclaw.plugin.json")]);
@@ -637,7 +734,7 @@ describe("barnacle-auto-response", () => {
expect(calls.removeLabel).toContainEqual(expect.objectContaining({ name: "trigger-response" }));
expect(calls.createComment).toContainEqual(
expect.objectContaining({
body: expect.stringContaining("only changes tests"),
body: expect.stringContaining("does not include real behavior proof"),
}),
);
expect(calls.update).toContainEqual(expect.objectContaining({ state: "closed" }));