Files
openclaw/src/agents/bash-tools.exec-host-node.test.ts
Jesse Merhi c9707ab635 fix(exec): rebuild command authorization on the Tree-sitter command planner
Replace the exec approval parser/planner path with Tree-sitter-backed authorization planning, carrying planner decisions through node and gateway execution.

This keeps unpersistable shell shapes one-shot, adds typed `unavailableDecisions` for approval prompts, and refreshes coverage for allowlist matching, command rendering, durable allow-always persistence, and host approval paths.

Verification:
- GitHub PR checks for ce2381192d: CLEAN, 142 success, 32 skipped, 0 failed, 0 pending.
- /Users/jmerhi/.nvm/versions/node/v24.12.0/bin/node scripts/plugin-sdk-surface-report.mjs --check
- /Users/jmerhi/.nvm/versions/node/v24.12.0/bin/node scripts/run-vitest.mjs test/scripts/plugin-sdk-surface-report.test.ts --reporter=verbose
- Focused exec approval suite: 13 files, 467 tests.
2026-06-18 10:12:48 +10:00

3178 lines
107 KiB
TypeScript

/**
* Node-host exec orchestration tests.
* Covers node target resolution, remote prepare/invoke payloads, approvals,
* auto-review, and follow-up execution paths.
*/
import crypto from "node:crypto";
import { beforeAll, beforeEach, describe, expect, it, vi } from "vitest";
import type { ExecAllowlistEntry } from "../infra/exec-approvals.types.js";
import { MAX_SAFE_TIMEOUT_DELAY_MS } from "../utils/timer-delay.js";
type StrictInlineEvalBoundary =
typeof import("./bash-tools.exec-host-shared.js").enforceStrictInlineEvalApprovalBoundary;
type ExecAutoReviewer = typeof import("../infra/exec-auto-review.js").defaultExecAutoReviewer;
type ExecAsk = import("../infra/exec-approvals.js").ExecAsk;
type ExecSecurity = import("../infra/exec-approvals.js").ExecSecurity;
type MockAllowAlwaysPersistenceInput = Parameters<
typeof import("../infra/exec-approvals.js").resolveAllowAlwaysPersistenceDecision
>[0];
type MockAllowAlwaysPersistenceDecision =
import("../infra/exec-approvals.js").AllowAlwaysPersistenceDecision;
type MockExecApprovalDecision = import("../infra/exec-approvals.js").ExecApprovalDecision;
type MockExecApprovalUnavailableDecision =
import("../infra/exec-approvals.js").ExecApprovalUnavailableDecision;
type MockAllowlistSegment = {
raw?: string;
resolution: null;
argv: string[];
};
type MockAllowlistResult = {
allowlistMatches: unknown[];
analysisOk: boolean;
allowlistSatisfied: boolean;
segments: MockAllowlistSegment[];
segmentAllowlistEntries: unknown[];
segmentSatisfiedBy?: unknown[];
};
type MockExecAllowlistEntry = {
pattern: string;
argPattern?: string;
source?: "allow-always";
commandText?: string;
};
type MockExecApprovalsResolved = {
allowlist: MockExecAllowlistEntry[];
file: { version: 1; agents: Record<string, unknown> };
agent: {
security: ExecSecurity;
ask: ExecAsk;
askFallback?: "deny";
autoAllowSkills?: false;
};
};
type ShellAllowlistMockParams = {
command?: string;
allowlist?: unknown[];
env?: NodeJS.ProcessEnv;
};
type RequiresExecApprovalMockParams = {
ask?: string;
security?: string;
analysisOk?: boolean;
allowlistSatisfied?: boolean;
durableApprovalSatisfied?: boolean;
};
const INLINE_EVAL_HIT = {
executable: "python3",
normalizedExecutable: "python3",
flag: "-c",
argv: ["python3", "-c", "print(1)"],
};
const preparedPlan = vi.hoisted(() => ({
argv: ["bun", "./script.ts"],
cwd: "/tmp/work",
commandText: "bun ./script.ts",
commandPreview: "bun ./script.ts",
agentId: "prepared-agent",
sessionKey: "prepared-session",
mutableFileOperand: {
argvIndex: 1,
path: "/tmp/work/script.ts",
sha256: "abc123",
},
}));
const nodeCommandMarker = vi.hoisted(() => "=node-command:test");
const exactCommandMarker = (commandText: string): string =>
`=command:${crypto.createHash("sha256").update(commandText).digest("hex").slice(0, 16)}`;
const callGatewayToolMock = vi.hoisted(() => vi.fn());
const listNodesMock = vi.hoisted(() => vi.fn());
const parsePreparedSystemRunPayloadMock = vi.hoisted(() => vi.fn());
const commandRequiresSecurityAuditSuppressionApprovalMock = vi.hoisted(() => vi.fn(() => false));
const evaluateShellAllowlistMock = vi.hoisted(() =>
vi.fn(
(_raw?: ShellAllowlistMockParams): MockAllowlistResult => ({
allowlistMatches: [],
analysisOk: true,
allowlistSatisfied: false,
segments: [{ resolution: null, argv: ["bun", "./script.ts"] }],
segmentAllowlistEntries: [],
segmentSatisfiedBy: [],
}),
),
);
const hasNodeCommandAllowAlwaysMarkerMock = vi.hoisted(() =>
vi.fn((raw: unknown): boolean =>
((raw as { allowlist?: Array<{ pattern?: string }> }).allowlist ?? []).some(
(entry) => entry.pattern === "=node-command:test",
),
),
);
const resolveAllowAlwaysPatternCoverageMock = vi.hoisted(() =>
vi.fn((_raw: unknown): unknown => ({
complete: true,
patterns: [{ pattern: "/trusted/bin/tool" }],
})),
);
const resolveExecApprovalsFromFileMock = vi.hoisted(() =>
vi.fn(
(): MockExecApprovalsResolved => ({
allowlist: [],
file: { version: 1, agents: {} },
agent: {
security: "full",
ask: "off",
askFallback: "deny",
autoAllowSkills: false,
},
}),
),
);
const requiresExecApprovalMock = vi.hoisted(() =>
vi.fn((_raw?: RequiresExecApprovalMockParams) => true),
);
const hasDurableExecApprovalMock = vi.hoisted(() => vi.fn(() => false));
const resolveAllowAlwaysPersistenceDecisionMock = vi.hoisted(() =>
vi.fn(
(_raw: MockAllowAlwaysPersistenceInput): MockAllowAlwaysPersistenceDecision => ({
kind: "patterns",
patterns: [{ pattern: "/trusted/bin/tool" }],
}),
),
);
const resolveExecApprovalAllowedDecisionsMock = vi.hoisted(() =>
vi.fn(
(params?: {
ask?: string | null;
allowAlwaysPersistence?: { kind: string } | null;
}): readonly MockExecApprovalDecision[] =>
params?.ask === "always" || params?.allowAlwaysPersistence?.kind === "one-shot"
? ["allow-once", "deny"]
: ["allow-once", "allow-always", "deny"],
),
);
const resolveExecApprovalUnavailableDecisionsMock = vi.hoisted(() =>
vi.fn(
(params?: {
ask?: string | null;
allowAlwaysPersistence?: { kind: string } | null;
}): readonly MockExecApprovalUnavailableDecision[] =>
params?.ask === "always" || params?.allowAlwaysPersistence?.kind === "one-shot"
? ["allow-always"]
: [],
),
);
const resolveExecHostApprovalContextMock = vi.hoisted(() =>
vi.fn(() => ({
approvals: { allowlist: [] as ExecAllowlistEntry[], file: { version: 1, agents: {} } },
hostSecurity: "full",
hostAsk: "off",
askFallback: "deny",
})),
);
const createAndRegisterDefaultExecApprovalRequestMock = vi.hoisted(() => vi.fn());
const resolveApprovalDecisionOrUndefinedMock = vi.hoisted(() =>
vi.fn(async (): Promise<string | null | undefined> => "allow-once"),
);
const createExecApprovalDecisionStateMock = vi.hoisted(() =>
vi.fn(
(): {
baseDecision: { timedOut: boolean };
approvedByAsk: boolean;
deniedReason: string | null;
} => ({
baseDecision: { timedOut: false },
approvedByAsk: false,
deniedReason: null,
}),
),
);
const buildExecApprovalPendingToolResultMock = vi.hoisted(() => vi.fn());
const sendExecApprovalFollowupResultMock = vi.hoisted(() => vi.fn(async () => undefined));
const enforceStrictInlineEvalApprovalBoundaryMock = vi.hoisted(() =>
vi.fn<StrictInlineEvalBoundary>((value) => ({
approvedByAsk: value.approvedByAsk,
deniedReason: value.deniedReason,
})),
);
const registerExecApprovalRequestForHostOrThrowMock = vi.hoisted(() =>
vi.fn(async () => undefined),
);
const detectInterpreterInlineEvalArgvMock = vi.hoisted(() =>
vi.fn(
(): {
executable: string;
normalizedExecutable: string;
flag: string;
argv: string[];
} | null => null,
),
);
vi.mock("../infra/exec-approvals.js", () => ({
evaluateShellAllowlist: evaluateShellAllowlistMock,
evaluateShellAllowlistWithAuthorization: evaluateShellAllowlistMock,
commandRequiresSecurityAuditSuppressionApproval:
commandRequiresSecurityAuditSuppressionApprovalMock,
hasDurableExecApproval: hasDurableExecApprovalMock,
hasNodeCommandAllowAlwaysMarker: hasNodeCommandAllowAlwaysMarkerMock,
requiresExecApproval: requiresExecApprovalMock,
resolveAllowAlwaysPersistenceDecision: resolveAllowAlwaysPersistenceDecisionMock,
resolveAllowAlwaysPatternCoverage: resolveAllowAlwaysPatternCoverageMock,
resolveExecApprovalAllowedDecisions: resolveExecApprovalAllowedDecisionsMock,
resolveExecApprovalUnavailableDecisions: resolveExecApprovalUnavailableDecisionsMock,
resolveExecApprovalsFromFile: resolveExecApprovalsFromFileMock,
maxAsk: (a: ExecAsk, b: ExecAsk): ExecAsk => {
const order: Record<ExecAsk, number> = { off: 0, "on-miss": 1, always: 2 };
return order[a] >= order[b] ? a : b;
},
}));
vi.mock("../infra/command-analysis/inline-eval.js", () => ({
describeInterpreterInlineEval: vi.fn(() => "inline-eval"),
detectInterpreterInlineEvalArgv: detectInterpreterInlineEvalArgvMock,
}));
vi.mock("../infra/node-shell.js", () => ({
buildNodeShellCommand: vi.fn(() => ["/bin/sh", "-lc", "bun ./script.ts"]),
}));
vi.mock("../infra/system-run-approval-context.js", () => ({
parsePreparedSystemRunPayload: parsePreparedSystemRunPayloadMock,
}));
vi.mock("./bash-tools.exec-approval-request.js", () => ({
buildExecApprovalRequesterContext: vi.fn(() => ({})),
buildExecApprovalTurnSourceContext: vi.fn(() => ({})),
registerExecApprovalRequestForHostOrThrow: registerExecApprovalRequestForHostOrThrowMock,
}));
vi.mock("./bash-tools.exec-host-shared.js", () => ({
resolveExecHostApprovalContext: resolveExecHostApprovalContextMock,
buildDefaultExecApprovalRequestArgs: vi.fn(() => ({})),
createAndRegisterDefaultExecApprovalRequest: createAndRegisterDefaultExecApprovalRequestMock,
shouldResolveExecApprovalUnavailableInline: vi.fn(() => false),
buildExecApprovalFollowupTarget: vi.fn((value) => value),
resolveApprovalDecisionOrUndefined: resolveApprovalDecisionOrUndefinedMock,
createExecApprovalDecisionState: createExecApprovalDecisionStateMock,
enforceStrictInlineEvalApprovalBoundary: enforceStrictInlineEvalApprovalBoundaryMock,
sendExecApprovalFollowupResult: sendExecApprovalFollowupResultMock,
buildExecApprovalPendingToolResult: buildExecApprovalPendingToolResultMock,
buildHeadlessExecApprovalDeniedMessage: vi.fn(() => "denied"),
}));
vi.mock("./bash-tools.exec-runtime.js", () => ({
DEFAULT_NOTIFY_TAIL_CHARS: 1000,
createApprovalSlug: vi.fn(() => "slug"),
normalizeNotifyOutput: vi.fn((value: string) => value),
}));
vi.mock("./tools/gateway.js", () => ({
callGatewayTool: callGatewayToolMock,
}));
const resolveNodeIdFromListMock = vi.hoisted(() =>
vi.fn((nodes: Array<{ nodeId: string; displayName?: string }>, query?: string) => {
if (!query) {
if (nodes.length === 1) {
return nodes[0].nodeId;
}
throw new Error("node required");
}
const byId = nodes.find((n) => n.nodeId === query);
if (byId) {
return byId.nodeId;
}
const byName = nodes.find((n) => n.displayName === query);
if (byName) {
return byName.nodeId;
}
if (query.length >= 6) {
const byPrefix = nodes.find((n) => n.nodeId.startsWith(query));
if (byPrefix) {
return byPrefix.nodeId;
}
}
throw new Error(`unknown node: ${query}`);
}),
);
vi.mock("./tools/nodes-utils.js", () => ({
listNodes: listNodesMock,
resolveNodeIdFromList: resolveNodeIdFromListMock,
}));
vi.mock("../logger.js", () => ({
logInfo: vi.fn(),
}));
let executeNodeHostCommand: typeof import("./bash-tools.exec-host-node.js").executeNodeHostCommand;
type MockNodeInvokeParams = {
command?: string;
params?: Record<string, unknown>;
};
type GatewayToolCall = {
method: string;
options: { timeoutMs?: number };
params?: MockNodeInvokeParams;
callOptions?: unknown;
};
function requireGatewayCall(index: number): GatewayToolCall {
const call = callGatewayToolMock.mock.calls[index];
if (!call) {
throw new Error(`expected gateway call at index ${index}`);
}
const [method, options, params, callOptions] = call as [
string,
{ timeoutMs?: number },
MockNodeInvokeParams | undefined,
unknown,
];
return { method, options, params, callOptions };
}
function requireGatewayCommand(command: string): GatewayToolCall {
const call = callGatewayToolMock.mock.calls.find(
([method, , params]) =>
method === "node.invoke" && (params as MockNodeInvokeParams | undefined)?.command === command,
);
if (!call) {
throw new Error(`expected gateway command ${command}`);
}
const [method, options, params, callOptions] = call as [
string,
{ timeoutMs?: number },
MockNodeInvokeParams | undefined,
unknown,
];
return { method, options, params, callOptions };
}
function requireRunParams(call: GatewayToolCall): Record<string, unknown> {
expect(call.method).toBe("node.invoke");
expect(call.params?.command).toBe("system.run");
const params = call.params?.params;
if (!params) {
throw new Error("expected system.run params");
}
return params;
}
function requireRegisteredApprovalRequest(): Record<string, unknown> {
const calls = registerExecApprovalRequestForHostOrThrowMock.mock.calls as unknown as [
Record<string, unknown>,
][];
const firstCall = calls[0];
if (!firstCall) {
throw new Error("expected approval request registration");
}
return firstCall[0];
}
function expectSystemRunInvoke(params: { invokeTimeoutMs: number; runTimeoutMs: number }) {
const call = requireGatewayCommand("system.run");
expect(call.options.timeoutMs).toBe(params.invokeTimeoutMs);
expect(requireRunParams(call).timeoutMs).toBe(params.runTimeoutMs);
}
function mockGatewayInvokesWithNodeApprovals(file: Record<string, unknown>) {
callGatewayToolMock.mockImplementation(
async (method: string, _options: unknown, params: MockNodeInvokeParams | undefined) => {
if (method === "exec.approvals.node.get") {
return { file };
}
if (method !== "node.invoke") {
throw new Error(`unexpected gateway method: ${method}`);
}
if (params?.command === "system.run.prepare") {
return { payload: { plan: preparedPlan } };
}
if (params?.command === "system.run") {
return {
payload: {
success: true,
stdout: "ok",
stderr: "",
exitCode: 0,
timedOut: false,
},
};
}
throw new Error(`unexpected node invoke command: ${String(params?.command)}`);
},
);
}
function usePolicyApprovalRequirementMock() {
requiresExecApprovalMock.mockImplementation((raw: unknown) => {
const params = raw as {
ask: string;
security: string;
analysisOk: boolean;
allowlistSatisfied: boolean;
durableApprovalSatisfied: boolean;
};
return (
params.ask === "always" ||
(params.ask === "on-miss" &&
params.security === "allowlist" &&
(!params.analysisOk || !params.allowlistSatisfied) &&
!params.durableApprovalSatisfied)
);
});
}
function buildAllowlistEvalResult(params?: {
allowlistSatisfied?: boolean;
segmentAllowlistEntry?: { pattern: string } | null;
}) {
return {
allowlistMatches:
params?.allowlistSatisfied && params.segmentAllowlistEntry
? [params.segmentAllowlistEntry]
: [],
analysisOk: true,
allowlistSatisfied: params?.allowlistSatisfied === true,
segments: [{ resolution: null, argv: ["tool", "--version"] }],
segmentAllowlistEntries:
params?.allowlistSatisfied && params.segmentAllowlistEntry
? [params.segmentAllowlistEntry]
: [null],
segmentSatisfiedBy: [params?.allowlistSatisfied ? "allowlist" : null],
};
}
describe("executeNodeHostCommand", () => {
beforeAll(async () => {
({ executeNodeHostCommand } = await import("./bash-tools.exec-host-node.js"));
});
beforeEach(() => {
callGatewayToolMock.mockReset();
callGatewayToolMock.mockImplementation(
async (method: string, _options: unknown, params: MockNodeInvokeParams | undefined) => {
if (method === "exec.approvals.node.get") {
return { file: { version: 1, agents: {} } };
}
if (method === "exec.approval.resolve") {
return { payload: {} };
}
if (method !== "node.invoke") {
throw new Error(`unexpected gateway method: ${method}`);
}
if (params?.command === "system.run.prepare") {
return { payload: { plan: preparedPlan } };
}
if (params?.command === "system.run") {
return {
payload: {
success: true,
stdout: "ok",
stderr: "",
exitCode: 0,
timedOut: false,
},
};
}
throw new Error(`unexpected node invoke command: ${String(params?.command)}`);
},
);
listNodesMock.mockReset();
listNodesMock.mockResolvedValue([
{
nodeId: "node-1",
commands: ["system.run", "system.run.prepare"],
platform: process.platform,
},
]);
parsePreparedSystemRunPayloadMock.mockReset();
parsePreparedSystemRunPayloadMock.mockReturnValue({
plan: preparedPlan,
execPolicy: { security: "full", ask: "off" },
});
commandRequiresSecurityAuditSuppressionApprovalMock.mockReset();
commandRequiresSecurityAuditSuppressionApprovalMock.mockReturnValue(false);
evaluateShellAllowlistMock.mockReset();
evaluateShellAllowlistMock.mockReturnValue({
allowlistMatches: [],
analysisOk: true,
allowlistSatisfied: false,
segments: [{ resolution: null, argv: ["bun", "./script.ts"] }],
segmentAllowlistEntries: [],
});
hasNodeCommandAllowAlwaysMarkerMock.mockClear();
resolveAllowAlwaysPatternCoverageMock.mockReset();
resolveAllowAlwaysPatternCoverageMock.mockReturnValue({
complete: true,
patterns: [{ pattern: "/trusted/bin/tool" }],
});
hasDurableExecApprovalMock.mockReset();
hasDurableExecApprovalMock.mockReturnValue(false);
resolveExecApprovalsFromFileMock.mockReset();
resolveExecApprovalsFromFileMock.mockReturnValue({
allowlist: [],
file: { version: 1, agents: {} },
agent: {
security: "full",
ask: "off",
askFallback: "deny",
autoAllowSkills: false,
},
});
requiresExecApprovalMock.mockReset();
requiresExecApprovalMock.mockReturnValue(true);
hasDurableExecApprovalMock.mockReset();
hasDurableExecApprovalMock.mockReturnValue(false);
resolveAllowAlwaysPersistenceDecisionMock.mockReset();
resolveAllowAlwaysPersistenceDecisionMock.mockReturnValue({
kind: "patterns",
patterns: [{ pattern: "/trusted/bin/tool" }],
});
resolveExecApprovalAllowedDecisionsMock.mockClear();
resolveExecApprovalUnavailableDecisionsMock.mockClear();
resolveExecHostApprovalContextMock.mockReset();
resolveExecHostApprovalContextMock.mockReturnValue({
approvals: { allowlist: [], file: { version: 1, agents: {} } },
hostSecurity: "full",
hostAsk: "off",
askFallback: "deny",
});
createAndRegisterDefaultExecApprovalRequestMock.mockReset();
createAndRegisterDefaultExecApprovalRequestMock.mockImplementation(async (args?: unknown) => {
const register =
args && typeof args === "object" && "register" in args
? (args as { register?: (approvalId: string) => Promise<void> }).register
: undefined;
await register?.("approval-1");
return {
approvalId: "approval-1",
approvalSlug: "slug-1",
warningText: "",
expiresAtMs: Date.now() + 60_000,
preResolvedDecision: null,
initiatingSurface: "origin",
sentApproverDms: false,
unavailableReason: null,
};
});
resolveApprovalDecisionOrUndefinedMock.mockReset();
resolveApprovalDecisionOrUndefinedMock.mockResolvedValue("allow-once");
createExecApprovalDecisionStateMock.mockReset();
createExecApprovalDecisionStateMock.mockReturnValue({
baseDecision: { timedOut: false },
approvedByAsk: false,
deniedReason: null,
});
buildExecApprovalPendingToolResultMock.mockReset();
buildExecApprovalPendingToolResultMock.mockReturnValue({
content: [],
details: { status: "approval-pending" },
});
sendExecApprovalFollowupResultMock.mockReset();
enforceStrictInlineEvalApprovalBoundaryMock.mockReset();
enforceStrictInlineEvalApprovalBoundaryMock.mockImplementation((value) => ({
approvedByAsk: value.approvedByAsk,
deniedReason: value.deniedReason,
}));
detectInterpreterInlineEvalArgvMock.mockReset();
detectInterpreterInlineEvalArgvMock.mockReturnValue(null);
registerExecApprovalRequestForHostOrThrowMock.mockReset();
});
it("forwards prepared systemRunPlan on async node invoke after approval", async () => {
resolveExecHostApprovalContextMock.mockReturnValue({
approvals: { allowlist: [], file: { version: 1, agents: {} } },
hostSecurity: "full",
hostAsk: "always",
askFallback: "deny",
});
const result = await executeNodeHostCommand({
command: "bun ./script.ts",
workdir: "/tmp/work",
env: {},
security: "full",
ask: "off",
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "requested-agent",
sessionKey: "requested-session",
turnSourceChannel: "telegram",
turnSourceTo: "telegram:12345",
turnSourceAccountId: "work",
turnSourceThreadId: "42",
});
expect(result.details?.status).toBe("approval-pending");
expect(requireRegisteredApprovalRequest().systemRunPlan).toEqual(preparedPlan);
await vi.waitFor(() => {
expect(callGatewayToolMock).toHaveBeenCalledTimes(3);
});
const call = requireGatewayCall(2);
expect(call.options.timeoutMs).toBe(35_000);
expect(call.callOptions).toEqual({ scopes: ["operator.write", "operator.approvals"] });
const runParams = requireRunParams(call);
expect(runParams.approved).toBe(true);
expect(runParams.approvalDecision).toBe("allow-once");
expect(runParams.systemRunPlan).toEqual(preparedPlan);
expect(runParams.timeoutMs).toBe(30_000);
expect(runParams.turnSourceChannel).toBe("telegram");
expect(runParams.turnSourceTo).toBe("telegram:12345");
expect(runParams.turnSourceAccountId).toBe("work");
expect(runParams.turnSourceThreadId).toBe("42");
});
it("does not build a human approval prompt for node auto-review allows", async () => {
const autoReviewer = vi.fn<ExecAutoReviewer>(async () => ({
decision: "allow-once",
risk: "low",
rationale: "safe read",
}));
resolveExecHostApprovalContextMock.mockReturnValue({
approvals: { allowlist: [], file: { version: 1, agents: {} } },
hostSecurity: "allowlist",
hostAsk: "on-miss",
askFallback: "deny",
});
requiresExecApprovalMock.mockImplementation(
(params?: { allowlistSatisfied?: boolean; durableApprovalSatisfied?: boolean }) =>
params?.allowlistSatisfied !== true && params?.durableApprovalSatisfied !== true,
);
const result = await executeNodeHostCommand({
command: "bun ./script.ts",
workdir: "/tmp/work",
env: {},
security: "allowlist",
ask: "on-miss",
autoReview: true,
autoReviewer,
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "requested-agent",
sessionKey: "requested-session",
});
expect(result.details?.status).toBe("completed");
expect(autoReviewer).toHaveBeenCalledWith(
expect.objectContaining({
command: "bun ./script.ts",
argv: ["bun", "./script.ts"],
host: "node",
reason: "allowlist-miss",
}),
);
expect(createAndRegisterDefaultExecApprovalRequestMock).not.toHaveBeenCalled();
expect(registerExecApprovalRequestForHostOrThrowMock).toHaveBeenCalledWith(
expect.objectContaining({
host: "node",
requireDeliveryRoute: false,
suppressDelivery: true,
}),
);
expect(callGatewayToolMock).toHaveBeenCalledWith(
"exec.approval.resolve",
{ timeoutMs: 15_000 },
{ id: expect.any(String), decision: "allow-once" },
{ scopes: ["operator.approvals"] },
);
});
it("reviews the prepared node plan before suppressing human approval", async () => {
const divergentPlan = {
argv: ["rm", "-rf", "/tmp/work"],
cwd: "/tmp/work",
commandText: "rm -rf /tmp/work",
commandPreview: "./scripts/check_mail.sh --limit 5",
agentId: "prepared-agent",
sessionKey: "prepared-session",
};
parsePreparedSystemRunPayloadMock.mockReturnValue({
plan: divergentPlan,
execPolicy: { security: "full", ask: "off" },
});
const nodeAllowlist = [{ pattern: "./scripts/check_mail.sh" }];
resolveExecApprovalsFromFileMock.mockReturnValue({
allowlist: nodeAllowlist,
file: { version: 1, agents: {} },
agent: {
security: "full",
ask: "off",
askFallback: "deny",
autoAllowSkills: false,
},
});
evaluateShellAllowlistMock.mockImplementation(
(params?: { command?: string; allowlist?: unknown[] }) => {
const command = params?.command ?? "";
const hasNodeAllowlist = Array.isArray(params?.allowlist) && params.allowlist.length > 0;
const previewMatch = command === "./scripts/check_mail.sh --limit 5";
return {
allowlistMatches: previewMatch && hasNodeAllowlist ? [{}] : [],
analysisOk: true,
allowlistSatisfied: previewMatch && hasNodeAllowlist,
segments: [
previewMatch
? {
resolution: null,
argv: ["./scripts/check_mail.sh", "--limit", "5"],
raw: "./scripts/check_mail.sh --limit 5",
}
: {
resolution: null,
argv: ["rm", "-rf", "/tmp/work"],
raw: "rm -rf /tmp/work",
},
],
segmentAllowlistEntries: previewMatch && hasNodeAllowlist ? [{}] : [],
};
},
);
const autoReviewer = vi.fn<ExecAutoReviewer>(async (input) =>
input.command.includes("rm -rf")
? {
decision: "ask",
risk: "high",
rationale: "destructive prepared plan",
}
: {
decision: "allow-once",
risk: "low",
rationale: "safe requested text",
},
);
resolveExecHostApprovalContextMock.mockReturnValue({
approvals: { allowlist: [], file: { version: 1, agents: {} } },
hostSecurity: "allowlist",
hostAsk: "on-miss",
askFallback: "deny",
});
requiresExecApprovalMock.mockImplementation(
(params?: { allowlistSatisfied?: boolean; durableApprovalSatisfied?: boolean }) =>
params?.allowlistSatisfied !== true && params?.durableApprovalSatisfied !== true,
);
const result = await executeNodeHostCommand({
command: "echo SAFE",
workdir: "/tmp/work",
env: {},
security: "allowlist",
ask: "on-miss",
autoReview: true,
autoReviewer,
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "requested-agent",
sessionKey: "requested-session",
});
expect(result.details?.status).toBe("approval-pending");
expect(autoReviewer).toHaveBeenCalledWith(
expect.objectContaining({
command: "rm -rf /tmp/work",
argv: ["rm", "-rf", "/tmp/work"],
agent: {
id: "prepared-agent",
sessionKey: "prepared-session",
},
}),
);
expect(createAndRegisterDefaultExecApprovalRequestMock).toHaveBeenCalled();
expect(callGatewayToolMock).not.toHaveBeenCalledWith(
"exec.approval.resolve",
expect.anything(),
expect.anything(),
expect.anything(),
);
});
it("honors node allowlist matches on prepared POSIX shell payloads", async () => {
const wrapperPlan = {
argv: ["/bin/sh", "-lc", "./scripts/check_mail.sh --limit 5"],
cwd: "/tmp/work",
commandText: `/bin/sh -lc "./scripts/check_mail.sh --limit 5"`,
commandPreview: "./scripts/check_mail.sh --limit 5",
agentId: "prepared-agent",
sessionKey: "prepared-session",
};
parsePreparedSystemRunPayloadMock.mockReturnValue({
plan: wrapperPlan,
execPolicy: { security: "full", ask: "off" },
});
const nodeAllowlist = [{ pattern: "./scripts/check_mail.sh" }];
resolveExecApprovalsFromFileMock.mockReturnValue({
allowlist: nodeAllowlist,
file: { version: 1, agents: {} },
agent: {
security: "full",
ask: "off",
askFallback: "deny",
autoAllowSkills: false,
},
});
evaluateShellAllowlistMock.mockImplementation(
(params?: { command?: string; allowlist?: unknown[] }) => {
const command = params?.command ?? "";
const hasNodeAllowlist = Array.isArray(params?.allowlist) && params.allowlist.length > 0;
const semanticMatch = command === "./scripts/check_mail.sh --limit 5";
return {
allowlistMatches: semanticMatch && hasNodeAllowlist ? [{}] : [],
analysisOk: true,
allowlistSatisfied: semanticMatch && hasNodeAllowlist,
segments: [
command.startsWith("/bin/sh")
? {
resolution: null,
argv: ["/bin/sh", "-lc", "./scripts/check_mail.sh --limit 5"],
raw: `/bin/sh -lc "./scripts/check_mail.sh --limit 5"`,
}
: {
resolution: null,
argv: ["./scripts/check_mail.sh", "--limit", "5"],
raw: "./scripts/check_mail.sh --limit 5",
},
],
segmentAllowlistEntries: semanticMatch && hasNodeAllowlist ? [{}] : [],
};
},
);
const autoReviewer = vi.fn<ExecAutoReviewer>(async () => ({
decision: "ask",
risk: "medium",
rationale: "should not be needed",
}));
resolveExecHostApprovalContextMock.mockReturnValue({
approvals: { allowlist: [], file: { version: 1, agents: {} } },
hostSecurity: "allowlist",
hostAsk: "on-miss",
askFallback: "deny",
});
requiresExecApprovalMock.mockImplementation(
(params?: { allowlistSatisfied?: boolean; durableApprovalSatisfied?: boolean }) =>
params?.allowlistSatisfied !== true && params?.durableApprovalSatisfied !== true,
);
const result = await executeNodeHostCommand({
command: "./scripts/check_mail.sh --limit 5",
workdir: "/tmp/work",
env: {},
security: "allowlist",
ask: "on-miss",
autoReview: true,
autoReviewer,
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "requested-agent",
sessionKey: "requested-session",
});
expect(result.details?.status).toBe("completed");
expect(autoReviewer).not.toHaveBeenCalled();
expect(createAndRegisterDefaultExecApprovalRequestMock).not.toHaveBeenCalled();
expect(resolveExecApprovalsFromFileMock).toHaveBeenCalledWith(
expect.objectContaining({ agentId: "prepared-agent" }),
);
expectSystemRunInvoke({ invokeTimeoutMs: 35_000, runTimeoutMs: 30_000 });
});
it("does not let transport wrapper allowlist matches approve shell payloads", async () => {
const wrapperPlan = {
argv: ["/bin/sh", "-lc", "./scripts/untrusted.sh"],
cwd: "/tmp/work",
commandText: `/bin/sh -lc "./scripts/untrusted.sh"`,
commandPreview: "./scripts/untrusted.sh",
agentId: "prepared-agent",
sessionKey: "prepared-session",
};
parsePreparedSystemRunPayloadMock.mockReturnValue({
plan: wrapperPlan,
execPolicy: { security: "full", ask: "off" },
});
const nodeAllowlist = [{ pattern: "/bin/sh" }];
resolveExecApprovalsFromFileMock.mockReturnValue({
allowlist: nodeAllowlist,
file: { version: 1, agents: {} },
agent: {
security: "full",
ask: "off",
askFallback: "deny",
autoAllowSkills: false,
},
});
evaluateShellAllowlistMock.mockImplementation(
(params?: { command?: string; allowlist?: unknown[] }) => {
const command = params?.command ?? "";
const hasNodeAllowlist = Array.isArray(params?.allowlist) && params.allowlist.length > 0;
const wrapperMatch = command.startsWith("/bin/sh") && hasNodeAllowlist;
return {
allowlistMatches: wrapperMatch ? [{}] : [],
analysisOk: true,
allowlistSatisfied: wrapperMatch,
segments: [
command.startsWith("/bin/sh")
? {
resolution: null,
argv: ["/bin/sh", "-lc", "./scripts/untrusted.sh"],
raw: `/bin/sh -lc "./scripts/untrusted.sh"`,
}
: {
resolution: null,
argv: ["./scripts/untrusted.sh"],
raw: "./scripts/untrusted.sh",
},
],
segmentAllowlistEntries: wrapperMatch ? [{}] : [],
};
},
);
requiresExecApprovalMock.mockImplementation(
(params?: { allowlistSatisfied?: boolean; durableApprovalSatisfied?: boolean }) =>
params?.allowlistSatisfied !== true && params?.durableApprovalSatisfied !== true,
);
hasDurableExecApprovalMock.mockImplementation(
(params?: { segmentAllowlistEntries?: unknown[] }) =>
Array.isArray(params?.segmentAllowlistEntries) && params.segmentAllowlistEntries.length > 0,
);
const autoReviewer = vi.fn<ExecAutoReviewer>(async () => ({
decision: "ask",
risk: "medium",
rationale: "inner payload is not allowlisted",
}));
resolveExecHostApprovalContextMock.mockReturnValue({
approvals: { allowlist: [], file: { version: 1, agents: {} } },
hostSecurity: "allowlist",
hostAsk: "on-miss",
askFallback: "deny",
});
const result = await executeNodeHostCommand({
command: "./scripts/untrusted.sh",
workdir: "/tmp/work",
env: {},
security: "allowlist",
ask: "on-miss",
autoReview: true,
autoReviewer,
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "requested-agent",
sessionKey: "requested-session",
});
expect(result.details?.status).toBe("approval-pending");
expect(autoReviewer).toHaveBeenCalledWith(
expect.objectContaining({
command: `/bin/sh -lc "./scripts/untrusted.sh"`,
argv: ["./scripts/untrusted.sh"],
}),
);
expect(createAndRegisterDefaultExecApprovalRequestMock).toHaveBeenCalled();
});
it("reuses exact durable approvals for prepared shell wrappers", async () => {
const wrapperPlan = {
argv: ["/bin/sh", "-lc", "cd ."],
cwd: "/tmp/work",
commandText: `/bin/sh -lc "cd ."`,
commandPreview: "cd .",
agentId: "prepared-agent",
sessionKey: "prepared-session",
};
parsePreparedSystemRunPayloadMock.mockReturnValue({
plan: wrapperPlan,
execPolicy: { security: "full", ask: "off" },
});
resolveExecApprovalsFromFileMock.mockReturnValue({
allowlist: [
{
pattern: exactCommandMarker(wrapperPlan.commandText),
source: "allow-always",
commandText: wrapperPlan.commandText,
},
],
file: { version: 1, agents: {} },
agent: {
security: "full",
ask: "off",
askFallback: "deny",
autoAllowSkills: false,
},
});
evaluateShellAllowlistMock.mockImplementation((params?: { command?: string }) => {
const command = params?.command ?? "";
return {
allowlistMatches: [],
analysisOk: true,
allowlistSatisfied: false,
segments: [
command.startsWith("/bin/sh")
? {
resolution: null,
argv: ["/bin/sh", "-lc", "cd ."],
raw: `/bin/sh -lc "cd ."`,
}
: {
resolution: null,
argv: ["cd", "."],
raw: "cd .",
},
],
segmentAllowlistEntries: [],
};
});
hasDurableExecApprovalMock.mockImplementation(
(params?: { commandText?: string | null }) => params?.commandText === wrapperPlan.commandText,
);
requiresExecApprovalMock.mockImplementation(
(params?: { allowlistSatisfied?: boolean; durableApprovalSatisfied?: boolean }) =>
params?.allowlistSatisfied !== true && params?.durableApprovalSatisfied !== true,
);
resolveExecHostApprovalContextMock.mockReturnValue({
approvals: { allowlist: [], file: { version: 1, agents: {} } },
hostSecurity: "allowlist",
hostAsk: "on-miss",
askFallback: "deny",
});
const result = await executeNodeHostCommand({
command: "cd .",
workdir: "/tmp/work",
env: {},
security: "allowlist",
ask: "on-miss",
autoReview: true,
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "requested-agent",
sessionKey: "requested-session",
});
expect(result.details?.status).toBe("completed");
expect(createAndRegisterDefaultExecApprovalRequestMock).not.toHaveBeenCalled();
expectSystemRunInvoke({ invokeTimeoutMs: 35_000, runTimeoutMs: 30_000 });
});
it("keeps non-transport login shells approval-gated", async () => {
const loginPlan = {
argv: ["bash", "-lc", "./scripts/check_mail.sh --limit 5"],
cwd: "/tmp/work",
commandText: `bash -lc "./scripts/check_mail.sh --limit 5"`,
commandPreview: "./scripts/check_mail.sh --limit 5",
agentId: "prepared-agent",
sessionKey: "prepared-session",
};
parsePreparedSystemRunPayloadMock.mockReturnValue({
plan: loginPlan,
execPolicy: { security: "full", ask: "off" },
});
const nodeAllowlist = [{ pattern: "./scripts/check_mail.sh" }];
resolveExecApprovalsFromFileMock.mockReturnValue({
allowlist: nodeAllowlist,
file: { version: 1, agents: {} },
agent: {
security: "full",
ask: "off",
askFallback: "deny",
autoAllowSkills: false,
},
});
evaluateShellAllowlistMock.mockImplementation(
(params?: { command?: string; allowlist?: unknown[] }) => {
const command = params?.command ?? "";
const hasNodeAllowlist = Array.isArray(params?.allowlist) && params.allowlist.length > 0;
const semanticMatch = command === "./scripts/check_mail.sh --limit 5";
return {
allowlistMatches: semanticMatch && hasNodeAllowlist ? [{}] : [],
analysisOk: true,
allowlistSatisfied: semanticMatch && hasNodeAllowlist,
segments: [
command.startsWith("bash")
? {
resolution: null,
argv: ["bash", "-lc", "./scripts/check_mail.sh --limit 5"],
raw: `bash -lc "./scripts/check_mail.sh --limit 5"`,
}
: {
resolution: null,
argv: ["./scripts/check_mail.sh", "--limit", "5"],
raw: "./scripts/check_mail.sh --limit 5",
},
],
segmentAllowlistEntries: semanticMatch && hasNodeAllowlist ? [{}] : [],
};
},
);
requiresExecApprovalMock.mockImplementation(
(params?: { allowlistSatisfied?: boolean; durableApprovalSatisfied?: boolean }) =>
params?.allowlistSatisfied !== true && params?.durableApprovalSatisfied !== true,
);
const autoReviewer = vi.fn<ExecAutoReviewer>(async () => ({
decision: "ask",
risk: "medium",
rationale: "login shell needs human approval",
}));
resolveExecHostApprovalContextMock.mockReturnValue({
approvals: { allowlist: [], file: { version: 1, agents: {} } },
hostSecurity: "allowlist",
hostAsk: "on-miss",
askFallback: "deny",
});
const result = await executeNodeHostCommand({
command: "./scripts/check_mail.sh --limit 5",
workdir: "/tmp/work",
env: {},
security: "allowlist",
ask: "on-miss",
autoReview: true,
autoReviewer,
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "requested-agent",
sessionKey: "requested-session",
});
expect(result.details?.status).toBe("approval-pending");
expect(autoReviewer).toHaveBeenCalledWith(
expect.objectContaining({
command: `bash -lc "./scripts/check_mail.sh --limit 5"`,
argv: ["bash", "-lc", "./scripts/check_mail.sh --limit 5"],
}),
);
expect(createAndRegisterDefaultExecApprovalRequestMock).toHaveBeenCalled();
});
it("requires human approval when prepared shell payload has multiple commands", async () => {
const chainPlan = {
argv: ["/bin/sh", "-lc", "openclaw status; id"],
cwd: "/tmp/work",
commandText: `/bin/sh -lc "openclaw status; id"`,
commandPreview: "openclaw status; id",
agentId: "prepared-agent",
sessionKey: "prepared-session",
};
parsePreparedSystemRunPayloadMock.mockReturnValue({
plan: chainPlan,
execPolicy: { security: "full", ask: "off" },
});
evaluateShellAllowlistMock.mockImplementation((params?: { command?: string }) => {
const command = params?.command ?? "";
return {
allowlistMatches: [],
analysisOk: true,
allowlistSatisfied: false,
segments: command.startsWith("/bin/sh")
? [
{
resolution: null,
argv: ["/bin/sh", "-lc", "openclaw status; id"],
raw: `/bin/sh -lc "openclaw status; id"`,
},
]
: [
{
resolution: null,
argv: ["openclaw", "status"],
raw: "openclaw status",
},
{
resolution: null,
argv: ["id"],
raw: "id",
},
],
segmentAllowlistEntries: [],
};
});
const autoReviewer = vi.fn<ExecAutoReviewer>(async () => ({
decision: "allow-once",
risk: "low",
rationale: "test reviewer would allow it",
}));
resolveExecHostApprovalContextMock.mockReturnValue({
approvals: { allowlist: [], file: { version: 1, agents: {} } },
hostSecurity: "allowlist",
hostAsk: "on-miss",
askFallback: "deny",
});
const result = await executeNodeHostCommand({
command: "openclaw status; id",
workdir: "/tmp/work",
env: {},
security: "allowlist",
ask: "on-miss",
autoReview: true,
autoReviewer,
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "requested-agent",
sessionKey: "requested-session",
});
expect(result.details?.status).toBe("approval-pending");
expect(autoReviewer).not.toHaveBeenCalled();
expect(createAndRegisterDefaultExecApprovalRequestMock).toHaveBeenCalled();
});
it("does not treat read-only suppression inspections as wrapper writes", async () => {
const wrapperPlan = {
argv: ["/bin/sh", "-lc", "openclaw config get security.audit.suppressions"],
cwd: "/tmp/work",
commandText: `/bin/sh -lc "openclaw config get security.audit.suppressions"`,
commandPreview: "openclaw config get security.audit.suppressions",
agentId: "prepared-agent",
sessionKey: "prepared-session",
};
parsePreparedSystemRunPayloadMock.mockReturnValue({
plan: wrapperPlan,
execPolicy: { security: "full", ask: "off" },
});
evaluateShellAllowlistMock.mockImplementation((params?: { command?: string }) => {
const command = params?.command ?? "";
return {
allowlistMatches: [],
analysisOk: true,
allowlistSatisfied: true,
segments: [
command.startsWith("/bin/sh")
? {
resolution: null,
argv: ["/bin/sh", "-lc", "openclaw config get security.audit.suppressions"],
raw: `/bin/sh -lc "openclaw config get security.audit.suppressions"`,
}
: {
resolution: null,
argv: ["openclaw", "config", "get", "security.audit.suppressions"],
raw: "openclaw config get security.audit.suppressions",
},
],
segmentAllowlistEntries: [],
};
});
commandRequiresSecurityAuditSuppressionApprovalMock.mockImplementation(
(params?: { command?: string }) => params?.command?.startsWith("/bin/sh") === true,
);
requiresExecApprovalMock.mockReturnValue(false);
resolveExecHostApprovalContextMock.mockReturnValue({
approvals: { allowlist: [], file: { version: 1, agents: {} } },
hostSecurity: "allowlist",
hostAsk: "on-miss",
askFallback: "deny",
});
const result = await executeNodeHostCommand({
command: "openclaw config get security.audit.suppressions",
workdir: "/tmp/work",
env: {},
security: "allowlist",
ask: "on-miss",
autoReview: true,
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "requested-agent",
sessionKey: "requested-session",
});
expect(result.details?.status).toBe("completed");
expect(createAndRegisterDefaultExecApprovalRequestMock).not.toHaveBeenCalled();
expectSystemRunInvoke({ invokeTimeoutMs: 35_000, runTimeoutMs: 30_000 });
});
it("requests human approval when node auto-review asks on an approval miss", async () => {
const autoReviewer = vi.fn<ExecAutoReviewer>(async () => ({
decision: "ask",
risk: "medium",
rationale: "needs a person",
}));
const warnings: string[] = [];
resolveExecHostApprovalContextMock.mockReturnValue({
approvals: { allowlist: [], file: { version: 1, agents: {} } },
hostSecurity: "allowlist",
hostAsk: "on-miss",
askFallback: "deny",
});
const result = await executeNodeHostCommand({
command: "bun ./script.ts",
workdir: "/tmp/work",
env: {},
security: "allowlist",
ask: "on-miss",
autoReview: true,
autoReviewer,
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings,
agentId: "requested-agent",
sessionKey: "requested-session",
});
expect(result.details?.status).toBe("approval-pending");
expect(autoReviewer).toHaveBeenCalledTimes(1);
expect(createAndRegisterDefaultExecApprovalRequestMock).toHaveBeenCalledTimes(1);
expect(warnings.join("\n")).toContain("needs a person");
});
it.each([
{
name: "ask always",
nodeSecurity: "full",
nodeAsk: "always",
},
{
name: "deny security",
nodeSecurity: "deny",
nodeAsk: "off",
},
] as const)(
"requests human approval when node policy has $name floor",
async ({ nodeSecurity, nodeAsk }) => {
const autoReviewer = vi.fn<ExecAutoReviewer>(async () => ({
decision: "allow-once",
risk: "low",
rationale: "test reviewer would allow it",
}));
resolveExecHostApprovalContextMock.mockReturnValue({
approvals: { allowlist: [], file: { version: 1, agents: {} } },
hostSecurity: "allowlist",
hostAsk: "on-miss",
askFallback: "deny",
});
parsePreparedSystemRunPayloadMock.mockReturnValue({
plan: preparedPlan,
execPolicy: { security: nodeSecurity, ask: nodeAsk },
});
resolveExecApprovalsFromFileMock.mockReturnValue({
allowlist: [],
file: { version: 1, agents: {} },
agent: {
security: nodeSecurity,
ask: nodeAsk,
askFallback: "deny",
autoAllowSkills: false,
},
});
callGatewayToolMock.mockImplementation(
async (method: string, _options: unknown, params: MockNodeInvokeParams | undefined) => {
if (method === "exec.approvals.node.get") {
return { file: { version: 1, agents: {} } };
}
if (method === "exec.approval.resolve") {
return { payload: {} };
}
if (method !== "node.invoke") {
throw new Error(`unexpected gateway method: ${method}`);
}
if (params?.command === "system.run.prepare") {
return {
payload: {
plan: preparedPlan,
execPolicy: { security: nodeSecurity, ask: nodeAsk },
},
};
}
if (params?.command === "system.run") {
return {
payload: {
success: true,
stdout: "ok",
stderr: "",
exitCode: 0,
timedOut: false,
},
};
}
throw new Error(`unexpected node invoke command: ${String(params?.command)}`);
},
);
const result = await executeNodeHostCommand({
command: "bun ./script.ts",
workdir: "/tmp/work",
env: {},
security: "allowlist",
ask: "on-miss",
autoReview: true,
autoReviewer,
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "requested-agent",
sessionKey: "requested-session",
});
expect(result.details?.status).toBe("approval-pending");
expect(autoReviewer).not.toHaveBeenCalled();
expect(createAndRegisterDefaultExecApprovalRequestMock).toHaveBeenCalledTimes(1);
expect(
callGatewayToolMock.mock.calls.some(([method]) => method === "exec.approval.resolve"),
).toBe(false);
},
);
it("requests human approval when node approval policy is unavailable", async () => {
const autoReviewer = vi.fn<ExecAutoReviewer>(async () => ({
decision: "allow-once",
risk: "low",
rationale: "test reviewer would allow it",
}));
resolveExecHostApprovalContextMock.mockReturnValue({
approvals: { allowlist: [], file: { version: 1, agents: {} } },
hostSecurity: "allowlist",
hostAsk: "on-miss",
askFallback: "deny",
});
callGatewayToolMock.mockImplementation(
async (method: string, _options: unknown, params: MockNodeInvokeParams | undefined) => {
if (method === "exec.approvals.node.get") {
throw new Error("node approvals unavailable");
}
if (method === "exec.approval.resolve") {
return { payload: {} };
}
if (method !== "node.invoke") {
throw new Error(`unexpected gateway method: ${method}`);
}
if (params?.command === "system.run.prepare") {
return { payload: { plan: preparedPlan } };
}
if (params?.command === "system.run") {
return {
payload: {
success: true,
stdout: "ok",
stderr: "",
exitCode: 0,
timedOut: false,
},
};
}
throw new Error(`unexpected node invoke command: ${String(params?.command)}`);
},
);
const result = await executeNodeHostCommand({
command: "bun ./script.ts",
workdir: "/tmp/work",
env: {},
security: "allowlist",
ask: "on-miss",
autoReview: true,
autoReviewer,
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "requested-agent",
sessionKey: "requested-session",
});
expect(result.details?.status).toBe("approval-pending");
expect(autoReviewer).not.toHaveBeenCalled();
expect(createAndRegisterDefaultExecApprovalRequestMock).toHaveBeenCalledTimes(1);
expect(
callGatewayToolMock.mock.calls.some(([method]) => method === "exec.approval.resolve"),
).toBe(false);
});
it("does not use fallback-full when node approval policy is unavailable", async () => {
const autoReviewer = vi.fn<ExecAutoReviewer>(async () => ({
decision: "allow-once",
risk: "low",
rationale: "test reviewer would allow it",
}));
resolveExecHostApprovalContextMock.mockReturnValue({
approvals: { allowlist: [], file: { version: 1, agents: {} } },
hostSecurity: "allowlist",
hostAsk: "on-miss",
askFallback: "full",
});
callGatewayToolMock.mockImplementation(
async (method: string, _options: unknown, params: MockNodeInvokeParams | undefined) => {
if (method === "exec.approvals.node.get") {
throw new Error("node approvals unavailable");
}
if (method !== "node.invoke") {
throw new Error(`unexpected gateway method: ${method}`);
}
if (params?.command === "system.run.prepare") {
return { payload: { plan: preparedPlan } };
}
if (params?.command === "system.run") {
return {
payload: {
success: true,
stdout: "should-not-run",
stderr: "",
exitCode: 0,
timedOut: false,
},
};
}
throw new Error(`unexpected node invoke command: ${String(params?.command)}`);
},
);
resolveApprovalDecisionOrUndefinedMock.mockResolvedValue(null);
createExecApprovalDecisionStateMock.mockReturnValue({
baseDecision: { timedOut: true },
approvedByAsk: true,
deniedReason: null,
});
enforceStrictInlineEvalApprovalBoundaryMock.mockImplementation((value) =>
value.requiresAutoReviewHumanApproval === true && value.baseDecision.timedOut
? { approvedByAsk: false, deniedReason: "approval-timeout" }
: { approvedByAsk: value.approvedByAsk, deniedReason: value.deniedReason },
);
const result = await executeNodeHostCommand({
command: "bun ./script.ts",
workdir: "/tmp/work",
env: {},
security: "allowlist",
ask: "on-miss",
autoReview: true,
autoReviewer,
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "requested-agent",
sessionKey: "requested-session",
});
expect(result.details?.status).toBe("approval-pending");
expect(autoReviewer).not.toHaveBeenCalled();
await vi.waitFor(() => {
expect(sendExecApprovalFollowupResultMock).toHaveBeenCalledWith(
expect.objectContaining({
approvalId: "approval-1",
sessionKey: "requested-session",
}),
"Exec denied (node=node-1 id=approval-1, approval-timeout): bun ./script.ts",
);
});
expect(
callGatewayToolMock.mock.calls.some(
([method, , params]) =>
method === "node.invoke" &&
(params as MockNodeInvokeParams | undefined)?.command === "system.run",
),
).toBe(false);
});
it("auto-reviews strict inline-eval commands before asking a human", async () => {
const inlinePlan = {
argv: ["/bin/sh", "-lc", "python3 -c 'print(1)'"],
cwd: "/tmp/work",
commandText: `/bin/sh -lc "python3 -c 'print(1)'"`,
commandPreview: "python3 -c 'print(1)'",
agentId: "requested-agent",
sessionKey: "requested-session",
};
parsePreparedSystemRunPayloadMock.mockReturnValue({
plan: inlinePlan,
execPolicy: { security: "full", ask: "off" },
});
const autoReviewer = vi.fn<ExecAutoReviewer>(async () => ({
decision: "allow-once",
risk: "low",
rationale: "safe inline eval",
}));
detectInterpreterInlineEvalArgvMock.mockImplementation((argv?: unknown) =>
Array.isArray(argv) && argv[0] === "python3" ? INLINE_EVAL_HIT : null,
);
evaluateShellAllowlistMock.mockImplementation((params?: { command?: string }) => {
const command = params?.command ?? "";
const segment = command.startsWith("/bin/sh")
? {
resolution: null,
argv: ["/bin/sh", "-lc", "python3 -c 'print(1)'"],
raw: `/bin/sh -lc "python3 -c 'print(1)'"`,
}
: {
resolution: null,
argv: ["python3", "-c", "print(1)"],
raw: "python3 -c 'print(1)'",
};
return {
allowlistMatches: [],
analysisOk: true,
allowlistSatisfied: false,
segments: [segment],
segmentAllowlistEntries: [],
};
});
resolveExecHostApprovalContextMock.mockReturnValue({
approvals: { allowlist: [], file: { version: 1, agents: {} } },
hostSecurity: "allowlist",
hostAsk: "on-miss",
askFallback: "deny",
});
const warnings: string[] = [];
const result = await executeNodeHostCommand({
command: "python3 -c 'print(1)'",
workdir: "/tmp/work",
env: {},
security: "allowlist",
ask: "on-miss",
autoReview: true,
autoReviewer,
strictInlineEval: true,
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings,
agentId: "requested-agent",
sessionKey: "requested-session",
});
expect(result.details?.status).toBe("completed");
expect(autoReviewer).toHaveBeenCalledWith(
expect.objectContaining({
command: `/bin/sh -lc "python3 -c 'print(1)'"`,
argv: ["python3", "-c", "print(1)"],
host: "node",
reason: "strict-inline-eval",
analysis: expect.objectContaining({
inlineEval: true,
}),
}),
);
expect(createAndRegisterDefaultExecApprovalRequestMock).not.toHaveBeenCalled();
expect(warnings[0]).toContain("requires reviewer or explicit approval");
});
it("keeps security audit suppression edits off the auto-review path", async () => {
const autoReviewer = vi.fn<ExecAutoReviewer>(async () => ({
decision: "allow-once",
risk: "low",
rationale: "test reviewer would allow it",
}));
const warnings: string[] = [];
commandRequiresSecurityAuditSuppressionApprovalMock.mockReturnValue(true);
resolveExecHostApprovalContextMock.mockReturnValue({
approvals: { allowlist: [], file: { version: 1, agents: {} } },
hostSecurity: "allowlist",
hostAsk: "on-miss",
askFallback: "deny",
});
const result = await executeNodeHostCommand({
command: "openclaw config set security.audit.suppressions '[]'",
workdir: "/tmp/work",
env: {},
security: "allowlist",
ask: "on-miss",
autoReview: true,
autoReviewer,
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings,
agentId: "requested-agent",
sessionKey: "requested-session",
});
expect(result.details?.status).toBe("approval-pending");
expect(autoReviewer).not.toHaveBeenCalled();
expect(createAndRegisterDefaultExecApprovalRequestMock).toHaveBeenCalledTimes(1);
expect(warnings).toContain(
"Warning: security audit suppression changes require explicit approval unless exec is running in yolo mode.",
);
});
it("requests human approval when node auto-review cannot bind a single parsed command", async () => {
const autoReviewer = vi.fn<ExecAutoReviewer>(async () => ({
decision: "allow-once",
risk: "low",
rationale: "test reviewer would allow it",
}));
evaluateShellAllowlistMock.mockReturnValue({
allowlistMatches: [],
analysisOk: true,
allowlistSatisfied: false,
segments: [
{ raw: "echo ok", resolution: null, argv: ["echo", "ok"] },
{ raw: "pwd", resolution: null, argv: ["pwd"] },
],
segmentAllowlistEntries: [],
});
resolveExecHostApprovalContextMock.mockReturnValue({
approvals: { allowlist: [], file: { version: 1, agents: {} } },
hostSecurity: "allowlist",
hostAsk: "on-miss",
askFallback: "deny",
});
const result = await executeNodeHostCommand({
command: "echo ok; pwd",
workdir: "/tmp/work",
env: {},
security: "allowlist",
ask: "on-miss",
autoReview: true,
autoReviewer,
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "requested-agent",
sessionKey: "requested-session",
});
expect(result.details?.status).toBe("approval-pending");
expect(autoReviewer).not.toHaveBeenCalled();
expect(createAndRegisterDefaultExecApprovalRequestMock).toHaveBeenCalledTimes(1);
});
it("requests human approval when node runtime policy requires ask always", async () => {
const autoReviewer = vi.fn<ExecAutoReviewer>(async () => ({
decision: "allow-once",
risk: "low",
rationale: "test reviewer would allow it",
}));
parsePreparedSystemRunPayloadMock.mockReturnValue({
plan: preparedPlan,
execPolicy: { security: "full", ask: "always" },
});
resolveExecApprovalsFromFileMock.mockReturnValue({
allowlist: [],
file: { version: 1, agents: {} },
agent: {
security: "full",
ask: "off",
askFallback: "deny",
autoAllowSkills: false,
},
});
resolveExecHostApprovalContextMock.mockReturnValue({
approvals: { allowlist: [], file: { version: 1, agents: {} } },
hostSecurity: "allowlist",
hostAsk: "on-miss",
askFallback: "deny",
});
const result = await executeNodeHostCommand({
command: "bun ./script.ts",
workdir: "/tmp/work",
env: {},
security: "allowlist",
ask: "on-miss",
autoReview: true,
autoReviewer,
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "requested-agent",
sessionKey: "requested-session",
});
expect(result.details?.status).toBe("approval-pending");
expect(autoReviewer).not.toHaveBeenCalled();
expect(createAndRegisterDefaultExecApprovalRequestMock).toHaveBeenCalledTimes(1);
expect(resolveExecApprovalAllowedDecisionsMock).toHaveBeenCalledWith({
ask: "always",
allowAlwaysPersistence: {
kind: "patterns",
patterns: [{ pattern: "/trusted/bin/tool" }],
},
});
expect(requireRegisteredApprovalRequest().unavailableDecisions).toEqual(["allow-always"]);
expect(buildExecApprovalPendingToolResultMock).toHaveBeenCalledWith(
expect.objectContaining({
allowedDecisions: ["allow-once", "deny"],
}),
);
});
it("omits allow-always from node approval prompts when node runtime policy is missing", async () => {
const autoReviewer = vi.fn<ExecAutoReviewer>(async () => ({
decision: "allow-once",
risk: "low",
rationale: "test reviewer would allow it",
}));
parsePreparedSystemRunPayloadMock.mockReturnValue({
plan: preparedPlan,
execPolicy: undefined,
});
resolveExecHostApprovalContextMock.mockReturnValue({
approvals: { allowlist: [], file: { version: 1, agents: {} } },
hostSecurity: "allowlist",
hostAsk: "on-miss",
askFallback: "deny",
});
const result = await executeNodeHostCommand({
command: "bun ./script.ts",
workdir: "/tmp/work",
env: {},
security: "allowlist",
ask: "on-miss",
autoReview: true,
autoReviewer,
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "requested-agent",
sessionKey: "requested-session",
});
expect(result.details?.status).toBe("approval-pending");
expect(autoReviewer).not.toHaveBeenCalled();
expect(resolveExecApprovalAllowedDecisionsMock).toHaveBeenCalledWith({
ask: "always",
allowAlwaysPersistence: {
kind: "patterns",
patterns: [{ pattern: "/trusted/bin/tool" }],
},
});
expect(requireRegisteredApprovalRequest().unavailableDecisions).toEqual(["allow-always"]);
});
it("offers allow-always for prepared node commands with complete node coverage", async () => {
const preparedWrapperPlan = {
...preparedPlan,
argv: ["/bin/sh", "-lc", "git status"],
commandText: '/bin/sh -lc "git status"',
commandPreview: "git status",
};
mockGatewayInvokesWithNodeApprovals({ version: 1, agents: {} });
usePolicyApprovalRequirementMock();
parsePreparedSystemRunPayloadMock.mockReturnValueOnce({
plan: preparedWrapperPlan,
execPolicy: { security: "full", ask: "off" },
allowAlwaysCoverage: {
complete: true,
patterns: [{ pattern: "/node/bin/git" }],
},
});
resolveAllowAlwaysPersistenceDecisionMock.mockImplementationOnce((params) => {
const commandText = params.commandText?.trim();
return params.preparedCoverage?.complete === true && params.preparedCoverage.patterns.length
? {
kind: "patterns",
...(commandText ? { commandText } : {}),
patterns: params.preparedCoverage.patterns,
}
: {
kind: "one-shot",
reasons: ["no-reusable-pattern"],
};
});
resolveExecHostApprovalContextMock.mockReturnValue({
approvals: { allowlist: [], file: { version: 1, agents: {} } },
hostSecurity: "allowlist",
hostAsk: "on-miss",
askFallback: "deny",
});
resolveApprovalDecisionOrUndefinedMock.mockResolvedValue(undefined);
const result = await executeNodeHostCommand({
command: "git status",
workdir: "/tmp/work",
env: {},
security: "allowlist",
ask: "on-miss",
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "requested-agent",
sessionKey: "requested-session",
});
expect(result.details?.status).toBe("approval-pending");
expect(resolveAllowAlwaysPersistenceDecisionMock).toHaveBeenCalledWith(
expect.objectContaining({
commandText: '/bin/sh -lc "git status"',
preparedCoverage: {
complete: true,
patterns: [{ pattern: "/node/bin/git" }],
},
}),
);
expect(resolveExecApprovalAllowedDecisionsMock).toHaveBeenCalledWith({
ask: "on-miss",
allowAlwaysPersistence: {
kind: "patterns",
commandText: '/bin/sh -lc "git status"',
patterns: [{ pattern: "/node/bin/git" }],
},
});
expect(requireRegisteredApprovalRequest().unavailableDecisions).toBeUndefined();
});
it("does not use fallback-full when node auto-review cannot parse the command", async () => {
const autoReviewer = vi.fn<ExecAutoReviewer>(async () => ({
decision: "allow-once",
risk: "low",
rationale: "test reviewer would allow it",
}));
evaluateShellAllowlistMock.mockReturnValue({
allowlistMatches: [],
analysisOk: false,
allowlistSatisfied: false,
segments: [],
segmentAllowlistEntries: [],
});
resolveExecHostApprovalContextMock.mockReturnValue({
approvals: { allowlist: [], file: { version: 1, agents: {} } },
hostSecurity: "allowlist",
hostAsk: "on-miss",
askFallback: "full",
});
resolveApprovalDecisionOrUndefinedMock.mockResolvedValue(null);
createExecApprovalDecisionStateMock.mockReturnValue({
baseDecision: { timedOut: true },
approvedByAsk: true,
deniedReason: null,
});
enforceStrictInlineEvalApprovalBoundaryMock.mockImplementation((value) =>
value.requiresAutoReviewHumanApproval === true && value.baseDecision.timedOut
? { approvedByAsk: false, deniedReason: "approval-timeout" }
: { approvedByAsk: value.approvedByAsk, deniedReason: value.deniedReason },
);
const result = await executeNodeHostCommand({
command: "echo 'unterminated",
workdir: "/tmp/work",
env: {},
security: "allowlist",
ask: "on-miss",
autoReview: true,
autoReviewer,
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "requested-agent",
sessionKey: "requested-session",
});
expect(result.details?.status).toBe("approval-pending");
expect(autoReviewer).not.toHaveBeenCalled();
await vi.waitFor(() => {
expect(sendExecApprovalFollowupResultMock).toHaveBeenCalledWith(
expect.objectContaining({
approvalId: "approval-1",
sessionKey: "requested-session",
}),
"Exec denied (node=node-1 id=approval-1, approval-timeout): echo 'unterminated",
);
});
expect(
callGatewayToolMock.mock.calls.some(
([method, , params]) =>
method === "node.invoke" &&
(params as MockNodeInvokeParams | undefined)?.command === "system.run",
),
).toBe(false);
});
it("does not use fallback-full when node auto-review asks for human approval", async () => {
const autoReviewer = vi.fn<ExecAutoReviewer>(async () => ({
decision: "ask",
risk: "medium",
rationale: "needs a person",
}));
resolveExecHostApprovalContextMock.mockReturnValue({
approvals: { allowlist: [], file: { version: 1, agents: {} } },
hostSecurity: "allowlist",
hostAsk: "on-miss",
askFallback: "full",
});
resolveApprovalDecisionOrUndefinedMock.mockResolvedValue(null);
createExecApprovalDecisionStateMock.mockReturnValue({
baseDecision: { timedOut: true },
approvedByAsk: true,
deniedReason: null,
});
enforceStrictInlineEvalApprovalBoundaryMock.mockImplementation((value) =>
value.requiresAutoReviewHumanApproval === true && value.baseDecision.timedOut
? { approvedByAsk: false, deniedReason: "approval-timeout" }
: { approvedByAsk: value.approvedByAsk, deniedReason: value.deniedReason },
);
const result = await executeNodeHostCommand({
command: "bun ./script.ts",
workdir: "/tmp/work",
env: {},
security: "allowlist",
ask: "on-miss",
autoReview: true,
autoReviewer,
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "requested-agent",
sessionKey: "requested-session",
});
expect(result.details?.status).toBe("approval-pending");
await vi.waitFor(() => {
expect(sendExecApprovalFollowupResultMock).toHaveBeenCalledWith(
expect.objectContaining({
approvalId: "approval-1",
sessionKey: "requested-session",
}),
"Exec denied (node=node-1 id=approval-1, approval-timeout): bun ./script.ts",
);
});
expect(
callGatewayToolMock.mock.calls.some(
([method, , params]) =>
method === "node.invoke" &&
(params as MockNodeInvokeParams | undefined)?.command === "system.run",
),
).toBe(false);
});
it("builds a local systemRunPlan when approval is required and the node omits prepare", async () => {
listNodesMock.mockResolvedValueOnce([
{
nodeId: "node-1",
commands: ["system.run", "system.which", "system.notify"],
platform: "darwin",
},
]);
resolveExecHostApprovalContextMock.mockReturnValue({
approvals: { allowlist: [], file: { version: 1, agents: {} } },
hostSecurity: "full",
hostAsk: "always",
askFallback: "deny",
});
const result = await executeNodeHostCommand({
command: "bun ./script.ts",
workdir: "/tmp/work",
env: {},
security: "full",
ask: "off",
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "requested-agent",
sessionKey: "requested-session",
});
expect(result.details?.status).toBe("approval-pending");
expect(parsePreparedSystemRunPayloadMock).not.toHaveBeenCalled();
const expectedPlan = {
argv: ["/bin/sh", "-lc", "bun ./script.ts"],
cwd: "/tmp/work",
commandText: '/bin/sh -lc "bun ./script.ts"',
commandPreview: "bun ./script.ts",
agentId: "requested-agent",
sessionKey: "requested-session",
};
expect(requireRegisteredApprovalRequest().systemRunPlan).toEqual(expectedPlan);
await vi.waitFor(() => {
const call = requireGatewayCommand("system.run");
expect(call.callOptions).toEqual({ scopes: ["operator.write", "operator.approvals"] });
const runParams = requireRunParams(call);
expect(runParams.rawCommand).toBe(expectedPlan.commandText);
expect(runParams.systemRunPlan).toEqual(expectedPlan);
});
});
it("requires approval when node allowlist matching would depend on gateway PATH", async () => {
const allowlistEntry = { pattern: "/trusted/bin/tool" };
mockGatewayInvokesWithNodeApprovals({ version: 1, agents: {} });
usePolicyApprovalRequirementMock();
resolveExecApprovalsFromFileMock.mockReturnValue({
agent: { security: "allowlist", ask: "on-miss" },
allowlist: [allowlistEntry],
file: { version: 1, agents: {} },
});
evaluateShellAllowlistMock.mockImplementation((raw: unknown) => {
const params = raw as ShellAllowlistMockParams;
const hasNodeAllowlist = (params.allowlist ?? []).length > 0;
const gatewayPathWouldMatch = params.env?.PATH?.includes("/trusted/bin") === true;
return buildAllowlistEvalResult({
allowlistSatisfied: hasNodeAllowlist && gatewayPathWouldMatch,
segmentAllowlistEntry: allowlistEntry,
});
});
resolveExecHostApprovalContextMock.mockReturnValue({
approvals: { allowlist: [], file: { version: 1, agents: {} } },
hostSecurity: "allowlist",
hostAsk: "on-miss",
askFallback: "deny",
});
resolveApprovalDecisionOrUndefinedMock.mockResolvedValue(undefined);
const result = await executeNodeHostCommand({
command: "tool --version",
workdir: "/tmp/work",
env: { PATH: "/trusted/bin:/usr/bin" },
security: "allowlist",
ask: "on-miss",
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "requested-agent",
sessionKey: "requested-session",
});
expect(result.details?.status).toBe("approval-pending");
expect(registerExecApprovalRequestForHostOrThrowMock).toHaveBeenCalledTimes(1);
expect(requireRegisteredApprovalRequest().env).toBeUndefined();
const evalEnvs = evaluateShellAllowlistMock.mock.calls.map(
([raw]) => (raw as ShellAllowlistMockParams).env,
);
expect(evalEnvs.length).toBeGreaterThanOrEqual(2);
expect(evalEnvs.every((env) => env?.PATH === "" && env?.Path === "")).toBe(true);
await vi.waitFor(() => {
expect(resolveApprovalDecisionOrUndefinedMock).toHaveBeenCalledTimes(1);
});
});
it("reuses exact node allow-always command entries for prechecks", async () => {
const allowlistEntry = {
pattern: "/trusted/bin/tool",
source: "allow-always" as const,
};
const commandMarker = { pattern: nodeCommandMarker, source: "allow-always" as const };
mockGatewayInvokesWithNodeApprovals({ version: 1, agents: {} });
usePolicyApprovalRequirementMock();
resolveExecApprovalsFromFileMock.mockReturnValue({
agent: { security: "allowlist", ask: "on-miss" },
allowlist: [commandMarker, allowlistEntry],
file: { version: 1, agents: {} },
});
evaluateShellAllowlistMock.mockImplementation((raw: unknown) => {
const params = raw as ShellAllowlistMockParams;
expect(params.env?.PATH).toBe("");
expect(params.env?.Path).toBe("");
return {
allowlistMatches: [],
analysisOk: true,
allowlistSatisfied: false,
segments: [{ resolution: null, argv: ["/trusted/bin/tool", "--version"] }],
segmentAllowlistEntries: [null],
};
});
resolveAllowAlwaysPatternCoverageMock.mockImplementation((raw: unknown) => {
const params = raw as { segments?: MockAllowlistSegment[]; env?: NodeJS.ProcessEnv };
expect(params.env?.PATH).toBe("");
expect(params.env?.Path).toBe("");
expect(params.segments?.[0]?.argv[0]).toBe("/trusted/bin/tool");
return {
complete: true,
patterns: [{ pattern: "/trusted/bin/tool" }],
};
});
resolveExecHostApprovalContextMock.mockReturnValue({
approvals: { allowlist: [], file: { version: 1, agents: {} } },
hostSecurity: "allowlist",
hostAsk: "on-miss",
askFallback: "deny",
});
const result = await executeNodeHostCommand({
command: "/trusted/bin/tool --version",
workdir: "/tmp/work",
env: { PATH: "/gateway/bin:/usr/bin" },
security: "allowlist",
ask: "on-miss",
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "requested-agent",
sessionKey: "requested-session",
});
expect(result.details?.status).toBe("completed");
expect(registerExecApprovalRequestForHostOrThrowMock).not.toHaveBeenCalled();
expect(requiresExecApprovalMock).toHaveBeenLastCalledWith(
expect.objectContaining({
analysisOk: true,
allowlistSatisfied: false,
durableApprovalSatisfied: true,
}),
);
expect(requireRunParams(requireGatewayCommand("system.run")).env).toBeUndefined();
});
it("omits allow-always from node approval prompts when persistence is one-shot", async () => {
mockGatewayInvokesWithNodeApprovals({ version: 1, agents: {} });
usePolicyApprovalRequirementMock();
resolveAllowAlwaysPersistenceDecisionMock.mockReturnValue({
kind: "one-shot",
reasons: ["unplanned"],
});
resolveExecHostApprovalContextMock.mockReturnValue({
approvals: { allowlist: [], file: { version: 1, agents: {} } },
hostSecurity: "allowlist",
hostAsk: "on-miss",
askFallback: "deny",
});
resolveApprovalDecisionOrUndefinedMock.mockResolvedValue(undefined);
const result = await executeNodeHostCommand({
command: "bun ./script.ts",
workdir: "/tmp/work",
env: {},
security: "allowlist",
ask: "on-miss",
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "requested-agent",
sessionKey: "requested-session",
});
expect(result.details?.status).toBe("approval-pending");
expect(resolveAllowAlwaysPersistenceDecisionMock).toHaveBeenCalledWith(
expect.objectContaining({
commandText: "bun ./script.ts",
platform: process.platform,
runtimePayload: false,
}),
);
expect(resolveExecApprovalAllowedDecisionsMock).toHaveBeenCalledWith({
ask: "on-miss",
allowAlwaysPersistence: { kind: "one-shot", reasons: ["unplanned"] },
});
expect(requireRegisteredApprovalRequest().unavailableDecisions).toEqual(["allow-always"]);
expect(buildExecApprovalPendingToolResultMock).toHaveBeenCalledWith(
expect.objectContaining({
allowedDecisions: ["allow-once", "deny"],
}),
);
});
it("reuses de-duplicated node allow-always metadata for repeated command segments", async () => {
const allowlistEntry = {
pattern: "/trusted/bin/tool",
source: "allow-always" as const,
};
const commandMarker = { pattern: nodeCommandMarker, source: "allow-always" as const };
mockGatewayInvokesWithNodeApprovals({ version: 1, agents: {} });
usePolicyApprovalRequirementMock();
resolveExecApprovalsFromFileMock.mockReturnValue({
agent: { security: "allowlist", ask: "on-miss" },
allowlist: [commandMarker, allowlistEntry],
file: { version: 1, agents: {} },
});
evaluateShellAllowlistMock.mockReturnValue({
allowlistMatches: [],
analysisOk: true,
allowlistSatisfied: false,
segments: [
{ resolution: null, argv: ["/trusted/bin/tool", "a"] },
{ resolution: null, argv: ["/trusted/bin/tool", "b"] },
],
segmentAllowlistEntries: [null, null],
});
resolveAllowAlwaysPatternCoverageMock.mockReturnValue({
complete: true,
patterns: [{ pattern: "/trusted/bin/tool" }],
});
resolveExecHostApprovalContextMock.mockReturnValue({
approvals: { allowlist: [], file: { version: 1, agents: {} } },
hostSecurity: "allowlist",
hostAsk: "on-miss",
askFallback: "deny",
});
const result = await executeNodeHostCommand({
command: "/trusted/bin/tool a && /trusted/bin/tool b",
workdir: "/tmp/work",
env: {},
security: "allowlist",
ask: "on-miss",
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "requested-agent",
sessionKey: "requested-session",
});
expect(result.details?.status).toBe("completed");
expect(registerExecApprovalRequestForHostOrThrowMock).not.toHaveBeenCalled();
expect(requiresExecApprovalMock).toHaveBeenLastCalledWith(
expect.objectContaining({
allowlistSatisfied: false,
durableApprovalSatisfied: true,
}),
);
});
it("does not reuse partial node allow-always metadata for compound commands", async () => {
const allowlistEntry = {
pattern: "/trusted/bin/foo",
source: "allow-always" as const,
};
const commandMarker = { pattern: nodeCommandMarker, source: "allow-always" as const };
mockGatewayInvokesWithNodeApprovals({ version: 1, agents: {} });
usePolicyApprovalRequirementMock();
resolveExecApprovalsFromFileMock.mockReturnValue({
agent: { security: "allowlist", ask: "on-miss" },
allowlist: [commandMarker, allowlistEntry],
file: { version: 1, agents: {} },
});
evaluateShellAllowlistMock.mockReturnValue({
allowlistMatches: [],
analysisOk: true,
allowlistSatisfied: false,
segments: [
{ resolution: null, argv: ["foo"] },
{ resolution: null, argv: ["bar"] },
],
segmentAllowlistEntries: [null, null],
});
resolveAllowAlwaysPatternCoverageMock.mockReturnValue({
complete: true,
patterns: [{ pattern: "/trusted/bin/foo" }, { pattern: "/trusted/bin/bar" }],
});
resolveExecHostApprovalContextMock.mockReturnValue({
approvals: { allowlist: [], file: { version: 1, agents: {} } },
hostSecurity: "allowlist",
hostAsk: "on-miss",
askFallback: "deny",
});
resolveApprovalDecisionOrUndefinedMock.mockResolvedValue(undefined);
const result = await executeNodeHostCommand({
command: "foo && bar",
workdir: "/tmp/work",
env: {},
security: "allowlist",
ask: "on-miss",
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "requested-agent",
sessionKey: "requested-session",
});
expect(result.details?.status).toBe("approval-pending");
expect(registerExecApprovalRequestForHostOrThrowMock).toHaveBeenCalledTimes(1);
expect(requiresExecApprovalMock).toHaveBeenLastCalledWith(
expect.objectContaining({
allowlistSatisfied: false,
durableApprovalSatisfied: false,
}),
);
});
it("does not reuse a node command marker when concrete allow-always coverage is empty", async () => {
const commandMarker = { pattern: nodeCommandMarker, source: "allow-always" as const };
mockGatewayInvokesWithNodeApprovals({ version: 1, agents: {} });
usePolicyApprovalRequirementMock();
resolveExecApprovalsFromFileMock.mockReturnValue({
agent: { security: "allowlist", ask: "on-miss" },
allowlist: [commandMarker],
file: { version: 1, agents: {} },
});
evaluateShellAllowlistMock.mockReturnValue({
allowlistMatches: [],
analysisOk: true,
allowlistSatisfied: false,
segments: [{ resolution: null, argv: ["tool", "--version"] }],
segmentAllowlistEntries: [null],
});
resolveAllowAlwaysPatternCoverageMock.mockReturnValue({
complete: false,
patterns: [],
});
resolveExecHostApprovalContextMock.mockReturnValue({
approvals: { allowlist: [], file: { version: 1, agents: {} } },
hostSecurity: "allowlist",
hostAsk: "on-miss",
askFallback: "deny",
});
resolveApprovalDecisionOrUndefinedMock.mockResolvedValue(undefined);
const result = await executeNodeHostCommand({
command: "tool --version",
workdir: "/tmp/work",
env: {},
security: "allowlist",
ask: "on-miss",
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "requested-agent",
sessionKey: "requested-session",
});
expect(result.details?.status).toBe("approval-pending");
expect(registerExecApprovalRequestForHostOrThrowMock).toHaveBeenCalledTimes(1);
expect(requiresExecApprovalMock).toHaveBeenLastCalledWith(
expect.objectContaining({
allowlistSatisfied: false,
durableApprovalSatisfied: false,
}),
);
});
it("reuses current node-reported coverage when gateway analysis cannot resolve node paths", async () => {
const commandMarker = { pattern: nodeCommandMarker, source: "allow-always" as const };
const allowlistEntry = {
pattern: "/node/bin/tool",
source: "allow-always" as const,
};
mockGatewayInvokesWithNodeApprovals({ version: 1, agents: {} });
usePolicyApprovalRequirementMock();
parsePreparedSystemRunPayloadMock.mockReturnValueOnce({
plan: preparedPlan,
execPolicy: { security: "full", ask: "off" },
allowAlwaysCoverage: {
complete: true,
patterns: [{ pattern: "/node/bin/tool" }],
},
});
resolveExecApprovalsFromFileMock.mockReturnValue({
agent: { security: "allowlist", ask: "on-miss" },
allowlist: [commandMarker, allowlistEntry],
file: { version: 1, agents: {} },
});
evaluateShellAllowlistMock.mockReturnValue({
allowlistMatches: [],
analysisOk: true,
allowlistSatisfied: false,
segments: [{ resolution: null, argv: ["tool", "--version"] }],
segmentAllowlistEntries: [null],
});
resolveAllowAlwaysPatternCoverageMock.mockReturnValue({
complete: false,
patterns: [],
});
resolveExecHostApprovalContextMock.mockReturnValue({
approvals: { allowlist: [], file: { version: 1, agents: {} } },
hostSecurity: "allowlist",
hostAsk: "on-miss",
askFallback: "deny",
});
const result = await executeNodeHostCommand({
command: "tool --version",
workdir: "/tmp/work",
env: {},
security: "allowlist",
ask: "on-miss",
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "requested-agent",
sessionKey: "requested-session",
});
expect(result.details?.status).toBe("completed");
expect(registerExecApprovalRequestForHostOrThrowMock).not.toHaveBeenCalled();
expect(requiresExecApprovalMock).toHaveBeenLastCalledWith(
expect.objectContaining({
allowlistSatisfied: false,
durableApprovalSatisfied: true,
}),
);
});
it("does not reuse last-used node metadata without an exact command marker", async () => {
const allowlistEntries = [
{
pattern: "/trusted/bin/foo",
argPattern: "^a\x00$",
source: "allow-always" as const,
lastUsedCommand: preparedPlan.commandText,
},
{
pattern: "/trusted/bin/foo",
argPattern: "^b\x00$",
source: "allow-always" as const,
lastUsedCommand: preparedPlan.commandText,
},
];
mockGatewayInvokesWithNodeApprovals({ version: 1, agents: {} });
usePolicyApprovalRequirementMock();
resolveExecApprovalsFromFileMock.mockReturnValue({
agent: { security: "allowlist", ask: "on-miss" },
allowlist: allowlistEntries,
file: { version: 1, agents: {} },
});
evaluateShellAllowlistMock.mockReturnValue({
allowlistMatches: [],
analysisOk: true,
allowlistSatisfied: false,
segments: [
{ resolution: null, argv: ["foo", "a"] },
{ resolution: null, argv: ["foo", "b"] },
{ resolution: null, argv: ["missingcmd"] },
],
segmentAllowlistEntries: [null, null, null],
});
resolveAllowAlwaysPatternCoverageMock.mockReturnValue({ complete: false, patterns: [] });
resolveExecHostApprovalContextMock.mockReturnValue({
approvals: { allowlist: [], file: { version: 1, agents: {} } },
hostSecurity: "allowlist",
hostAsk: "on-miss",
askFallback: "deny",
});
resolveApprovalDecisionOrUndefinedMock.mockResolvedValue(undefined);
const result = await executeNodeHostCommand({
command: "foo a && foo b && missingcmd",
workdir: "/tmp/work",
env: {},
security: "allowlist",
ask: "on-miss",
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "requested-agent",
sessionKey: "requested-session",
});
expect(result.details?.status).toBe("approval-pending");
expect(registerExecApprovalRequestForHostOrThrowMock).toHaveBeenCalledTimes(1);
expect(requiresExecApprovalMock).toHaveBeenLastCalledWith(
expect.objectContaining({
allowlistSatisfied: false,
durableApprovalSatisfied: false,
}),
);
});
it("does not reuse node allow-always metadata when only representable segments match", async () => {
const allowlistEntries = [
{
pattern: "/bin/echo",
source: "allow-always" as const,
},
{
pattern: "/bin/date",
source: "allow-always" as const,
},
];
const commandMarker = { pattern: nodeCommandMarker, source: "allow-always" as const };
mockGatewayInvokesWithNodeApprovals({ version: 1, agents: {} });
usePolicyApprovalRequirementMock();
resolveExecApprovalsFromFileMock.mockReturnValue({
agent: { security: "allowlist", ask: "on-miss" },
allowlist: [commandMarker, ...allowlistEntries],
file: { version: 1, agents: {} },
});
evaluateShellAllowlistMock.mockReturnValue({
allowlistMatches: [],
analysisOk: true,
allowlistSatisfied: false,
segments: [
{ resolution: null, argv: ["sh", "-c", "/bin/echo ok && /bin/date"] },
{ resolution: null, argv: ["missingcmd"] },
],
segmentAllowlistEntries: [null, null],
});
resolveAllowAlwaysPatternCoverageMock.mockReturnValue({
complete: false,
patterns: [{ pattern: "/bin/echo" }, { pattern: "/bin/date" }],
});
resolveExecHostApprovalContextMock.mockReturnValue({
approvals: { allowlist: [], file: { version: 1, agents: {} } },
hostSecurity: "allowlist",
hostAsk: "on-miss",
askFallback: "deny",
});
resolveApprovalDecisionOrUndefinedMock.mockResolvedValue(undefined);
const result = await executeNodeHostCommand({
command: 'sh -c "/bin/echo ok && /bin/date" && missingcmd',
workdir: "/tmp/work",
env: {},
security: "allowlist",
ask: "on-miss",
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "requested-agent",
sessionKey: "requested-session",
});
expect(result.details?.status).toBe("approval-pending");
expect(registerExecApprovalRequestForHostOrThrowMock).toHaveBeenCalledTimes(1);
expect(requiresExecApprovalMock).toHaveBeenLastCalledWith(
expect.objectContaining({
allowlistSatisfied: false,
durableApprovalSatisfied: false,
}),
);
});
it("does not use unresolved node allow-always fallback for shell wrappers", async () => {
const allowlistEntry = {
pattern: "/trusted/bin/foo",
source: "allow-always" as const,
};
mockGatewayInvokesWithNodeApprovals({ version: 1, agents: {} });
usePolicyApprovalRequirementMock();
resolveExecApprovalsFromFileMock.mockReturnValue({
agent: { security: "allowlist", ask: "on-miss" },
allowlist: [allowlistEntry],
file: { version: 1, agents: {} },
});
evaluateShellAllowlistMock.mockReturnValue({
allowlistMatches: [],
analysisOk: true,
allowlistSatisfied: false,
segments: [{ resolution: null, argv: ["bash", "-lc", "foo && missingcmd"] }],
segmentAllowlistEntries: [null],
});
resolveAllowAlwaysPatternCoverageMock.mockReturnValue({ complete: false, patterns: [] });
resolveExecHostApprovalContextMock.mockReturnValue({
approvals: { allowlist: [], file: { version: 1, agents: {} } },
hostSecurity: "allowlist",
hostAsk: "on-miss",
askFallback: "deny",
});
resolveApprovalDecisionOrUndefinedMock.mockResolvedValue(undefined);
const result = await executeNodeHostCommand({
command: 'bash -lc "foo && missingcmd"',
workdir: "/tmp/work",
env: {},
security: "allowlist",
ask: "on-miss",
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "requested-agent",
sessionKey: "requested-session",
});
expect(result.details?.status).toBe("approval-pending");
expect(registerExecApprovalRequestForHostOrThrowMock).toHaveBeenCalledTimes(1);
expect(requiresExecApprovalMock).toHaveBeenLastCalledWith(
expect.objectContaining({
allowlistSatisfied: false,
durableApprovalSatisfied: false,
}),
);
});
it("uses forwarded node env overrides for node approval prechecks", async () => {
const allowlistEntry = { pattern: "/trusted/bin/tool" };
mockGatewayInvokesWithNodeApprovals({ version: 1, agents: {} });
usePolicyApprovalRequirementMock();
resolveExecApprovalsFromFileMock.mockReturnValue({
agent: { security: "allowlist", ask: "on-miss" },
allowlist: [allowlistEntry],
file: { version: 1, agents: {} },
});
evaluateShellAllowlistMock.mockImplementation((raw: unknown) => {
const params = raw as ShellAllowlistMockParams;
const hasNodeAllowlist = (params.allowlist ?? []).length > 0;
return buildAllowlistEvalResult({
allowlistSatisfied:
hasNodeAllowlist &&
params.env != null &&
params.env.FOO === "bar" &&
params.env.PATH === "",
segmentAllowlistEntry: allowlistEntry,
});
});
resolveExecHostApprovalContextMock.mockReturnValue({
approvals: { allowlist: [], file: { version: 1, agents: {} } },
hostSecurity: "allowlist",
hostAsk: "on-miss",
askFallback: "deny",
});
const result = await executeNodeHostCommand({
command: "tool --version",
workdir: "/tmp/work",
env: { PATH: "/gateway/bin:/usr/bin" },
requestedEnv: { FOO: "bar" },
security: "allowlist",
ask: "on-miss",
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "requested-agent",
sessionKey: "requested-session",
});
expect(result.details?.status).toBe("completed");
expect(registerExecApprovalRequestForHostOrThrowMock).not.toHaveBeenCalled();
expect(requiresExecApprovalMock).toHaveBeenLastCalledWith(
expect.objectContaining({
analysisOk: true,
allowlistSatisfied: true,
durableApprovalSatisfied: false,
}),
);
expect(requireGatewayCommand("system.run.prepare").params?.params?.env).toEqual({
FOO: "bar",
});
expect(requireRunParams(requireGatewayCommand("system.run")).env).toEqual({ FOO: "bar" });
const evalEnvs = evaluateShellAllowlistMock.mock.calls.map(
([raw]) => (raw as ShellAllowlistMockParams).env,
);
expect(evalEnvs.length).toBeGreaterThanOrEqual(2);
expect(evalEnvs.every((env) => env != null && env.FOO === "bar" && env.PATH === "")).toBe(true);
});
it("skips approval prepare in full/off mode", async () => {
await executeNodeHostCommand({
command: "bun ./script.ts",
workdir: "/tmp/work",
env: {},
security: "full",
ask: "off",
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "requested-agent",
sessionKey: "requested-session",
notifyOnExit: false,
});
expect(callGatewayToolMock).toHaveBeenCalledTimes(1);
const call = requireGatewayCall(0);
expect(call.options.timeoutMs).toBe(35_000);
const runParams = requireRunParams(call);
expect(runParams.command).toEqual(["/bin/sh", "-lc", "bun ./script.ts"]);
expect(runParams.rawCommand).toBe("bun ./script.ts");
expect(typeof runParams.runId).toBe("string");
expect(runParams.suppressNotifyOnExit).toBe(true);
expect(runParams.timeoutMs).toBe(30_000);
expect(Object.hasOwn(runParams, "systemRunPlan")).toBe(false);
});
it("rejects disconnected node targets before invoking system.run", async () => {
listNodesMock.mockResolvedValueOnce([
{
nodeId: "node-1",
commands: ["system.run", "system.run.prepare"],
connected: false,
platform: process.platform,
},
]);
await expect(
executeNodeHostCommand({
command: "git log --oneline -5",
workdir: "/tmp/work",
env: {},
security: "allowlist",
ask: "off",
requestedNode: "node-1",
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "requested-agent",
sessionKey: "requested-session",
}),
).rejects.toThrow(
"exec host=node requires a connected node (node-1 is currently disconnected)",
);
expect(callGatewayToolMock).not.toHaveBeenCalled();
});
it("returns a non-empty placeholder for silent node exec results", async () => {
callGatewayToolMock.mockImplementationOnce(
async (method: string, _options: unknown, params: MockNodeInvokeParams | undefined) => {
if (method === "node.invoke" && params?.command === "system.run") {
return {
payload: {
success: true,
stdout: "",
stderr: "",
exitCode: 0,
timedOut: false,
},
};
}
throw new Error(`unexpected node invoke command: ${String(params?.command)}`);
},
);
const result = await executeNodeHostCommand({
command: "mkdir /tmp/quiet",
workdir: "/tmp/work",
env: {},
security: "full",
ask: "off",
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "requested-agent",
sessionKey: "requested-session",
});
expect(result.content).toEqual([{ type: "text", text: "(no output)" }]);
const details = result.details;
expect(details?.status).toBe("completed");
if (details?.status !== "completed") {
throw new Error(`expected completed details, got ${details?.status ?? "missing"}`);
}
expect(details.exitCode).toBe(0);
expect(details.aggregated).toBe("");
expect(details.cwd).toBe("/tmp/work");
});
it("forwards explicit timeouts to node system.run", async () => {
await executeNodeHostCommand({
command: "bun ./script.ts",
workdir: "/tmp/work",
env: {},
security: "full",
ask: "off",
timeoutSec: 12,
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "requested-agent",
sessionKey: "requested-session",
});
expectSystemRunInvoke({ invokeTimeoutMs: 17_000, runTimeoutMs: 12_000 });
});
it("normalizes unsafe explicit timeouts before invoking node system.run", async () => {
await executeNodeHostCommand({
command: "bun ./script.ts",
workdir: "/tmp/work",
env: {},
security: "full",
ask: "off",
timeoutSec: Number.POSITIVE_INFINITY,
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "requested-agent",
sessionKey: "requested-session",
});
expectSystemRunInvoke({ invokeTimeoutMs: 35_000, runTimeoutMs: 30_000 });
callGatewayToolMock.mockClear();
await executeNodeHostCommand({
command: "bun ./script.ts",
workdir: "/tmp/work",
env: {},
security: "full",
ask: "off",
timeoutSec: 3_000_000,
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "requested-agent",
sessionKey: "requested-session",
});
expectSystemRunInvoke({
invokeTimeoutMs: MAX_SAFE_TIMEOUT_DELAY_MS,
runTimeoutMs: MAX_SAFE_TIMEOUT_DELAY_MS,
});
callGatewayToolMock.mockClear();
await executeNodeHostCommand({
command: "bun ./script.ts",
workdir: "/tmp/work",
env: {},
security: "full",
ask: "off",
timeoutSec: Number.MAX_VALUE,
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "requested-agent",
sessionKey: "requested-session",
});
expectSystemRunInvoke({
invokeTimeoutMs: MAX_SAFE_TIMEOUT_DELAY_MS,
runTimeoutMs: MAX_SAFE_TIMEOUT_DELAY_MS,
});
});
it("forwards timeout zero to node system.run and keeps the invoke wait bounded", async () => {
await executeNodeHostCommand({
command: "bun ./script.ts",
workdir: "/tmp/work",
env: {},
security: "full",
ask: "off",
timeoutSec: 0,
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "requested-agent",
sessionKey: "requested-session",
});
expectSystemRunInvoke({ invokeTimeoutMs: 35_000, runTimeoutMs: 0 });
});
it("allows exec when requestedNode is display name matching boundNode's device", async () => {
listNodesMock.mockResolvedValue([
{
nodeId: "f2396b588d391d30a79d300e196a17cf197f34969b5e2485d2734c953567f44e",
displayName: "home-wsl-debian",
commands: ["system.run"],
platform: process.platform,
},
]);
const result = await executeNodeHostCommand({
command: "echo hello",
workdir: "/tmp/work",
env: {},
security: "full",
ask: "off",
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "test-agent",
sessionKey: "test-session",
boundNode: "f2396b588d391d30a79d300e196a17cf197f34969b5e2485d2734c953567f44e",
requestedNode: "home-wsl-debian",
});
expect(result.details?.status).toBeDefined();
});
it("allows exec when requestedNode is partial ID matching boundNode's device", async () => {
listNodesMock.mockResolvedValue([
{
nodeId: "f2396b588d391d30a79d300e196a17cf197f34969b5e2485d2734c953567f44e",
displayName: "home-wsl-debian",
commands: ["system.run"],
platform: process.platform,
},
]);
const result = await executeNodeHostCommand({
command: "echo hello",
workdir: "/tmp/work",
env: {},
security: "full",
ask: "off",
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "test-agent",
sessionKey: "test-session",
boundNode: "f2396b588d391d30a79d300e196a17cf197f34969b5e2485d2734c953567f44e",
requestedNode: "f2396b588d391d",
});
expect(result.details?.status).toBeDefined();
});
it("rejects exec when requestedNode resolves to a different node than boundNode", async () => {
listNodesMock.mockResolvedValue([
{
nodeId: "f2396b588d391d30a79d300e196a17cf197f34969b5e2485d2734c953567f44e",
displayName: "home-wsl-debian",
commands: ["system.run"],
platform: process.platform,
},
{
nodeId: "aaaa1111bbbb2222cccc3333dddd4444eeee5555ffff6666aaa7777bbb88889999",
displayName: "other-node",
commands: ["system.run"],
platform: process.platform,
},
]);
await expect(
executeNodeHostCommand({
command: "echo hello",
workdir: "/tmp/work",
env: {},
security: "full",
ask: "off",
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "test-agent",
sessionKey: "test-session",
boundNode: "f2396b588d391d30a79d300e196a17cf197f34969b5e2485d2734c953567f44e",
requestedNode: "other-node",
}),
).rejects.toThrow("exec node not allowed (bound to f2396b588d391d30");
});
it("preserves original error when requestedNode matches no known node", async () => {
listNodesMock.mockResolvedValue([
{
nodeId: "f2396b588d391d30a79d300e196a17cf197f34969b5e2485d2734c953567f44e",
displayName: "home-wsl-debian",
commands: ["system.run"],
platform: process.platform,
},
]);
await expect(
executeNodeHostCommand({
command: "echo hello",
workdir: "/tmp/work",
env: {},
security: "full",
ask: "off",
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "test-agent",
sessionKey: "test-session",
requestedNode: "nonexistent-node",
}),
).rejects.toThrow(
"requested node not found: nonexistent-node (unknown node: nonexistent-node)",
);
});
it("allows exec when boundNode is a display name matching the same device as requestedNode", async () => {
listNodesMock.mockResolvedValue([
{
nodeId: "f2396b588d391d30a79d300e196a17cf197f34969b5e2485d2734c953567f44e",
displayName: "home-wsl-debian",
commands: ["system.run"],
platform: process.platform,
},
]);
const result = await executeNodeHostCommand({
command: "echo hello",
workdir: "/tmp/work",
env: {},
security: "full",
ask: "off",
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "test-agent",
sessionKey: "test-session",
boundNode: "home-wsl-debian",
requestedNode: "home-wsl-debian",
});
expect(result.details?.status).toBeDefined();
});
it("auto-reviews strict inline-eval commands with full/off host policy when node policy is available", async () => {
const inlinePlan = {
argv: ["python3", "-c", "print(1)"],
cwd: "/tmp/work",
commandText: "python3 -c 'print(1)'",
commandPreview: null,
agentId: "requested-agent",
sessionKey: "requested-session",
};
parsePreparedSystemRunPayloadMock.mockReturnValue({
plan: inlinePlan,
execPolicy: { security: "full", ask: "off" },
});
const autoReviewer = vi.fn<ExecAutoReviewer>(async () => ({
decision: "allow-once",
risk: "low",
rationale: "safe inline eval",
}));
detectInterpreterInlineEvalArgvMock.mockReturnValue(INLINE_EVAL_HIT);
evaluateShellAllowlistMock.mockReturnValue({
allowlistMatches: [],
analysisOk: true,
allowlistSatisfied: false,
segments: [
{
resolution: null,
argv: ["python3", "-c", "print(1)"],
raw: "python3 -c 'print(1)'",
},
],
segmentAllowlistEntries: [],
});
resolveExecHostApprovalContextMock.mockReturnValue({
approvals: { allowlist: [], file: { version: 1, agents: {} } },
hostSecurity: "full",
hostAsk: "off",
askFallback: "deny",
});
const result = await executeNodeHostCommand({
command: "python3 -c 'print(1)'",
workdir: "/tmp/work",
env: {},
security: "full",
ask: "off",
autoReview: true,
autoReviewer,
strictInlineEval: true,
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "requested-agent",
sessionKey: "requested-session",
});
expect(result.details?.status).toBe("completed");
expect(autoReviewer).toHaveBeenCalledWith(
expect.objectContaining({
command: "python3 -c 'print(1)'",
argv: ["python3", "-c", "print(1)"],
host: "node",
reason: "strict-inline-eval",
}),
);
expect(callGatewayToolMock).toHaveBeenCalledWith(
"exec.approvals.node.get",
{ timeoutMs: 10_000 },
{ nodeId: "node-1" },
);
});
it("denies timed-out inline-eval requests instead of invoking the node", async () => {
detectInterpreterInlineEvalArgvMock.mockReturnValue(INLINE_EVAL_HIT);
resolveApprovalDecisionOrUndefinedMock.mockResolvedValue(null);
createExecApprovalDecisionStateMock.mockReturnValue({
baseDecision: { timedOut: true },
approvedByAsk: true,
deniedReason: null,
});
enforceStrictInlineEvalApprovalBoundaryMock.mockReturnValue({
approvedByAsk: false,
deniedReason: "approval-timeout",
});
resolveExecHostApprovalContextMock.mockReturnValue({
approvals: { allowlist: [], file: { version: 1, agents: {} } },
hostSecurity: "full",
hostAsk: "off",
askFallback: "full",
});
const result = await executeNodeHostCommand({
command: "python3 -c 'print(1)'",
workdir: "/tmp/work",
env: {},
security: "full",
ask: "off",
strictInlineEval: true,
defaultTimeoutSec: 30,
approvalRunningNoticeMs: 0,
warnings: [],
agentId: "requested-agent",
sessionKey: "requested-session",
});
expect(result.details?.status).toBe("approval-pending");
await vi.waitFor(() => {
expect(sendExecApprovalFollowupResultMock).toHaveBeenCalledWith(
expect.objectContaining({
approvalId: "approval-1",
sessionKey: "requested-session",
}),
"Exec denied (node=node-1 id=approval-1, approval-timeout): python3 -c 'print(1)'",
);
});
expect(callGatewayToolMock).toHaveBeenCalledTimes(1);
});
});