mirror of
https://github.com/openclaw/openclaw.git
synced 2026-06-29 21:23:36 +00:00
Replace the exec approval parser/planner path with Tree-sitter-backed authorization planning, carrying planner decisions through node and gateway execution.
This keeps unpersistable shell shapes one-shot, adds typed `unavailableDecisions` for approval prompts, and refreshes coverage for allowlist matching, command rendering, durable allow-always persistence, and host approval paths.
Verification:
- GitHub PR checks for ce2381192d: CLEAN, 142 success, 32 skipped, 0 failed, 0 pending.
- /Users/jmerhi/.nvm/versions/node/v24.12.0/bin/node scripts/plugin-sdk-surface-report.mjs --check
- /Users/jmerhi/.nvm/versions/node/v24.12.0/bin/node scripts/run-vitest.mjs test/scripts/plugin-sdk-surface-report.test.ts --reporter=verbose
- Focused exec approval suite: 13 files, 467 tests.
3178 lines
107 KiB
TypeScript
3178 lines
107 KiB
TypeScript
/**
|
|
* Node-host exec orchestration tests.
|
|
* Covers node target resolution, remote prepare/invoke payloads, approvals,
|
|
* auto-review, and follow-up execution paths.
|
|
*/
|
|
import crypto from "node:crypto";
|
|
import { beforeAll, beforeEach, describe, expect, it, vi } from "vitest";
|
|
import type { ExecAllowlistEntry } from "../infra/exec-approvals.types.js";
|
|
import { MAX_SAFE_TIMEOUT_DELAY_MS } from "../utils/timer-delay.js";
|
|
|
|
type StrictInlineEvalBoundary =
|
|
typeof import("./bash-tools.exec-host-shared.js").enforceStrictInlineEvalApprovalBoundary;
|
|
type ExecAutoReviewer = typeof import("../infra/exec-auto-review.js").defaultExecAutoReviewer;
|
|
type ExecAsk = import("../infra/exec-approvals.js").ExecAsk;
|
|
type ExecSecurity = import("../infra/exec-approvals.js").ExecSecurity;
|
|
type MockAllowAlwaysPersistenceInput = Parameters<
|
|
typeof import("../infra/exec-approvals.js").resolveAllowAlwaysPersistenceDecision
|
|
>[0];
|
|
type MockAllowAlwaysPersistenceDecision =
|
|
import("../infra/exec-approvals.js").AllowAlwaysPersistenceDecision;
|
|
type MockExecApprovalDecision = import("../infra/exec-approvals.js").ExecApprovalDecision;
|
|
type MockExecApprovalUnavailableDecision =
|
|
import("../infra/exec-approvals.js").ExecApprovalUnavailableDecision;
|
|
type MockAllowlistSegment = {
|
|
raw?: string;
|
|
resolution: null;
|
|
argv: string[];
|
|
};
|
|
type MockAllowlistResult = {
|
|
allowlistMatches: unknown[];
|
|
analysisOk: boolean;
|
|
allowlistSatisfied: boolean;
|
|
segments: MockAllowlistSegment[];
|
|
segmentAllowlistEntries: unknown[];
|
|
segmentSatisfiedBy?: unknown[];
|
|
};
|
|
type MockExecAllowlistEntry = {
|
|
pattern: string;
|
|
argPattern?: string;
|
|
source?: "allow-always";
|
|
commandText?: string;
|
|
};
|
|
type MockExecApprovalsResolved = {
|
|
allowlist: MockExecAllowlistEntry[];
|
|
file: { version: 1; agents: Record<string, unknown> };
|
|
agent: {
|
|
security: ExecSecurity;
|
|
ask: ExecAsk;
|
|
askFallback?: "deny";
|
|
autoAllowSkills?: false;
|
|
};
|
|
};
|
|
type ShellAllowlistMockParams = {
|
|
command?: string;
|
|
allowlist?: unknown[];
|
|
env?: NodeJS.ProcessEnv;
|
|
};
|
|
type RequiresExecApprovalMockParams = {
|
|
ask?: string;
|
|
security?: string;
|
|
analysisOk?: boolean;
|
|
allowlistSatisfied?: boolean;
|
|
durableApprovalSatisfied?: boolean;
|
|
};
|
|
|
|
const INLINE_EVAL_HIT = {
|
|
executable: "python3",
|
|
normalizedExecutable: "python3",
|
|
flag: "-c",
|
|
argv: ["python3", "-c", "print(1)"],
|
|
};
|
|
|
|
const preparedPlan = vi.hoisted(() => ({
|
|
argv: ["bun", "./script.ts"],
|
|
cwd: "/tmp/work",
|
|
commandText: "bun ./script.ts",
|
|
commandPreview: "bun ./script.ts",
|
|
agentId: "prepared-agent",
|
|
sessionKey: "prepared-session",
|
|
mutableFileOperand: {
|
|
argvIndex: 1,
|
|
path: "/tmp/work/script.ts",
|
|
sha256: "abc123",
|
|
},
|
|
}));
|
|
const nodeCommandMarker = vi.hoisted(() => "=node-command:test");
|
|
const exactCommandMarker = (commandText: string): string =>
|
|
`=command:${crypto.createHash("sha256").update(commandText).digest("hex").slice(0, 16)}`;
|
|
|
|
const callGatewayToolMock = vi.hoisted(() => vi.fn());
|
|
const listNodesMock = vi.hoisted(() => vi.fn());
|
|
const parsePreparedSystemRunPayloadMock = vi.hoisted(() => vi.fn());
|
|
const commandRequiresSecurityAuditSuppressionApprovalMock = vi.hoisted(() => vi.fn(() => false));
|
|
const evaluateShellAllowlistMock = vi.hoisted(() =>
|
|
vi.fn(
|
|
(_raw?: ShellAllowlistMockParams): MockAllowlistResult => ({
|
|
allowlistMatches: [],
|
|
analysisOk: true,
|
|
allowlistSatisfied: false,
|
|
segments: [{ resolution: null, argv: ["bun", "./script.ts"] }],
|
|
segmentAllowlistEntries: [],
|
|
segmentSatisfiedBy: [],
|
|
}),
|
|
),
|
|
);
|
|
const hasNodeCommandAllowAlwaysMarkerMock = vi.hoisted(() =>
|
|
vi.fn((raw: unknown): boolean =>
|
|
((raw as { allowlist?: Array<{ pattern?: string }> }).allowlist ?? []).some(
|
|
(entry) => entry.pattern === "=node-command:test",
|
|
),
|
|
),
|
|
);
|
|
const resolveAllowAlwaysPatternCoverageMock = vi.hoisted(() =>
|
|
vi.fn((_raw: unknown): unknown => ({
|
|
complete: true,
|
|
patterns: [{ pattern: "/trusted/bin/tool" }],
|
|
})),
|
|
);
|
|
const resolveExecApprovalsFromFileMock = vi.hoisted(() =>
|
|
vi.fn(
|
|
(): MockExecApprovalsResolved => ({
|
|
allowlist: [],
|
|
file: { version: 1, agents: {} },
|
|
agent: {
|
|
security: "full",
|
|
ask: "off",
|
|
askFallback: "deny",
|
|
autoAllowSkills: false,
|
|
},
|
|
}),
|
|
),
|
|
);
|
|
const requiresExecApprovalMock = vi.hoisted(() =>
|
|
vi.fn((_raw?: RequiresExecApprovalMockParams) => true),
|
|
);
|
|
const hasDurableExecApprovalMock = vi.hoisted(() => vi.fn(() => false));
|
|
const resolveAllowAlwaysPersistenceDecisionMock = vi.hoisted(() =>
|
|
vi.fn(
|
|
(_raw: MockAllowAlwaysPersistenceInput): MockAllowAlwaysPersistenceDecision => ({
|
|
kind: "patterns",
|
|
patterns: [{ pattern: "/trusted/bin/tool" }],
|
|
}),
|
|
),
|
|
);
|
|
const resolveExecApprovalAllowedDecisionsMock = vi.hoisted(() =>
|
|
vi.fn(
|
|
(params?: {
|
|
ask?: string | null;
|
|
allowAlwaysPersistence?: { kind: string } | null;
|
|
}): readonly MockExecApprovalDecision[] =>
|
|
params?.ask === "always" || params?.allowAlwaysPersistence?.kind === "one-shot"
|
|
? ["allow-once", "deny"]
|
|
: ["allow-once", "allow-always", "deny"],
|
|
),
|
|
);
|
|
const resolveExecApprovalUnavailableDecisionsMock = vi.hoisted(() =>
|
|
vi.fn(
|
|
(params?: {
|
|
ask?: string | null;
|
|
allowAlwaysPersistence?: { kind: string } | null;
|
|
}): readonly MockExecApprovalUnavailableDecision[] =>
|
|
params?.ask === "always" || params?.allowAlwaysPersistence?.kind === "one-shot"
|
|
? ["allow-always"]
|
|
: [],
|
|
),
|
|
);
|
|
const resolveExecHostApprovalContextMock = vi.hoisted(() =>
|
|
vi.fn(() => ({
|
|
approvals: { allowlist: [] as ExecAllowlistEntry[], file: { version: 1, agents: {} } },
|
|
hostSecurity: "full",
|
|
hostAsk: "off",
|
|
askFallback: "deny",
|
|
})),
|
|
);
|
|
const createAndRegisterDefaultExecApprovalRequestMock = vi.hoisted(() => vi.fn());
|
|
const resolveApprovalDecisionOrUndefinedMock = vi.hoisted(() =>
|
|
vi.fn(async (): Promise<string | null | undefined> => "allow-once"),
|
|
);
|
|
const createExecApprovalDecisionStateMock = vi.hoisted(() =>
|
|
vi.fn(
|
|
(): {
|
|
baseDecision: { timedOut: boolean };
|
|
approvedByAsk: boolean;
|
|
deniedReason: string | null;
|
|
} => ({
|
|
baseDecision: { timedOut: false },
|
|
approvedByAsk: false,
|
|
deniedReason: null,
|
|
}),
|
|
),
|
|
);
|
|
const buildExecApprovalPendingToolResultMock = vi.hoisted(() => vi.fn());
|
|
const sendExecApprovalFollowupResultMock = vi.hoisted(() => vi.fn(async () => undefined));
|
|
const enforceStrictInlineEvalApprovalBoundaryMock = vi.hoisted(() =>
|
|
vi.fn<StrictInlineEvalBoundary>((value) => ({
|
|
approvedByAsk: value.approvedByAsk,
|
|
deniedReason: value.deniedReason,
|
|
})),
|
|
);
|
|
const registerExecApprovalRequestForHostOrThrowMock = vi.hoisted(() =>
|
|
vi.fn(async () => undefined),
|
|
);
|
|
const detectInterpreterInlineEvalArgvMock = vi.hoisted(() =>
|
|
vi.fn(
|
|
(): {
|
|
executable: string;
|
|
normalizedExecutable: string;
|
|
flag: string;
|
|
argv: string[];
|
|
} | null => null,
|
|
),
|
|
);
|
|
|
|
vi.mock("../infra/exec-approvals.js", () => ({
|
|
evaluateShellAllowlist: evaluateShellAllowlistMock,
|
|
evaluateShellAllowlistWithAuthorization: evaluateShellAllowlistMock,
|
|
commandRequiresSecurityAuditSuppressionApproval:
|
|
commandRequiresSecurityAuditSuppressionApprovalMock,
|
|
hasDurableExecApproval: hasDurableExecApprovalMock,
|
|
hasNodeCommandAllowAlwaysMarker: hasNodeCommandAllowAlwaysMarkerMock,
|
|
requiresExecApproval: requiresExecApprovalMock,
|
|
resolveAllowAlwaysPersistenceDecision: resolveAllowAlwaysPersistenceDecisionMock,
|
|
resolveAllowAlwaysPatternCoverage: resolveAllowAlwaysPatternCoverageMock,
|
|
resolveExecApprovalAllowedDecisions: resolveExecApprovalAllowedDecisionsMock,
|
|
resolveExecApprovalUnavailableDecisions: resolveExecApprovalUnavailableDecisionsMock,
|
|
resolveExecApprovalsFromFile: resolveExecApprovalsFromFileMock,
|
|
maxAsk: (a: ExecAsk, b: ExecAsk): ExecAsk => {
|
|
const order: Record<ExecAsk, number> = { off: 0, "on-miss": 1, always: 2 };
|
|
return order[a] >= order[b] ? a : b;
|
|
},
|
|
}));
|
|
|
|
vi.mock("../infra/command-analysis/inline-eval.js", () => ({
|
|
describeInterpreterInlineEval: vi.fn(() => "inline-eval"),
|
|
detectInterpreterInlineEvalArgv: detectInterpreterInlineEvalArgvMock,
|
|
}));
|
|
|
|
vi.mock("../infra/node-shell.js", () => ({
|
|
buildNodeShellCommand: vi.fn(() => ["/bin/sh", "-lc", "bun ./script.ts"]),
|
|
}));
|
|
|
|
vi.mock("../infra/system-run-approval-context.js", () => ({
|
|
parsePreparedSystemRunPayload: parsePreparedSystemRunPayloadMock,
|
|
}));
|
|
|
|
vi.mock("./bash-tools.exec-approval-request.js", () => ({
|
|
buildExecApprovalRequesterContext: vi.fn(() => ({})),
|
|
buildExecApprovalTurnSourceContext: vi.fn(() => ({})),
|
|
registerExecApprovalRequestForHostOrThrow: registerExecApprovalRequestForHostOrThrowMock,
|
|
}));
|
|
|
|
vi.mock("./bash-tools.exec-host-shared.js", () => ({
|
|
resolveExecHostApprovalContext: resolveExecHostApprovalContextMock,
|
|
buildDefaultExecApprovalRequestArgs: vi.fn(() => ({})),
|
|
createAndRegisterDefaultExecApprovalRequest: createAndRegisterDefaultExecApprovalRequestMock,
|
|
shouldResolveExecApprovalUnavailableInline: vi.fn(() => false),
|
|
buildExecApprovalFollowupTarget: vi.fn((value) => value),
|
|
resolveApprovalDecisionOrUndefined: resolveApprovalDecisionOrUndefinedMock,
|
|
createExecApprovalDecisionState: createExecApprovalDecisionStateMock,
|
|
enforceStrictInlineEvalApprovalBoundary: enforceStrictInlineEvalApprovalBoundaryMock,
|
|
sendExecApprovalFollowupResult: sendExecApprovalFollowupResultMock,
|
|
buildExecApprovalPendingToolResult: buildExecApprovalPendingToolResultMock,
|
|
buildHeadlessExecApprovalDeniedMessage: vi.fn(() => "denied"),
|
|
}));
|
|
|
|
vi.mock("./bash-tools.exec-runtime.js", () => ({
|
|
DEFAULT_NOTIFY_TAIL_CHARS: 1000,
|
|
createApprovalSlug: vi.fn(() => "slug"),
|
|
normalizeNotifyOutput: vi.fn((value: string) => value),
|
|
}));
|
|
|
|
vi.mock("./tools/gateway.js", () => ({
|
|
callGatewayTool: callGatewayToolMock,
|
|
}));
|
|
|
|
const resolveNodeIdFromListMock = vi.hoisted(() =>
|
|
vi.fn((nodes: Array<{ nodeId: string; displayName?: string }>, query?: string) => {
|
|
if (!query) {
|
|
if (nodes.length === 1) {
|
|
return nodes[0].nodeId;
|
|
}
|
|
throw new Error("node required");
|
|
}
|
|
const byId = nodes.find((n) => n.nodeId === query);
|
|
if (byId) {
|
|
return byId.nodeId;
|
|
}
|
|
const byName = nodes.find((n) => n.displayName === query);
|
|
if (byName) {
|
|
return byName.nodeId;
|
|
}
|
|
if (query.length >= 6) {
|
|
const byPrefix = nodes.find((n) => n.nodeId.startsWith(query));
|
|
if (byPrefix) {
|
|
return byPrefix.nodeId;
|
|
}
|
|
}
|
|
throw new Error(`unknown node: ${query}`);
|
|
}),
|
|
);
|
|
|
|
vi.mock("./tools/nodes-utils.js", () => ({
|
|
listNodes: listNodesMock,
|
|
resolveNodeIdFromList: resolveNodeIdFromListMock,
|
|
}));
|
|
|
|
vi.mock("../logger.js", () => ({
|
|
logInfo: vi.fn(),
|
|
}));
|
|
|
|
let executeNodeHostCommand: typeof import("./bash-tools.exec-host-node.js").executeNodeHostCommand;
|
|
|
|
type MockNodeInvokeParams = {
|
|
command?: string;
|
|
params?: Record<string, unknown>;
|
|
};
|
|
|
|
type GatewayToolCall = {
|
|
method: string;
|
|
options: { timeoutMs?: number };
|
|
params?: MockNodeInvokeParams;
|
|
callOptions?: unknown;
|
|
};
|
|
|
|
function requireGatewayCall(index: number): GatewayToolCall {
|
|
const call = callGatewayToolMock.mock.calls[index];
|
|
if (!call) {
|
|
throw new Error(`expected gateway call at index ${index}`);
|
|
}
|
|
const [method, options, params, callOptions] = call as [
|
|
string,
|
|
{ timeoutMs?: number },
|
|
MockNodeInvokeParams | undefined,
|
|
unknown,
|
|
];
|
|
return { method, options, params, callOptions };
|
|
}
|
|
|
|
function requireGatewayCommand(command: string): GatewayToolCall {
|
|
const call = callGatewayToolMock.mock.calls.find(
|
|
([method, , params]) =>
|
|
method === "node.invoke" && (params as MockNodeInvokeParams | undefined)?.command === command,
|
|
);
|
|
if (!call) {
|
|
throw new Error(`expected gateway command ${command}`);
|
|
}
|
|
const [method, options, params, callOptions] = call as [
|
|
string,
|
|
{ timeoutMs?: number },
|
|
MockNodeInvokeParams | undefined,
|
|
unknown,
|
|
];
|
|
return { method, options, params, callOptions };
|
|
}
|
|
|
|
function requireRunParams(call: GatewayToolCall): Record<string, unknown> {
|
|
expect(call.method).toBe("node.invoke");
|
|
expect(call.params?.command).toBe("system.run");
|
|
const params = call.params?.params;
|
|
if (!params) {
|
|
throw new Error("expected system.run params");
|
|
}
|
|
return params;
|
|
}
|
|
|
|
function requireRegisteredApprovalRequest(): Record<string, unknown> {
|
|
const calls = registerExecApprovalRequestForHostOrThrowMock.mock.calls as unknown as [
|
|
Record<string, unknown>,
|
|
][];
|
|
const firstCall = calls[0];
|
|
if (!firstCall) {
|
|
throw new Error("expected approval request registration");
|
|
}
|
|
return firstCall[0];
|
|
}
|
|
|
|
function expectSystemRunInvoke(params: { invokeTimeoutMs: number; runTimeoutMs: number }) {
|
|
const call = requireGatewayCommand("system.run");
|
|
expect(call.options.timeoutMs).toBe(params.invokeTimeoutMs);
|
|
expect(requireRunParams(call).timeoutMs).toBe(params.runTimeoutMs);
|
|
}
|
|
|
|
function mockGatewayInvokesWithNodeApprovals(file: Record<string, unknown>) {
|
|
callGatewayToolMock.mockImplementation(
|
|
async (method: string, _options: unknown, params: MockNodeInvokeParams | undefined) => {
|
|
if (method === "exec.approvals.node.get") {
|
|
return { file };
|
|
}
|
|
if (method !== "node.invoke") {
|
|
throw new Error(`unexpected gateway method: ${method}`);
|
|
}
|
|
if (params?.command === "system.run.prepare") {
|
|
return { payload: { plan: preparedPlan } };
|
|
}
|
|
if (params?.command === "system.run") {
|
|
return {
|
|
payload: {
|
|
success: true,
|
|
stdout: "ok",
|
|
stderr: "",
|
|
exitCode: 0,
|
|
timedOut: false,
|
|
},
|
|
};
|
|
}
|
|
throw new Error(`unexpected node invoke command: ${String(params?.command)}`);
|
|
},
|
|
);
|
|
}
|
|
|
|
function usePolicyApprovalRequirementMock() {
|
|
requiresExecApprovalMock.mockImplementation((raw: unknown) => {
|
|
const params = raw as {
|
|
ask: string;
|
|
security: string;
|
|
analysisOk: boolean;
|
|
allowlistSatisfied: boolean;
|
|
durableApprovalSatisfied: boolean;
|
|
};
|
|
return (
|
|
params.ask === "always" ||
|
|
(params.ask === "on-miss" &&
|
|
params.security === "allowlist" &&
|
|
(!params.analysisOk || !params.allowlistSatisfied) &&
|
|
!params.durableApprovalSatisfied)
|
|
);
|
|
});
|
|
}
|
|
|
|
function buildAllowlistEvalResult(params?: {
|
|
allowlistSatisfied?: boolean;
|
|
segmentAllowlistEntry?: { pattern: string } | null;
|
|
}) {
|
|
return {
|
|
allowlistMatches:
|
|
params?.allowlistSatisfied && params.segmentAllowlistEntry
|
|
? [params.segmentAllowlistEntry]
|
|
: [],
|
|
analysisOk: true,
|
|
allowlistSatisfied: params?.allowlistSatisfied === true,
|
|
segments: [{ resolution: null, argv: ["tool", "--version"] }],
|
|
segmentAllowlistEntries:
|
|
params?.allowlistSatisfied && params.segmentAllowlistEntry
|
|
? [params.segmentAllowlistEntry]
|
|
: [null],
|
|
segmentSatisfiedBy: [params?.allowlistSatisfied ? "allowlist" : null],
|
|
};
|
|
}
|
|
|
|
describe("executeNodeHostCommand", () => {
|
|
beforeAll(async () => {
|
|
({ executeNodeHostCommand } = await import("./bash-tools.exec-host-node.js"));
|
|
});
|
|
|
|
beforeEach(() => {
|
|
callGatewayToolMock.mockReset();
|
|
callGatewayToolMock.mockImplementation(
|
|
async (method: string, _options: unknown, params: MockNodeInvokeParams | undefined) => {
|
|
if (method === "exec.approvals.node.get") {
|
|
return { file: { version: 1, agents: {} } };
|
|
}
|
|
if (method === "exec.approval.resolve") {
|
|
return { payload: {} };
|
|
}
|
|
if (method !== "node.invoke") {
|
|
throw new Error(`unexpected gateway method: ${method}`);
|
|
}
|
|
if (params?.command === "system.run.prepare") {
|
|
return { payload: { plan: preparedPlan } };
|
|
}
|
|
if (params?.command === "system.run") {
|
|
return {
|
|
payload: {
|
|
success: true,
|
|
stdout: "ok",
|
|
stderr: "",
|
|
exitCode: 0,
|
|
timedOut: false,
|
|
},
|
|
};
|
|
}
|
|
throw new Error(`unexpected node invoke command: ${String(params?.command)}`);
|
|
},
|
|
);
|
|
listNodesMock.mockReset();
|
|
listNodesMock.mockResolvedValue([
|
|
{
|
|
nodeId: "node-1",
|
|
commands: ["system.run", "system.run.prepare"],
|
|
platform: process.platform,
|
|
},
|
|
]);
|
|
parsePreparedSystemRunPayloadMock.mockReset();
|
|
parsePreparedSystemRunPayloadMock.mockReturnValue({
|
|
plan: preparedPlan,
|
|
execPolicy: { security: "full", ask: "off" },
|
|
});
|
|
commandRequiresSecurityAuditSuppressionApprovalMock.mockReset();
|
|
commandRequiresSecurityAuditSuppressionApprovalMock.mockReturnValue(false);
|
|
evaluateShellAllowlistMock.mockReset();
|
|
evaluateShellAllowlistMock.mockReturnValue({
|
|
allowlistMatches: [],
|
|
analysisOk: true,
|
|
allowlistSatisfied: false,
|
|
segments: [{ resolution: null, argv: ["bun", "./script.ts"] }],
|
|
segmentAllowlistEntries: [],
|
|
});
|
|
hasNodeCommandAllowAlwaysMarkerMock.mockClear();
|
|
resolveAllowAlwaysPatternCoverageMock.mockReset();
|
|
resolveAllowAlwaysPatternCoverageMock.mockReturnValue({
|
|
complete: true,
|
|
patterns: [{ pattern: "/trusted/bin/tool" }],
|
|
});
|
|
hasDurableExecApprovalMock.mockReset();
|
|
hasDurableExecApprovalMock.mockReturnValue(false);
|
|
resolveExecApprovalsFromFileMock.mockReset();
|
|
resolveExecApprovalsFromFileMock.mockReturnValue({
|
|
allowlist: [],
|
|
file: { version: 1, agents: {} },
|
|
agent: {
|
|
security: "full",
|
|
ask: "off",
|
|
askFallback: "deny",
|
|
autoAllowSkills: false,
|
|
},
|
|
});
|
|
requiresExecApprovalMock.mockReset();
|
|
requiresExecApprovalMock.mockReturnValue(true);
|
|
hasDurableExecApprovalMock.mockReset();
|
|
hasDurableExecApprovalMock.mockReturnValue(false);
|
|
resolveAllowAlwaysPersistenceDecisionMock.mockReset();
|
|
resolveAllowAlwaysPersistenceDecisionMock.mockReturnValue({
|
|
kind: "patterns",
|
|
patterns: [{ pattern: "/trusted/bin/tool" }],
|
|
});
|
|
resolveExecApprovalAllowedDecisionsMock.mockClear();
|
|
resolveExecApprovalUnavailableDecisionsMock.mockClear();
|
|
resolveExecHostApprovalContextMock.mockReset();
|
|
resolveExecHostApprovalContextMock.mockReturnValue({
|
|
approvals: { allowlist: [], file: { version: 1, agents: {} } },
|
|
hostSecurity: "full",
|
|
hostAsk: "off",
|
|
askFallback: "deny",
|
|
});
|
|
createAndRegisterDefaultExecApprovalRequestMock.mockReset();
|
|
createAndRegisterDefaultExecApprovalRequestMock.mockImplementation(async (args?: unknown) => {
|
|
const register =
|
|
args && typeof args === "object" && "register" in args
|
|
? (args as { register?: (approvalId: string) => Promise<void> }).register
|
|
: undefined;
|
|
await register?.("approval-1");
|
|
return {
|
|
approvalId: "approval-1",
|
|
approvalSlug: "slug-1",
|
|
warningText: "",
|
|
expiresAtMs: Date.now() + 60_000,
|
|
preResolvedDecision: null,
|
|
initiatingSurface: "origin",
|
|
sentApproverDms: false,
|
|
unavailableReason: null,
|
|
};
|
|
});
|
|
resolveApprovalDecisionOrUndefinedMock.mockReset();
|
|
resolveApprovalDecisionOrUndefinedMock.mockResolvedValue("allow-once");
|
|
createExecApprovalDecisionStateMock.mockReset();
|
|
createExecApprovalDecisionStateMock.mockReturnValue({
|
|
baseDecision: { timedOut: false },
|
|
approvedByAsk: false,
|
|
deniedReason: null,
|
|
});
|
|
buildExecApprovalPendingToolResultMock.mockReset();
|
|
buildExecApprovalPendingToolResultMock.mockReturnValue({
|
|
content: [],
|
|
details: { status: "approval-pending" },
|
|
});
|
|
sendExecApprovalFollowupResultMock.mockReset();
|
|
enforceStrictInlineEvalApprovalBoundaryMock.mockReset();
|
|
enforceStrictInlineEvalApprovalBoundaryMock.mockImplementation((value) => ({
|
|
approvedByAsk: value.approvedByAsk,
|
|
deniedReason: value.deniedReason,
|
|
}));
|
|
detectInterpreterInlineEvalArgvMock.mockReset();
|
|
detectInterpreterInlineEvalArgvMock.mockReturnValue(null);
|
|
registerExecApprovalRequestForHostOrThrowMock.mockReset();
|
|
});
|
|
|
|
it("forwards prepared systemRunPlan on async node invoke after approval", async () => {
|
|
resolveExecHostApprovalContextMock.mockReturnValue({
|
|
approvals: { allowlist: [], file: { version: 1, agents: {} } },
|
|
hostSecurity: "full",
|
|
hostAsk: "always",
|
|
askFallback: "deny",
|
|
});
|
|
|
|
const result = await executeNodeHostCommand({
|
|
command: "bun ./script.ts",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "full",
|
|
ask: "off",
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
turnSourceChannel: "telegram",
|
|
turnSourceTo: "telegram:12345",
|
|
turnSourceAccountId: "work",
|
|
turnSourceThreadId: "42",
|
|
});
|
|
|
|
expect(result.details?.status).toBe("approval-pending");
|
|
expect(requireRegisteredApprovalRequest().systemRunPlan).toEqual(preparedPlan);
|
|
|
|
await vi.waitFor(() => {
|
|
expect(callGatewayToolMock).toHaveBeenCalledTimes(3);
|
|
});
|
|
|
|
const call = requireGatewayCall(2);
|
|
expect(call.options.timeoutMs).toBe(35_000);
|
|
expect(call.callOptions).toEqual({ scopes: ["operator.write", "operator.approvals"] });
|
|
const runParams = requireRunParams(call);
|
|
expect(runParams.approved).toBe(true);
|
|
expect(runParams.approvalDecision).toBe("allow-once");
|
|
expect(runParams.systemRunPlan).toEqual(preparedPlan);
|
|
expect(runParams.timeoutMs).toBe(30_000);
|
|
expect(runParams.turnSourceChannel).toBe("telegram");
|
|
expect(runParams.turnSourceTo).toBe("telegram:12345");
|
|
expect(runParams.turnSourceAccountId).toBe("work");
|
|
expect(runParams.turnSourceThreadId).toBe("42");
|
|
});
|
|
|
|
it("does not build a human approval prompt for node auto-review allows", async () => {
|
|
const autoReviewer = vi.fn<ExecAutoReviewer>(async () => ({
|
|
decision: "allow-once",
|
|
risk: "low",
|
|
rationale: "safe read",
|
|
}));
|
|
resolveExecHostApprovalContextMock.mockReturnValue({
|
|
approvals: { allowlist: [], file: { version: 1, agents: {} } },
|
|
hostSecurity: "allowlist",
|
|
hostAsk: "on-miss",
|
|
askFallback: "deny",
|
|
});
|
|
requiresExecApprovalMock.mockImplementation(
|
|
(params?: { allowlistSatisfied?: boolean; durableApprovalSatisfied?: boolean }) =>
|
|
params?.allowlistSatisfied !== true && params?.durableApprovalSatisfied !== true,
|
|
);
|
|
|
|
const result = await executeNodeHostCommand({
|
|
command: "bun ./script.ts",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "allowlist",
|
|
ask: "on-miss",
|
|
autoReview: true,
|
|
autoReviewer,
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
});
|
|
|
|
expect(result.details?.status).toBe("completed");
|
|
expect(autoReviewer).toHaveBeenCalledWith(
|
|
expect.objectContaining({
|
|
command: "bun ./script.ts",
|
|
argv: ["bun", "./script.ts"],
|
|
host: "node",
|
|
reason: "allowlist-miss",
|
|
}),
|
|
);
|
|
expect(createAndRegisterDefaultExecApprovalRequestMock).not.toHaveBeenCalled();
|
|
expect(registerExecApprovalRequestForHostOrThrowMock).toHaveBeenCalledWith(
|
|
expect.objectContaining({
|
|
host: "node",
|
|
requireDeliveryRoute: false,
|
|
suppressDelivery: true,
|
|
}),
|
|
);
|
|
expect(callGatewayToolMock).toHaveBeenCalledWith(
|
|
"exec.approval.resolve",
|
|
{ timeoutMs: 15_000 },
|
|
{ id: expect.any(String), decision: "allow-once" },
|
|
{ scopes: ["operator.approvals"] },
|
|
);
|
|
});
|
|
|
|
it("reviews the prepared node plan before suppressing human approval", async () => {
|
|
const divergentPlan = {
|
|
argv: ["rm", "-rf", "/tmp/work"],
|
|
cwd: "/tmp/work",
|
|
commandText: "rm -rf /tmp/work",
|
|
commandPreview: "./scripts/check_mail.sh --limit 5",
|
|
agentId: "prepared-agent",
|
|
sessionKey: "prepared-session",
|
|
};
|
|
parsePreparedSystemRunPayloadMock.mockReturnValue({
|
|
plan: divergentPlan,
|
|
execPolicy: { security: "full", ask: "off" },
|
|
});
|
|
const nodeAllowlist = [{ pattern: "./scripts/check_mail.sh" }];
|
|
resolveExecApprovalsFromFileMock.mockReturnValue({
|
|
allowlist: nodeAllowlist,
|
|
file: { version: 1, agents: {} },
|
|
agent: {
|
|
security: "full",
|
|
ask: "off",
|
|
askFallback: "deny",
|
|
autoAllowSkills: false,
|
|
},
|
|
});
|
|
evaluateShellAllowlistMock.mockImplementation(
|
|
(params?: { command?: string; allowlist?: unknown[] }) => {
|
|
const command = params?.command ?? "";
|
|
const hasNodeAllowlist = Array.isArray(params?.allowlist) && params.allowlist.length > 0;
|
|
const previewMatch = command === "./scripts/check_mail.sh --limit 5";
|
|
return {
|
|
allowlistMatches: previewMatch && hasNodeAllowlist ? [{}] : [],
|
|
analysisOk: true,
|
|
allowlistSatisfied: previewMatch && hasNodeAllowlist,
|
|
segments: [
|
|
previewMatch
|
|
? {
|
|
resolution: null,
|
|
argv: ["./scripts/check_mail.sh", "--limit", "5"],
|
|
raw: "./scripts/check_mail.sh --limit 5",
|
|
}
|
|
: {
|
|
resolution: null,
|
|
argv: ["rm", "-rf", "/tmp/work"],
|
|
raw: "rm -rf /tmp/work",
|
|
},
|
|
],
|
|
segmentAllowlistEntries: previewMatch && hasNodeAllowlist ? [{}] : [],
|
|
};
|
|
},
|
|
);
|
|
const autoReviewer = vi.fn<ExecAutoReviewer>(async (input) =>
|
|
input.command.includes("rm -rf")
|
|
? {
|
|
decision: "ask",
|
|
risk: "high",
|
|
rationale: "destructive prepared plan",
|
|
}
|
|
: {
|
|
decision: "allow-once",
|
|
risk: "low",
|
|
rationale: "safe requested text",
|
|
},
|
|
);
|
|
resolveExecHostApprovalContextMock.mockReturnValue({
|
|
approvals: { allowlist: [], file: { version: 1, agents: {} } },
|
|
hostSecurity: "allowlist",
|
|
hostAsk: "on-miss",
|
|
askFallback: "deny",
|
|
});
|
|
requiresExecApprovalMock.mockImplementation(
|
|
(params?: { allowlistSatisfied?: boolean; durableApprovalSatisfied?: boolean }) =>
|
|
params?.allowlistSatisfied !== true && params?.durableApprovalSatisfied !== true,
|
|
);
|
|
|
|
const result = await executeNodeHostCommand({
|
|
command: "echo SAFE",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "allowlist",
|
|
ask: "on-miss",
|
|
autoReview: true,
|
|
autoReviewer,
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
});
|
|
|
|
expect(result.details?.status).toBe("approval-pending");
|
|
expect(autoReviewer).toHaveBeenCalledWith(
|
|
expect.objectContaining({
|
|
command: "rm -rf /tmp/work",
|
|
argv: ["rm", "-rf", "/tmp/work"],
|
|
agent: {
|
|
id: "prepared-agent",
|
|
sessionKey: "prepared-session",
|
|
},
|
|
}),
|
|
);
|
|
expect(createAndRegisterDefaultExecApprovalRequestMock).toHaveBeenCalled();
|
|
expect(callGatewayToolMock).not.toHaveBeenCalledWith(
|
|
"exec.approval.resolve",
|
|
expect.anything(),
|
|
expect.anything(),
|
|
expect.anything(),
|
|
);
|
|
});
|
|
|
|
it("honors node allowlist matches on prepared POSIX shell payloads", async () => {
|
|
const wrapperPlan = {
|
|
argv: ["/bin/sh", "-lc", "./scripts/check_mail.sh --limit 5"],
|
|
cwd: "/tmp/work",
|
|
commandText: `/bin/sh -lc "./scripts/check_mail.sh --limit 5"`,
|
|
commandPreview: "./scripts/check_mail.sh --limit 5",
|
|
agentId: "prepared-agent",
|
|
sessionKey: "prepared-session",
|
|
};
|
|
parsePreparedSystemRunPayloadMock.mockReturnValue({
|
|
plan: wrapperPlan,
|
|
execPolicy: { security: "full", ask: "off" },
|
|
});
|
|
const nodeAllowlist = [{ pattern: "./scripts/check_mail.sh" }];
|
|
resolveExecApprovalsFromFileMock.mockReturnValue({
|
|
allowlist: nodeAllowlist,
|
|
file: { version: 1, agents: {} },
|
|
agent: {
|
|
security: "full",
|
|
ask: "off",
|
|
askFallback: "deny",
|
|
autoAllowSkills: false,
|
|
},
|
|
});
|
|
evaluateShellAllowlistMock.mockImplementation(
|
|
(params?: { command?: string; allowlist?: unknown[] }) => {
|
|
const command = params?.command ?? "";
|
|
const hasNodeAllowlist = Array.isArray(params?.allowlist) && params.allowlist.length > 0;
|
|
const semanticMatch = command === "./scripts/check_mail.sh --limit 5";
|
|
return {
|
|
allowlistMatches: semanticMatch && hasNodeAllowlist ? [{}] : [],
|
|
analysisOk: true,
|
|
allowlistSatisfied: semanticMatch && hasNodeAllowlist,
|
|
segments: [
|
|
command.startsWith("/bin/sh")
|
|
? {
|
|
resolution: null,
|
|
argv: ["/bin/sh", "-lc", "./scripts/check_mail.sh --limit 5"],
|
|
raw: `/bin/sh -lc "./scripts/check_mail.sh --limit 5"`,
|
|
}
|
|
: {
|
|
resolution: null,
|
|
argv: ["./scripts/check_mail.sh", "--limit", "5"],
|
|
raw: "./scripts/check_mail.sh --limit 5",
|
|
},
|
|
],
|
|
segmentAllowlistEntries: semanticMatch && hasNodeAllowlist ? [{}] : [],
|
|
};
|
|
},
|
|
);
|
|
const autoReviewer = vi.fn<ExecAutoReviewer>(async () => ({
|
|
decision: "ask",
|
|
risk: "medium",
|
|
rationale: "should not be needed",
|
|
}));
|
|
resolveExecHostApprovalContextMock.mockReturnValue({
|
|
approvals: { allowlist: [], file: { version: 1, agents: {} } },
|
|
hostSecurity: "allowlist",
|
|
hostAsk: "on-miss",
|
|
askFallback: "deny",
|
|
});
|
|
requiresExecApprovalMock.mockImplementation(
|
|
(params?: { allowlistSatisfied?: boolean; durableApprovalSatisfied?: boolean }) =>
|
|
params?.allowlistSatisfied !== true && params?.durableApprovalSatisfied !== true,
|
|
);
|
|
|
|
const result = await executeNodeHostCommand({
|
|
command: "./scripts/check_mail.sh --limit 5",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "allowlist",
|
|
ask: "on-miss",
|
|
autoReview: true,
|
|
autoReviewer,
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
});
|
|
|
|
expect(result.details?.status).toBe("completed");
|
|
expect(autoReviewer).not.toHaveBeenCalled();
|
|
expect(createAndRegisterDefaultExecApprovalRequestMock).not.toHaveBeenCalled();
|
|
expect(resolveExecApprovalsFromFileMock).toHaveBeenCalledWith(
|
|
expect.objectContaining({ agentId: "prepared-agent" }),
|
|
);
|
|
expectSystemRunInvoke({ invokeTimeoutMs: 35_000, runTimeoutMs: 30_000 });
|
|
});
|
|
|
|
it("does not let transport wrapper allowlist matches approve shell payloads", async () => {
|
|
const wrapperPlan = {
|
|
argv: ["/bin/sh", "-lc", "./scripts/untrusted.sh"],
|
|
cwd: "/tmp/work",
|
|
commandText: `/bin/sh -lc "./scripts/untrusted.sh"`,
|
|
commandPreview: "./scripts/untrusted.sh",
|
|
agentId: "prepared-agent",
|
|
sessionKey: "prepared-session",
|
|
};
|
|
parsePreparedSystemRunPayloadMock.mockReturnValue({
|
|
plan: wrapperPlan,
|
|
execPolicy: { security: "full", ask: "off" },
|
|
});
|
|
const nodeAllowlist = [{ pattern: "/bin/sh" }];
|
|
resolveExecApprovalsFromFileMock.mockReturnValue({
|
|
allowlist: nodeAllowlist,
|
|
file: { version: 1, agents: {} },
|
|
agent: {
|
|
security: "full",
|
|
ask: "off",
|
|
askFallback: "deny",
|
|
autoAllowSkills: false,
|
|
},
|
|
});
|
|
evaluateShellAllowlistMock.mockImplementation(
|
|
(params?: { command?: string; allowlist?: unknown[] }) => {
|
|
const command = params?.command ?? "";
|
|
const hasNodeAllowlist = Array.isArray(params?.allowlist) && params.allowlist.length > 0;
|
|
const wrapperMatch = command.startsWith("/bin/sh") && hasNodeAllowlist;
|
|
return {
|
|
allowlistMatches: wrapperMatch ? [{}] : [],
|
|
analysisOk: true,
|
|
allowlistSatisfied: wrapperMatch,
|
|
segments: [
|
|
command.startsWith("/bin/sh")
|
|
? {
|
|
resolution: null,
|
|
argv: ["/bin/sh", "-lc", "./scripts/untrusted.sh"],
|
|
raw: `/bin/sh -lc "./scripts/untrusted.sh"`,
|
|
}
|
|
: {
|
|
resolution: null,
|
|
argv: ["./scripts/untrusted.sh"],
|
|
raw: "./scripts/untrusted.sh",
|
|
},
|
|
],
|
|
segmentAllowlistEntries: wrapperMatch ? [{}] : [],
|
|
};
|
|
},
|
|
);
|
|
requiresExecApprovalMock.mockImplementation(
|
|
(params?: { allowlistSatisfied?: boolean; durableApprovalSatisfied?: boolean }) =>
|
|
params?.allowlistSatisfied !== true && params?.durableApprovalSatisfied !== true,
|
|
);
|
|
hasDurableExecApprovalMock.mockImplementation(
|
|
(params?: { segmentAllowlistEntries?: unknown[] }) =>
|
|
Array.isArray(params?.segmentAllowlistEntries) && params.segmentAllowlistEntries.length > 0,
|
|
);
|
|
const autoReviewer = vi.fn<ExecAutoReviewer>(async () => ({
|
|
decision: "ask",
|
|
risk: "medium",
|
|
rationale: "inner payload is not allowlisted",
|
|
}));
|
|
resolveExecHostApprovalContextMock.mockReturnValue({
|
|
approvals: { allowlist: [], file: { version: 1, agents: {} } },
|
|
hostSecurity: "allowlist",
|
|
hostAsk: "on-miss",
|
|
askFallback: "deny",
|
|
});
|
|
|
|
const result = await executeNodeHostCommand({
|
|
command: "./scripts/untrusted.sh",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "allowlist",
|
|
ask: "on-miss",
|
|
autoReview: true,
|
|
autoReviewer,
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
});
|
|
|
|
expect(result.details?.status).toBe("approval-pending");
|
|
expect(autoReviewer).toHaveBeenCalledWith(
|
|
expect.objectContaining({
|
|
command: `/bin/sh -lc "./scripts/untrusted.sh"`,
|
|
argv: ["./scripts/untrusted.sh"],
|
|
}),
|
|
);
|
|
expect(createAndRegisterDefaultExecApprovalRequestMock).toHaveBeenCalled();
|
|
});
|
|
|
|
it("reuses exact durable approvals for prepared shell wrappers", async () => {
|
|
const wrapperPlan = {
|
|
argv: ["/bin/sh", "-lc", "cd ."],
|
|
cwd: "/tmp/work",
|
|
commandText: `/bin/sh -lc "cd ."`,
|
|
commandPreview: "cd .",
|
|
agentId: "prepared-agent",
|
|
sessionKey: "prepared-session",
|
|
};
|
|
parsePreparedSystemRunPayloadMock.mockReturnValue({
|
|
plan: wrapperPlan,
|
|
execPolicy: { security: "full", ask: "off" },
|
|
});
|
|
resolveExecApprovalsFromFileMock.mockReturnValue({
|
|
allowlist: [
|
|
{
|
|
pattern: exactCommandMarker(wrapperPlan.commandText),
|
|
source: "allow-always",
|
|
commandText: wrapperPlan.commandText,
|
|
},
|
|
],
|
|
file: { version: 1, agents: {} },
|
|
agent: {
|
|
security: "full",
|
|
ask: "off",
|
|
askFallback: "deny",
|
|
autoAllowSkills: false,
|
|
},
|
|
});
|
|
evaluateShellAllowlistMock.mockImplementation((params?: { command?: string }) => {
|
|
const command = params?.command ?? "";
|
|
return {
|
|
allowlistMatches: [],
|
|
analysisOk: true,
|
|
allowlistSatisfied: false,
|
|
segments: [
|
|
command.startsWith("/bin/sh")
|
|
? {
|
|
resolution: null,
|
|
argv: ["/bin/sh", "-lc", "cd ."],
|
|
raw: `/bin/sh -lc "cd ."`,
|
|
}
|
|
: {
|
|
resolution: null,
|
|
argv: ["cd", "."],
|
|
raw: "cd .",
|
|
},
|
|
],
|
|
segmentAllowlistEntries: [],
|
|
};
|
|
});
|
|
hasDurableExecApprovalMock.mockImplementation(
|
|
(params?: { commandText?: string | null }) => params?.commandText === wrapperPlan.commandText,
|
|
);
|
|
requiresExecApprovalMock.mockImplementation(
|
|
(params?: { allowlistSatisfied?: boolean; durableApprovalSatisfied?: boolean }) =>
|
|
params?.allowlistSatisfied !== true && params?.durableApprovalSatisfied !== true,
|
|
);
|
|
resolveExecHostApprovalContextMock.mockReturnValue({
|
|
approvals: { allowlist: [], file: { version: 1, agents: {} } },
|
|
hostSecurity: "allowlist",
|
|
hostAsk: "on-miss",
|
|
askFallback: "deny",
|
|
});
|
|
|
|
const result = await executeNodeHostCommand({
|
|
command: "cd .",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "allowlist",
|
|
ask: "on-miss",
|
|
autoReview: true,
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
});
|
|
|
|
expect(result.details?.status).toBe("completed");
|
|
expect(createAndRegisterDefaultExecApprovalRequestMock).not.toHaveBeenCalled();
|
|
expectSystemRunInvoke({ invokeTimeoutMs: 35_000, runTimeoutMs: 30_000 });
|
|
});
|
|
|
|
it("keeps non-transport login shells approval-gated", async () => {
|
|
const loginPlan = {
|
|
argv: ["bash", "-lc", "./scripts/check_mail.sh --limit 5"],
|
|
cwd: "/tmp/work",
|
|
commandText: `bash -lc "./scripts/check_mail.sh --limit 5"`,
|
|
commandPreview: "./scripts/check_mail.sh --limit 5",
|
|
agentId: "prepared-agent",
|
|
sessionKey: "prepared-session",
|
|
};
|
|
parsePreparedSystemRunPayloadMock.mockReturnValue({
|
|
plan: loginPlan,
|
|
execPolicy: { security: "full", ask: "off" },
|
|
});
|
|
const nodeAllowlist = [{ pattern: "./scripts/check_mail.sh" }];
|
|
resolveExecApprovalsFromFileMock.mockReturnValue({
|
|
allowlist: nodeAllowlist,
|
|
file: { version: 1, agents: {} },
|
|
agent: {
|
|
security: "full",
|
|
ask: "off",
|
|
askFallback: "deny",
|
|
autoAllowSkills: false,
|
|
},
|
|
});
|
|
evaluateShellAllowlistMock.mockImplementation(
|
|
(params?: { command?: string; allowlist?: unknown[] }) => {
|
|
const command = params?.command ?? "";
|
|
const hasNodeAllowlist = Array.isArray(params?.allowlist) && params.allowlist.length > 0;
|
|
const semanticMatch = command === "./scripts/check_mail.sh --limit 5";
|
|
return {
|
|
allowlistMatches: semanticMatch && hasNodeAllowlist ? [{}] : [],
|
|
analysisOk: true,
|
|
allowlistSatisfied: semanticMatch && hasNodeAllowlist,
|
|
segments: [
|
|
command.startsWith("bash")
|
|
? {
|
|
resolution: null,
|
|
argv: ["bash", "-lc", "./scripts/check_mail.sh --limit 5"],
|
|
raw: `bash -lc "./scripts/check_mail.sh --limit 5"`,
|
|
}
|
|
: {
|
|
resolution: null,
|
|
argv: ["./scripts/check_mail.sh", "--limit", "5"],
|
|
raw: "./scripts/check_mail.sh --limit 5",
|
|
},
|
|
],
|
|
segmentAllowlistEntries: semanticMatch && hasNodeAllowlist ? [{}] : [],
|
|
};
|
|
},
|
|
);
|
|
requiresExecApprovalMock.mockImplementation(
|
|
(params?: { allowlistSatisfied?: boolean; durableApprovalSatisfied?: boolean }) =>
|
|
params?.allowlistSatisfied !== true && params?.durableApprovalSatisfied !== true,
|
|
);
|
|
const autoReviewer = vi.fn<ExecAutoReviewer>(async () => ({
|
|
decision: "ask",
|
|
risk: "medium",
|
|
rationale: "login shell needs human approval",
|
|
}));
|
|
resolveExecHostApprovalContextMock.mockReturnValue({
|
|
approvals: { allowlist: [], file: { version: 1, agents: {} } },
|
|
hostSecurity: "allowlist",
|
|
hostAsk: "on-miss",
|
|
askFallback: "deny",
|
|
});
|
|
|
|
const result = await executeNodeHostCommand({
|
|
command: "./scripts/check_mail.sh --limit 5",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "allowlist",
|
|
ask: "on-miss",
|
|
autoReview: true,
|
|
autoReviewer,
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
});
|
|
|
|
expect(result.details?.status).toBe("approval-pending");
|
|
expect(autoReviewer).toHaveBeenCalledWith(
|
|
expect.objectContaining({
|
|
command: `bash -lc "./scripts/check_mail.sh --limit 5"`,
|
|
argv: ["bash", "-lc", "./scripts/check_mail.sh --limit 5"],
|
|
}),
|
|
);
|
|
expect(createAndRegisterDefaultExecApprovalRequestMock).toHaveBeenCalled();
|
|
});
|
|
|
|
it("requires human approval when prepared shell payload has multiple commands", async () => {
|
|
const chainPlan = {
|
|
argv: ["/bin/sh", "-lc", "openclaw status; id"],
|
|
cwd: "/tmp/work",
|
|
commandText: `/bin/sh -lc "openclaw status; id"`,
|
|
commandPreview: "openclaw status; id",
|
|
agentId: "prepared-agent",
|
|
sessionKey: "prepared-session",
|
|
};
|
|
parsePreparedSystemRunPayloadMock.mockReturnValue({
|
|
plan: chainPlan,
|
|
execPolicy: { security: "full", ask: "off" },
|
|
});
|
|
evaluateShellAllowlistMock.mockImplementation((params?: { command?: string }) => {
|
|
const command = params?.command ?? "";
|
|
return {
|
|
allowlistMatches: [],
|
|
analysisOk: true,
|
|
allowlistSatisfied: false,
|
|
segments: command.startsWith("/bin/sh")
|
|
? [
|
|
{
|
|
resolution: null,
|
|
argv: ["/bin/sh", "-lc", "openclaw status; id"],
|
|
raw: `/bin/sh -lc "openclaw status; id"`,
|
|
},
|
|
]
|
|
: [
|
|
{
|
|
resolution: null,
|
|
argv: ["openclaw", "status"],
|
|
raw: "openclaw status",
|
|
},
|
|
{
|
|
resolution: null,
|
|
argv: ["id"],
|
|
raw: "id",
|
|
},
|
|
],
|
|
segmentAllowlistEntries: [],
|
|
};
|
|
});
|
|
const autoReviewer = vi.fn<ExecAutoReviewer>(async () => ({
|
|
decision: "allow-once",
|
|
risk: "low",
|
|
rationale: "test reviewer would allow it",
|
|
}));
|
|
resolveExecHostApprovalContextMock.mockReturnValue({
|
|
approvals: { allowlist: [], file: { version: 1, agents: {} } },
|
|
hostSecurity: "allowlist",
|
|
hostAsk: "on-miss",
|
|
askFallback: "deny",
|
|
});
|
|
|
|
const result = await executeNodeHostCommand({
|
|
command: "openclaw status; id",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "allowlist",
|
|
ask: "on-miss",
|
|
autoReview: true,
|
|
autoReviewer,
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
});
|
|
|
|
expect(result.details?.status).toBe("approval-pending");
|
|
expect(autoReviewer).not.toHaveBeenCalled();
|
|
expect(createAndRegisterDefaultExecApprovalRequestMock).toHaveBeenCalled();
|
|
});
|
|
|
|
it("does not treat read-only suppression inspections as wrapper writes", async () => {
|
|
const wrapperPlan = {
|
|
argv: ["/bin/sh", "-lc", "openclaw config get security.audit.suppressions"],
|
|
cwd: "/tmp/work",
|
|
commandText: `/bin/sh -lc "openclaw config get security.audit.suppressions"`,
|
|
commandPreview: "openclaw config get security.audit.suppressions",
|
|
agentId: "prepared-agent",
|
|
sessionKey: "prepared-session",
|
|
};
|
|
parsePreparedSystemRunPayloadMock.mockReturnValue({
|
|
plan: wrapperPlan,
|
|
execPolicy: { security: "full", ask: "off" },
|
|
});
|
|
evaluateShellAllowlistMock.mockImplementation((params?: { command?: string }) => {
|
|
const command = params?.command ?? "";
|
|
return {
|
|
allowlistMatches: [],
|
|
analysisOk: true,
|
|
allowlistSatisfied: true,
|
|
segments: [
|
|
command.startsWith("/bin/sh")
|
|
? {
|
|
resolution: null,
|
|
argv: ["/bin/sh", "-lc", "openclaw config get security.audit.suppressions"],
|
|
raw: `/bin/sh -lc "openclaw config get security.audit.suppressions"`,
|
|
}
|
|
: {
|
|
resolution: null,
|
|
argv: ["openclaw", "config", "get", "security.audit.suppressions"],
|
|
raw: "openclaw config get security.audit.suppressions",
|
|
},
|
|
],
|
|
segmentAllowlistEntries: [],
|
|
};
|
|
});
|
|
commandRequiresSecurityAuditSuppressionApprovalMock.mockImplementation(
|
|
(params?: { command?: string }) => params?.command?.startsWith("/bin/sh") === true,
|
|
);
|
|
requiresExecApprovalMock.mockReturnValue(false);
|
|
resolveExecHostApprovalContextMock.mockReturnValue({
|
|
approvals: { allowlist: [], file: { version: 1, agents: {} } },
|
|
hostSecurity: "allowlist",
|
|
hostAsk: "on-miss",
|
|
askFallback: "deny",
|
|
});
|
|
|
|
const result = await executeNodeHostCommand({
|
|
command: "openclaw config get security.audit.suppressions",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "allowlist",
|
|
ask: "on-miss",
|
|
autoReview: true,
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
});
|
|
|
|
expect(result.details?.status).toBe("completed");
|
|
expect(createAndRegisterDefaultExecApprovalRequestMock).not.toHaveBeenCalled();
|
|
expectSystemRunInvoke({ invokeTimeoutMs: 35_000, runTimeoutMs: 30_000 });
|
|
});
|
|
|
|
it("requests human approval when node auto-review asks on an approval miss", async () => {
|
|
const autoReviewer = vi.fn<ExecAutoReviewer>(async () => ({
|
|
decision: "ask",
|
|
risk: "medium",
|
|
rationale: "needs a person",
|
|
}));
|
|
const warnings: string[] = [];
|
|
resolveExecHostApprovalContextMock.mockReturnValue({
|
|
approvals: { allowlist: [], file: { version: 1, agents: {} } },
|
|
hostSecurity: "allowlist",
|
|
hostAsk: "on-miss",
|
|
askFallback: "deny",
|
|
});
|
|
|
|
const result = await executeNodeHostCommand({
|
|
command: "bun ./script.ts",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "allowlist",
|
|
ask: "on-miss",
|
|
autoReview: true,
|
|
autoReviewer,
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings,
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
});
|
|
|
|
expect(result.details?.status).toBe("approval-pending");
|
|
expect(autoReviewer).toHaveBeenCalledTimes(1);
|
|
expect(createAndRegisterDefaultExecApprovalRequestMock).toHaveBeenCalledTimes(1);
|
|
expect(warnings.join("\n")).toContain("needs a person");
|
|
});
|
|
|
|
it.each([
|
|
{
|
|
name: "ask always",
|
|
nodeSecurity: "full",
|
|
nodeAsk: "always",
|
|
},
|
|
{
|
|
name: "deny security",
|
|
nodeSecurity: "deny",
|
|
nodeAsk: "off",
|
|
},
|
|
] as const)(
|
|
"requests human approval when node policy has $name floor",
|
|
async ({ nodeSecurity, nodeAsk }) => {
|
|
const autoReviewer = vi.fn<ExecAutoReviewer>(async () => ({
|
|
decision: "allow-once",
|
|
risk: "low",
|
|
rationale: "test reviewer would allow it",
|
|
}));
|
|
resolveExecHostApprovalContextMock.mockReturnValue({
|
|
approvals: { allowlist: [], file: { version: 1, agents: {} } },
|
|
hostSecurity: "allowlist",
|
|
hostAsk: "on-miss",
|
|
askFallback: "deny",
|
|
});
|
|
parsePreparedSystemRunPayloadMock.mockReturnValue({
|
|
plan: preparedPlan,
|
|
execPolicy: { security: nodeSecurity, ask: nodeAsk },
|
|
});
|
|
resolveExecApprovalsFromFileMock.mockReturnValue({
|
|
allowlist: [],
|
|
file: { version: 1, agents: {} },
|
|
agent: {
|
|
security: nodeSecurity,
|
|
ask: nodeAsk,
|
|
askFallback: "deny",
|
|
autoAllowSkills: false,
|
|
},
|
|
});
|
|
callGatewayToolMock.mockImplementation(
|
|
async (method: string, _options: unknown, params: MockNodeInvokeParams | undefined) => {
|
|
if (method === "exec.approvals.node.get") {
|
|
return { file: { version: 1, agents: {} } };
|
|
}
|
|
if (method === "exec.approval.resolve") {
|
|
return { payload: {} };
|
|
}
|
|
if (method !== "node.invoke") {
|
|
throw new Error(`unexpected gateway method: ${method}`);
|
|
}
|
|
if (params?.command === "system.run.prepare") {
|
|
return {
|
|
payload: {
|
|
plan: preparedPlan,
|
|
execPolicy: { security: nodeSecurity, ask: nodeAsk },
|
|
},
|
|
};
|
|
}
|
|
if (params?.command === "system.run") {
|
|
return {
|
|
payload: {
|
|
success: true,
|
|
stdout: "ok",
|
|
stderr: "",
|
|
exitCode: 0,
|
|
timedOut: false,
|
|
},
|
|
};
|
|
}
|
|
throw new Error(`unexpected node invoke command: ${String(params?.command)}`);
|
|
},
|
|
);
|
|
|
|
const result = await executeNodeHostCommand({
|
|
command: "bun ./script.ts",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "allowlist",
|
|
ask: "on-miss",
|
|
autoReview: true,
|
|
autoReviewer,
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
});
|
|
|
|
expect(result.details?.status).toBe("approval-pending");
|
|
expect(autoReviewer).not.toHaveBeenCalled();
|
|
expect(createAndRegisterDefaultExecApprovalRequestMock).toHaveBeenCalledTimes(1);
|
|
expect(
|
|
callGatewayToolMock.mock.calls.some(([method]) => method === "exec.approval.resolve"),
|
|
).toBe(false);
|
|
},
|
|
);
|
|
|
|
it("requests human approval when node approval policy is unavailable", async () => {
|
|
const autoReviewer = vi.fn<ExecAutoReviewer>(async () => ({
|
|
decision: "allow-once",
|
|
risk: "low",
|
|
rationale: "test reviewer would allow it",
|
|
}));
|
|
resolveExecHostApprovalContextMock.mockReturnValue({
|
|
approvals: { allowlist: [], file: { version: 1, agents: {} } },
|
|
hostSecurity: "allowlist",
|
|
hostAsk: "on-miss",
|
|
askFallback: "deny",
|
|
});
|
|
callGatewayToolMock.mockImplementation(
|
|
async (method: string, _options: unknown, params: MockNodeInvokeParams | undefined) => {
|
|
if (method === "exec.approvals.node.get") {
|
|
throw new Error("node approvals unavailable");
|
|
}
|
|
if (method === "exec.approval.resolve") {
|
|
return { payload: {} };
|
|
}
|
|
if (method !== "node.invoke") {
|
|
throw new Error(`unexpected gateway method: ${method}`);
|
|
}
|
|
if (params?.command === "system.run.prepare") {
|
|
return { payload: { plan: preparedPlan } };
|
|
}
|
|
if (params?.command === "system.run") {
|
|
return {
|
|
payload: {
|
|
success: true,
|
|
stdout: "ok",
|
|
stderr: "",
|
|
exitCode: 0,
|
|
timedOut: false,
|
|
},
|
|
};
|
|
}
|
|
throw new Error(`unexpected node invoke command: ${String(params?.command)}`);
|
|
},
|
|
);
|
|
|
|
const result = await executeNodeHostCommand({
|
|
command: "bun ./script.ts",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "allowlist",
|
|
ask: "on-miss",
|
|
autoReview: true,
|
|
autoReviewer,
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
});
|
|
|
|
expect(result.details?.status).toBe("approval-pending");
|
|
expect(autoReviewer).not.toHaveBeenCalled();
|
|
expect(createAndRegisterDefaultExecApprovalRequestMock).toHaveBeenCalledTimes(1);
|
|
expect(
|
|
callGatewayToolMock.mock.calls.some(([method]) => method === "exec.approval.resolve"),
|
|
).toBe(false);
|
|
});
|
|
|
|
it("does not use fallback-full when node approval policy is unavailable", async () => {
|
|
const autoReviewer = vi.fn<ExecAutoReviewer>(async () => ({
|
|
decision: "allow-once",
|
|
risk: "low",
|
|
rationale: "test reviewer would allow it",
|
|
}));
|
|
resolveExecHostApprovalContextMock.mockReturnValue({
|
|
approvals: { allowlist: [], file: { version: 1, agents: {} } },
|
|
hostSecurity: "allowlist",
|
|
hostAsk: "on-miss",
|
|
askFallback: "full",
|
|
});
|
|
callGatewayToolMock.mockImplementation(
|
|
async (method: string, _options: unknown, params: MockNodeInvokeParams | undefined) => {
|
|
if (method === "exec.approvals.node.get") {
|
|
throw new Error("node approvals unavailable");
|
|
}
|
|
if (method !== "node.invoke") {
|
|
throw new Error(`unexpected gateway method: ${method}`);
|
|
}
|
|
if (params?.command === "system.run.prepare") {
|
|
return { payload: { plan: preparedPlan } };
|
|
}
|
|
if (params?.command === "system.run") {
|
|
return {
|
|
payload: {
|
|
success: true,
|
|
stdout: "should-not-run",
|
|
stderr: "",
|
|
exitCode: 0,
|
|
timedOut: false,
|
|
},
|
|
};
|
|
}
|
|
throw new Error(`unexpected node invoke command: ${String(params?.command)}`);
|
|
},
|
|
);
|
|
resolveApprovalDecisionOrUndefinedMock.mockResolvedValue(null);
|
|
createExecApprovalDecisionStateMock.mockReturnValue({
|
|
baseDecision: { timedOut: true },
|
|
approvedByAsk: true,
|
|
deniedReason: null,
|
|
});
|
|
enforceStrictInlineEvalApprovalBoundaryMock.mockImplementation((value) =>
|
|
value.requiresAutoReviewHumanApproval === true && value.baseDecision.timedOut
|
|
? { approvedByAsk: false, deniedReason: "approval-timeout" }
|
|
: { approvedByAsk: value.approvedByAsk, deniedReason: value.deniedReason },
|
|
);
|
|
|
|
const result = await executeNodeHostCommand({
|
|
command: "bun ./script.ts",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "allowlist",
|
|
ask: "on-miss",
|
|
autoReview: true,
|
|
autoReviewer,
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
});
|
|
|
|
expect(result.details?.status).toBe("approval-pending");
|
|
expect(autoReviewer).not.toHaveBeenCalled();
|
|
await vi.waitFor(() => {
|
|
expect(sendExecApprovalFollowupResultMock).toHaveBeenCalledWith(
|
|
expect.objectContaining({
|
|
approvalId: "approval-1",
|
|
sessionKey: "requested-session",
|
|
}),
|
|
"Exec denied (node=node-1 id=approval-1, approval-timeout): bun ./script.ts",
|
|
);
|
|
});
|
|
expect(
|
|
callGatewayToolMock.mock.calls.some(
|
|
([method, , params]) =>
|
|
method === "node.invoke" &&
|
|
(params as MockNodeInvokeParams | undefined)?.command === "system.run",
|
|
),
|
|
).toBe(false);
|
|
});
|
|
|
|
it("auto-reviews strict inline-eval commands before asking a human", async () => {
|
|
const inlinePlan = {
|
|
argv: ["/bin/sh", "-lc", "python3 -c 'print(1)'"],
|
|
cwd: "/tmp/work",
|
|
commandText: `/bin/sh -lc "python3 -c 'print(1)'"`,
|
|
commandPreview: "python3 -c 'print(1)'",
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
};
|
|
parsePreparedSystemRunPayloadMock.mockReturnValue({
|
|
plan: inlinePlan,
|
|
execPolicy: { security: "full", ask: "off" },
|
|
});
|
|
const autoReviewer = vi.fn<ExecAutoReviewer>(async () => ({
|
|
decision: "allow-once",
|
|
risk: "low",
|
|
rationale: "safe inline eval",
|
|
}));
|
|
detectInterpreterInlineEvalArgvMock.mockImplementation((argv?: unknown) =>
|
|
Array.isArray(argv) && argv[0] === "python3" ? INLINE_EVAL_HIT : null,
|
|
);
|
|
evaluateShellAllowlistMock.mockImplementation((params?: { command?: string }) => {
|
|
const command = params?.command ?? "";
|
|
const segment = command.startsWith("/bin/sh")
|
|
? {
|
|
resolution: null,
|
|
argv: ["/bin/sh", "-lc", "python3 -c 'print(1)'"],
|
|
raw: `/bin/sh -lc "python3 -c 'print(1)'"`,
|
|
}
|
|
: {
|
|
resolution: null,
|
|
argv: ["python3", "-c", "print(1)"],
|
|
raw: "python3 -c 'print(1)'",
|
|
};
|
|
return {
|
|
allowlistMatches: [],
|
|
analysisOk: true,
|
|
allowlistSatisfied: false,
|
|
segments: [segment],
|
|
segmentAllowlistEntries: [],
|
|
};
|
|
});
|
|
resolveExecHostApprovalContextMock.mockReturnValue({
|
|
approvals: { allowlist: [], file: { version: 1, agents: {} } },
|
|
hostSecurity: "allowlist",
|
|
hostAsk: "on-miss",
|
|
askFallback: "deny",
|
|
});
|
|
const warnings: string[] = [];
|
|
|
|
const result = await executeNodeHostCommand({
|
|
command: "python3 -c 'print(1)'",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "allowlist",
|
|
ask: "on-miss",
|
|
autoReview: true,
|
|
autoReviewer,
|
|
strictInlineEval: true,
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings,
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
});
|
|
|
|
expect(result.details?.status).toBe("completed");
|
|
expect(autoReviewer).toHaveBeenCalledWith(
|
|
expect.objectContaining({
|
|
command: `/bin/sh -lc "python3 -c 'print(1)'"`,
|
|
argv: ["python3", "-c", "print(1)"],
|
|
host: "node",
|
|
reason: "strict-inline-eval",
|
|
analysis: expect.objectContaining({
|
|
inlineEval: true,
|
|
}),
|
|
}),
|
|
);
|
|
expect(createAndRegisterDefaultExecApprovalRequestMock).not.toHaveBeenCalled();
|
|
expect(warnings[0]).toContain("requires reviewer or explicit approval");
|
|
});
|
|
|
|
it("keeps security audit suppression edits off the auto-review path", async () => {
|
|
const autoReviewer = vi.fn<ExecAutoReviewer>(async () => ({
|
|
decision: "allow-once",
|
|
risk: "low",
|
|
rationale: "test reviewer would allow it",
|
|
}));
|
|
const warnings: string[] = [];
|
|
commandRequiresSecurityAuditSuppressionApprovalMock.mockReturnValue(true);
|
|
resolveExecHostApprovalContextMock.mockReturnValue({
|
|
approvals: { allowlist: [], file: { version: 1, agents: {} } },
|
|
hostSecurity: "allowlist",
|
|
hostAsk: "on-miss",
|
|
askFallback: "deny",
|
|
});
|
|
|
|
const result = await executeNodeHostCommand({
|
|
command: "openclaw config set security.audit.suppressions '[]'",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "allowlist",
|
|
ask: "on-miss",
|
|
autoReview: true,
|
|
autoReviewer,
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings,
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
});
|
|
|
|
expect(result.details?.status).toBe("approval-pending");
|
|
expect(autoReviewer).not.toHaveBeenCalled();
|
|
expect(createAndRegisterDefaultExecApprovalRequestMock).toHaveBeenCalledTimes(1);
|
|
expect(warnings).toContain(
|
|
"Warning: security audit suppression changes require explicit approval unless exec is running in yolo mode.",
|
|
);
|
|
});
|
|
|
|
it("requests human approval when node auto-review cannot bind a single parsed command", async () => {
|
|
const autoReviewer = vi.fn<ExecAutoReviewer>(async () => ({
|
|
decision: "allow-once",
|
|
risk: "low",
|
|
rationale: "test reviewer would allow it",
|
|
}));
|
|
evaluateShellAllowlistMock.mockReturnValue({
|
|
allowlistMatches: [],
|
|
analysisOk: true,
|
|
allowlistSatisfied: false,
|
|
segments: [
|
|
{ raw: "echo ok", resolution: null, argv: ["echo", "ok"] },
|
|
{ raw: "pwd", resolution: null, argv: ["pwd"] },
|
|
],
|
|
segmentAllowlistEntries: [],
|
|
});
|
|
resolveExecHostApprovalContextMock.mockReturnValue({
|
|
approvals: { allowlist: [], file: { version: 1, agents: {} } },
|
|
hostSecurity: "allowlist",
|
|
hostAsk: "on-miss",
|
|
askFallback: "deny",
|
|
});
|
|
|
|
const result = await executeNodeHostCommand({
|
|
command: "echo ok; pwd",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "allowlist",
|
|
ask: "on-miss",
|
|
autoReview: true,
|
|
autoReviewer,
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
});
|
|
|
|
expect(result.details?.status).toBe("approval-pending");
|
|
expect(autoReviewer).not.toHaveBeenCalled();
|
|
expect(createAndRegisterDefaultExecApprovalRequestMock).toHaveBeenCalledTimes(1);
|
|
});
|
|
|
|
it("requests human approval when node runtime policy requires ask always", async () => {
|
|
const autoReviewer = vi.fn<ExecAutoReviewer>(async () => ({
|
|
decision: "allow-once",
|
|
risk: "low",
|
|
rationale: "test reviewer would allow it",
|
|
}));
|
|
parsePreparedSystemRunPayloadMock.mockReturnValue({
|
|
plan: preparedPlan,
|
|
execPolicy: { security: "full", ask: "always" },
|
|
});
|
|
resolveExecApprovalsFromFileMock.mockReturnValue({
|
|
allowlist: [],
|
|
file: { version: 1, agents: {} },
|
|
agent: {
|
|
security: "full",
|
|
ask: "off",
|
|
askFallback: "deny",
|
|
autoAllowSkills: false,
|
|
},
|
|
});
|
|
resolveExecHostApprovalContextMock.mockReturnValue({
|
|
approvals: { allowlist: [], file: { version: 1, agents: {} } },
|
|
hostSecurity: "allowlist",
|
|
hostAsk: "on-miss",
|
|
askFallback: "deny",
|
|
});
|
|
|
|
const result = await executeNodeHostCommand({
|
|
command: "bun ./script.ts",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "allowlist",
|
|
ask: "on-miss",
|
|
autoReview: true,
|
|
autoReviewer,
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
});
|
|
|
|
expect(result.details?.status).toBe("approval-pending");
|
|
expect(autoReviewer).not.toHaveBeenCalled();
|
|
expect(createAndRegisterDefaultExecApprovalRequestMock).toHaveBeenCalledTimes(1);
|
|
expect(resolveExecApprovalAllowedDecisionsMock).toHaveBeenCalledWith({
|
|
ask: "always",
|
|
allowAlwaysPersistence: {
|
|
kind: "patterns",
|
|
patterns: [{ pattern: "/trusted/bin/tool" }],
|
|
},
|
|
});
|
|
expect(requireRegisteredApprovalRequest().unavailableDecisions).toEqual(["allow-always"]);
|
|
expect(buildExecApprovalPendingToolResultMock).toHaveBeenCalledWith(
|
|
expect.objectContaining({
|
|
allowedDecisions: ["allow-once", "deny"],
|
|
}),
|
|
);
|
|
});
|
|
|
|
it("omits allow-always from node approval prompts when node runtime policy is missing", async () => {
|
|
const autoReviewer = vi.fn<ExecAutoReviewer>(async () => ({
|
|
decision: "allow-once",
|
|
risk: "low",
|
|
rationale: "test reviewer would allow it",
|
|
}));
|
|
parsePreparedSystemRunPayloadMock.mockReturnValue({
|
|
plan: preparedPlan,
|
|
execPolicy: undefined,
|
|
});
|
|
resolveExecHostApprovalContextMock.mockReturnValue({
|
|
approvals: { allowlist: [], file: { version: 1, agents: {} } },
|
|
hostSecurity: "allowlist",
|
|
hostAsk: "on-miss",
|
|
askFallback: "deny",
|
|
});
|
|
|
|
const result = await executeNodeHostCommand({
|
|
command: "bun ./script.ts",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "allowlist",
|
|
ask: "on-miss",
|
|
autoReview: true,
|
|
autoReviewer,
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
});
|
|
|
|
expect(result.details?.status).toBe("approval-pending");
|
|
expect(autoReviewer).not.toHaveBeenCalled();
|
|
expect(resolveExecApprovalAllowedDecisionsMock).toHaveBeenCalledWith({
|
|
ask: "always",
|
|
allowAlwaysPersistence: {
|
|
kind: "patterns",
|
|
patterns: [{ pattern: "/trusted/bin/tool" }],
|
|
},
|
|
});
|
|
expect(requireRegisteredApprovalRequest().unavailableDecisions).toEqual(["allow-always"]);
|
|
});
|
|
|
|
it("offers allow-always for prepared node commands with complete node coverage", async () => {
|
|
const preparedWrapperPlan = {
|
|
...preparedPlan,
|
|
argv: ["/bin/sh", "-lc", "git status"],
|
|
commandText: '/bin/sh -lc "git status"',
|
|
commandPreview: "git status",
|
|
};
|
|
mockGatewayInvokesWithNodeApprovals({ version: 1, agents: {} });
|
|
usePolicyApprovalRequirementMock();
|
|
parsePreparedSystemRunPayloadMock.mockReturnValueOnce({
|
|
plan: preparedWrapperPlan,
|
|
execPolicy: { security: "full", ask: "off" },
|
|
allowAlwaysCoverage: {
|
|
complete: true,
|
|
patterns: [{ pattern: "/node/bin/git" }],
|
|
},
|
|
});
|
|
resolveAllowAlwaysPersistenceDecisionMock.mockImplementationOnce((params) => {
|
|
const commandText = params.commandText?.trim();
|
|
return params.preparedCoverage?.complete === true && params.preparedCoverage.patterns.length
|
|
? {
|
|
kind: "patterns",
|
|
...(commandText ? { commandText } : {}),
|
|
patterns: params.preparedCoverage.patterns,
|
|
}
|
|
: {
|
|
kind: "one-shot",
|
|
reasons: ["no-reusable-pattern"],
|
|
};
|
|
});
|
|
resolveExecHostApprovalContextMock.mockReturnValue({
|
|
approvals: { allowlist: [], file: { version: 1, agents: {} } },
|
|
hostSecurity: "allowlist",
|
|
hostAsk: "on-miss",
|
|
askFallback: "deny",
|
|
});
|
|
resolveApprovalDecisionOrUndefinedMock.mockResolvedValue(undefined);
|
|
|
|
const result = await executeNodeHostCommand({
|
|
command: "git status",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "allowlist",
|
|
ask: "on-miss",
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
});
|
|
|
|
expect(result.details?.status).toBe("approval-pending");
|
|
expect(resolveAllowAlwaysPersistenceDecisionMock).toHaveBeenCalledWith(
|
|
expect.objectContaining({
|
|
commandText: '/bin/sh -lc "git status"',
|
|
preparedCoverage: {
|
|
complete: true,
|
|
patterns: [{ pattern: "/node/bin/git" }],
|
|
},
|
|
}),
|
|
);
|
|
expect(resolveExecApprovalAllowedDecisionsMock).toHaveBeenCalledWith({
|
|
ask: "on-miss",
|
|
allowAlwaysPersistence: {
|
|
kind: "patterns",
|
|
commandText: '/bin/sh -lc "git status"',
|
|
patterns: [{ pattern: "/node/bin/git" }],
|
|
},
|
|
});
|
|
expect(requireRegisteredApprovalRequest().unavailableDecisions).toBeUndefined();
|
|
});
|
|
|
|
it("does not use fallback-full when node auto-review cannot parse the command", async () => {
|
|
const autoReviewer = vi.fn<ExecAutoReviewer>(async () => ({
|
|
decision: "allow-once",
|
|
risk: "low",
|
|
rationale: "test reviewer would allow it",
|
|
}));
|
|
evaluateShellAllowlistMock.mockReturnValue({
|
|
allowlistMatches: [],
|
|
analysisOk: false,
|
|
allowlistSatisfied: false,
|
|
segments: [],
|
|
segmentAllowlistEntries: [],
|
|
});
|
|
resolveExecHostApprovalContextMock.mockReturnValue({
|
|
approvals: { allowlist: [], file: { version: 1, agents: {} } },
|
|
hostSecurity: "allowlist",
|
|
hostAsk: "on-miss",
|
|
askFallback: "full",
|
|
});
|
|
resolveApprovalDecisionOrUndefinedMock.mockResolvedValue(null);
|
|
createExecApprovalDecisionStateMock.mockReturnValue({
|
|
baseDecision: { timedOut: true },
|
|
approvedByAsk: true,
|
|
deniedReason: null,
|
|
});
|
|
enforceStrictInlineEvalApprovalBoundaryMock.mockImplementation((value) =>
|
|
value.requiresAutoReviewHumanApproval === true && value.baseDecision.timedOut
|
|
? { approvedByAsk: false, deniedReason: "approval-timeout" }
|
|
: { approvedByAsk: value.approvedByAsk, deniedReason: value.deniedReason },
|
|
);
|
|
|
|
const result = await executeNodeHostCommand({
|
|
command: "echo 'unterminated",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "allowlist",
|
|
ask: "on-miss",
|
|
autoReview: true,
|
|
autoReviewer,
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
});
|
|
|
|
expect(result.details?.status).toBe("approval-pending");
|
|
expect(autoReviewer).not.toHaveBeenCalled();
|
|
await vi.waitFor(() => {
|
|
expect(sendExecApprovalFollowupResultMock).toHaveBeenCalledWith(
|
|
expect.objectContaining({
|
|
approvalId: "approval-1",
|
|
sessionKey: "requested-session",
|
|
}),
|
|
"Exec denied (node=node-1 id=approval-1, approval-timeout): echo 'unterminated",
|
|
);
|
|
});
|
|
expect(
|
|
callGatewayToolMock.mock.calls.some(
|
|
([method, , params]) =>
|
|
method === "node.invoke" &&
|
|
(params as MockNodeInvokeParams | undefined)?.command === "system.run",
|
|
),
|
|
).toBe(false);
|
|
});
|
|
|
|
it("does not use fallback-full when node auto-review asks for human approval", async () => {
|
|
const autoReviewer = vi.fn<ExecAutoReviewer>(async () => ({
|
|
decision: "ask",
|
|
risk: "medium",
|
|
rationale: "needs a person",
|
|
}));
|
|
resolveExecHostApprovalContextMock.mockReturnValue({
|
|
approvals: { allowlist: [], file: { version: 1, agents: {} } },
|
|
hostSecurity: "allowlist",
|
|
hostAsk: "on-miss",
|
|
askFallback: "full",
|
|
});
|
|
resolveApprovalDecisionOrUndefinedMock.mockResolvedValue(null);
|
|
createExecApprovalDecisionStateMock.mockReturnValue({
|
|
baseDecision: { timedOut: true },
|
|
approvedByAsk: true,
|
|
deniedReason: null,
|
|
});
|
|
enforceStrictInlineEvalApprovalBoundaryMock.mockImplementation((value) =>
|
|
value.requiresAutoReviewHumanApproval === true && value.baseDecision.timedOut
|
|
? { approvedByAsk: false, deniedReason: "approval-timeout" }
|
|
: { approvedByAsk: value.approvedByAsk, deniedReason: value.deniedReason },
|
|
);
|
|
|
|
const result = await executeNodeHostCommand({
|
|
command: "bun ./script.ts",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "allowlist",
|
|
ask: "on-miss",
|
|
autoReview: true,
|
|
autoReviewer,
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
});
|
|
|
|
expect(result.details?.status).toBe("approval-pending");
|
|
await vi.waitFor(() => {
|
|
expect(sendExecApprovalFollowupResultMock).toHaveBeenCalledWith(
|
|
expect.objectContaining({
|
|
approvalId: "approval-1",
|
|
sessionKey: "requested-session",
|
|
}),
|
|
"Exec denied (node=node-1 id=approval-1, approval-timeout): bun ./script.ts",
|
|
);
|
|
});
|
|
expect(
|
|
callGatewayToolMock.mock.calls.some(
|
|
([method, , params]) =>
|
|
method === "node.invoke" &&
|
|
(params as MockNodeInvokeParams | undefined)?.command === "system.run",
|
|
),
|
|
).toBe(false);
|
|
});
|
|
|
|
it("builds a local systemRunPlan when approval is required and the node omits prepare", async () => {
|
|
listNodesMock.mockResolvedValueOnce([
|
|
{
|
|
nodeId: "node-1",
|
|
commands: ["system.run", "system.which", "system.notify"],
|
|
platform: "darwin",
|
|
},
|
|
]);
|
|
resolveExecHostApprovalContextMock.mockReturnValue({
|
|
approvals: { allowlist: [], file: { version: 1, agents: {} } },
|
|
hostSecurity: "full",
|
|
hostAsk: "always",
|
|
askFallback: "deny",
|
|
});
|
|
|
|
const result = await executeNodeHostCommand({
|
|
command: "bun ./script.ts",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "full",
|
|
ask: "off",
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
});
|
|
|
|
expect(result.details?.status).toBe("approval-pending");
|
|
expect(parsePreparedSystemRunPayloadMock).not.toHaveBeenCalled();
|
|
const expectedPlan = {
|
|
argv: ["/bin/sh", "-lc", "bun ./script.ts"],
|
|
cwd: "/tmp/work",
|
|
commandText: '/bin/sh -lc "bun ./script.ts"',
|
|
commandPreview: "bun ./script.ts",
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
};
|
|
expect(requireRegisteredApprovalRequest().systemRunPlan).toEqual(expectedPlan);
|
|
|
|
await vi.waitFor(() => {
|
|
const call = requireGatewayCommand("system.run");
|
|
expect(call.callOptions).toEqual({ scopes: ["operator.write", "operator.approvals"] });
|
|
const runParams = requireRunParams(call);
|
|
expect(runParams.rawCommand).toBe(expectedPlan.commandText);
|
|
expect(runParams.systemRunPlan).toEqual(expectedPlan);
|
|
});
|
|
});
|
|
|
|
it("requires approval when node allowlist matching would depend on gateway PATH", async () => {
|
|
const allowlistEntry = { pattern: "/trusted/bin/tool" };
|
|
mockGatewayInvokesWithNodeApprovals({ version: 1, agents: {} });
|
|
usePolicyApprovalRequirementMock();
|
|
resolveExecApprovalsFromFileMock.mockReturnValue({
|
|
agent: { security: "allowlist", ask: "on-miss" },
|
|
allowlist: [allowlistEntry],
|
|
file: { version: 1, agents: {} },
|
|
});
|
|
evaluateShellAllowlistMock.mockImplementation((raw: unknown) => {
|
|
const params = raw as ShellAllowlistMockParams;
|
|
const hasNodeAllowlist = (params.allowlist ?? []).length > 0;
|
|
const gatewayPathWouldMatch = params.env?.PATH?.includes("/trusted/bin") === true;
|
|
return buildAllowlistEvalResult({
|
|
allowlistSatisfied: hasNodeAllowlist && gatewayPathWouldMatch,
|
|
segmentAllowlistEntry: allowlistEntry,
|
|
});
|
|
});
|
|
resolveExecHostApprovalContextMock.mockReturnValue({
|
|
approvals: { allowlist: [], file: { version: 1, agents: {} } },
|
|
hostSecurity: "allowlist",
|
|
hostAsk: "on-miss",
|
|
askFallback: "deny",
|
|
});
|
|
resolveApprovalDecisionOrUndefinedMock.mockResolvedValue(undefined);
|
|
|
|
const result = await executeNodeHostCommand({
|
|
command: "tool --version",
|
|
workdir: "/tmp/work",
|
|
env: { PATH: "/trusted/bin:/usr/bin" },
|
|
security: "allowlist",
|
|
ask: "on-miss",
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
});
|
|
|
|
expect(result.details?.status).toBe("approval-pending");
|
|
expect(registerExecApprovalRequestForHostOrThrowMock).toHaveBeenCalledTimes(1);
|
|
expect(requireRegisteredApprovalRequest().env).toBeUndefined();
|
|
const evalEnvs = evaluateShellAllowlistMock.mock.calls.map(
|
|
([raw]) => (raw as ShellAllowlistMockParams).env,
|
|
);
|
|
expect(evalEnvs.length).toBeGreaterThanOrEqual(2);
|
|
expect(evalEnvs.every((env) => env?.PATH === "" && env?.Path === "")).toBe(true);
|
|
await vi.waitFor(() => {
|
|
expect(resolveApprovalDecisionOrUndefinedMock).toHaveBeenCalledTimes(1);
|
|
});
|
|
});
|
|
|
|
it("reuses exact node allow-always command entries for prechecks", async () => {
|
|
const allowlistEntry = {
|
|
pattern: "/trusted/bin/tool",
|
|
source: "allow-always" as const,
|
|
};
|
|
const commandMarker = { pattern: nodeCommandMarker, source: "allow-always" as const };
|
|
mockGatewayInvokesWithNodeApprovals({ version: 1, agents: {} });
|
|
usePolicyApprovalRequirementMock();
|
|
resolveExecApprovalsFromFileMock.mockReturnValue({
|
|
agent: { security: "allowlist", ask: "on-miss" },
|
|
allowlist: [commandMarker, allowlistEntry],
|
|
file: { version: 1, agents: {} },
|
|
});
|
|
evaluateShellAllowlistMock.mockImplementation((raw: unknown) => {
|
|
const params = raw as ShellAllowlistMockParams;
|
|
expect(params.env?.PATH).toBe("");
|
|
expect(params.env?.Path).toBe("");
|
|
return {
|
|
allowlistMatches: [],
|
|
analysisOk: true,
|
|
allowlistSatisfied: false,
|
|
segments: [{ resolution: null, argv: ["/trusted/bin/tool", "--version"] }],
|
|
segmentAllowlistEntries: [null],
|
|
};
|
|
});
|
|
resolveAllowAlwaysPatternCoverageMock.mockImplementation((raw: unknown) => {
|
|
const params = raw as { segments?: MockAllowlistSegment[]; env?: NodeJS.ProcessEnv };
|
|
expect(params.env?.PATH).toBe("");
|
|
expect(params.env?.Path).toBe("");
|
|
expect(params.segments?.[0]?.argv[0]).toBe("/trusted/bin/tool");
|
|
return {
|
|
complete: true,
|
|
patterns: [{ pattern: "/trusted/bin/tool" }],
|
|
};
|
|
});
|
|
resolveExecHostApprovalContextMock.mockReturnValue({
|
|
approvals: { allowlist: [], file: { version: 1, agents: {} } },
|
|
hostSecurity: "allowlist",
|
|
hostAsk: "on-miss",
|
|
askFallback: "deny",
|
|
});
|
|
|
|
const result = await executeNodeHostCommand({
|
|
command: "/trusted/bin/tool --version",
|
|
workdir: "/tmp/work",
|
|
env: { PATH: "/gateway/bin:/usr/bin" },
|
|
security: "allowlist",
|
|
ask: "on-miss",
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
});
|
|
|
|
expect(result.details?.status).toBe("completed");
|
|
expect(registerExecApprovalRequestForHostOrThrowMock).not.toHaveBeenCalled();
|
|
expect(requiresExecApprovalMock).toHaveBeenLastCalledWith(
|
|
expect.objectContaining({
|
|
analysisOk: true,
|
|
allowlistSatisfied: false,
|
|
durableApprovalSatisfied: true,
|
|
}),
|
|
);
|
|
expect(requireRunParams(requireGatewayCommand("system.run")).env).toBeUndefined();
|
|
});
|
|
|
|
it("omits allow-always from node approval prompts when persistence is one-shot", async () => {
|
|
mockGatewayInvokesWithNodeApprovals({ version: 1, agents: {} });
|
|
usePolicyApprovalRequirementMock();
|
|
resolveAllowAlwaysPersistenceDecisionMock.mockReturnValue({
|
|
kind: "one-shot",
|
|
reasons: ["unplanned"],
|
|
});
|
|
resolveExecHostApprovalContextMock.mockReturnValue({
|
|
approvals: { allowlist: [], file: { version: 1, agents: {} } },
|
|
hostSecurity: "allowlist",
|
|
hostAsk: "on-miss",
|
|
askFallback: "deny",
|
|
});
|
|
resolveApprovalDecisionOrUndefinedMock.mockResolvedValue(undefined);
|
|
|
|
const result = await executeNodeHostCommand({
|
|
command: "bun ./script.ts",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "allowlist",
|
|
ask: "on-miss",
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
});
|
|
|
|
expect(result.details?.status).toBe("approval-pending");
|
|
expect(resolveAllowAlwaysPersistenceDecisionMock).toHaveBeenCalledWith(
|
|
expect.objectContaining({
|
|
commandText: "bun ./script.ts",
|
|
platform: process.platform,
|
|
runtimePayload: false,
|
|
}),
|
|
);
|
|
expect(resolveExecApprovalAllowedDecisionsMock).toHaveBeenCalledWith({
|
|
ask: "on-miss",
|
|
allowAlwaysPersistence: { kind: "one-shot", reasons: ["unplanned"] },
|
|
});
|
|
expect(requireRegisteredApprovalRequest().unavailableDecisions).toEqual(["allow-always"]);
|
|
expect(buildExecApprovalPendingToolResultMock).toHaveBeenCalledWith(
|
|
expect.objectContaining({
|
|
allowedDecisions: ["allow-once", "deny"],
|
|
}),
|
|
);
|
|
});
|
|
|
|
it("reuses de-duplicated node allow-always metadata for repeated command segments", async () => {
|
|
const allowlistEntry = {
|
|
pattern: "/trusted/bin/tool",
|
|
source: "allow-always" as const,
|
|
};
|
|
const commandMarker = { pattern: nodeCommandMarker, source: "allow-always" as const };
|
|
mockGatewayInvokesWithNodeApprovals({ version: 1, agents: {} });
|
|
usePolicyApprovalRequirementMock();
|
|
resolveExecApprovalsFromFileMock.mockReturnValue({
|
|
agent: { security: "allowlist", ask: "on-miss" },
|
|
allowlist: [commandMarker, allowlistEntry],
|
|
file: { version: 1, agents: {} },
|
|
});
|
|
evaluateShellAllowlistMock.mockReturnValue({
|
|
allowlistMatches: [],
|
|
analysisOk: true,
|
|
allowlistSatisfied: false,
|
|
segments: [
|
|
{ resolution: null, argv: ["/trusted/bin/tool", "a"] },
|
|
{ resolution: null, argv: ["/trusted/bin/tool", "b"] },
|
|
],
|
|
segmentAllowlistEntries: [null, null],
|
|
});
|
|
resolveAllowAlwaysPatternCoverageMock.mockReturnValue({
|
|
complete: true,
|
|
patterns: [{ pattern: "/trusted/bin/tool" }],
|
|
});
|
|
resolveExecHostApprovalContextMock.mockReturnValue({
|
|
approvals: { allowlist: [], file: { version: 1, agents: {} } },
|
|
hostSecurity: "allowlist",
|
|
hostAsk: "on-miss",
|
|
askFallback: "deny",
|
|
});
|
|
|
|
const result = await executeNodeHostCommand({
|
|
command: "/trusted/bin/tool a && /trusted/bin/tool b",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "allowlist",
|
|
ask: "on-miss",
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
});
|
|
|
|
expect(result.details?.status).toBe("completed");
|
|
expect(registerExecApprovalRequestForHostOrThrowMock).not.toHaveBeenCalled();
|
|
expect(requiresExecApprovalMock).toHaveBeenLastCalledWith(
|
|
expect.objectContaining({
|
|
allowlistSatisfied: false,
|
|
durableApprovalSatisfied: true,
|
|
}),
|
|
);
|
|
});
|
|
|
|
it("does not reuse partial node allow-always metadata for compound commands", async () => {
|
|
const allowlistEntry = {
|
|
pattern: "/trusted/bin/foo",
|
|
source: "allow-always" as const,
|
|
};
|
|
const commandMarker = { pattern: nodeCommandMarker, source: "allow-always" as const };
|
|
mockGatewayInvokesWithNodeApprovals({ version: 1, agents: {} });
|
|
usePolicyApprovalRequirementMock();
|
|
resolveExecApprovalsFromFileMock.mockReturnValue({
|
|
agent: { security: "allowlist", ask: "on-miss" },
|
|
allowlist: [commandMarker, allowlistEntry],
|
|
file: { version: 1, agents: {} },
|
|
});
|
|
evaluateShellAllowlistMock.mockReturnValue({
|
|
allowlistMatches: [],
|
|
analysisOk: true,
|
|
allowlistSatisfied: false,
|
|
segments: [
|
|
{ resolution: null, argv: ["foo"] },
|
|
{ resolution: null, argv: ["bar"] },
|
|
],
|
|
segmentAllowlistEntries: [null, null],
|
|
});
|
|
resolveAllowAlwaysPatternCoverageMock.mockReturnValue({
|
|
complete: true,
|
|
patterns: [{ pattern: "/trusted/bin/foo" }, { pattern: "/trusted/bin/bar" }],
|
|
});
|
|
resolveExecHostApprovalContextMock.mockReturnValue({
|
|
approvals: { allowlist: [], file: { version: 1, agents: {} } },
|
|
hostSecurity: "allowlist",
|
|
hostAsk: "on-miss",
|
|
askFallback: "deny",
|
|
});
|
|
resolveApprovalDecisionOrUndefinedMock.mockResolvedValue(undefined);
|
|
|
|
const result = await executeNodeHostCommand({
|
|
command: "foo && bar",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "allowlist",
|
|
ask: "on-miss",
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
});
|
|
|
|
expect(result.details?.status).toBe("approval-pending");
|
|
expect(registerExecApprovalRequestForHostOrThrowMock).toHaveBeenCalledTimes(1);
|
|
expect(requiresExecApprovalMock).toHaveBeenLastCalledWith(
|
|
expect.objectContaining({
|
|
allowlistSatisfied: false,
|
|
durableApprovalSatisfied: false,
|
|
}),
|
|
);
|
|
});
|
|
|
|
it("does not reuse a node command marker when concrete allow-always coverage is empty", async () => {
|
|
const commandMarker = { pattern: nodeCommandMarker, source: "allow-always" as const };
|
|
mockGatewayInvokesWithNodeApprovals({ version: 1, agents: {} });
|
|
usePolicyApprovalRequirementMock();
|
|
resolveExecApprovalsFromFileMock.mockReturnValue({
|
|
agent: { security: "allowlist", ask: "on-miss" },
|
|
allowlist: [commandMarker],
|
|
file: { version: 1, agents: {} },
|
|
});
|
|
evaluateShellAllowlistMock.mockReturnValue({
|
|
allowlistMatches: [],
|
|
analysisOk: true,
|
|
allowlistSatisfied: false,
|
|
segments: [{ resolution: null, argv: ["tool", "--version"] }],
|
|
segmentAllowlistEntries: [null],
|
|
});
|
|
resolveAllowAlwaysPatternCoverageMock.mockReturnValue({
|
|
complete: false,
|
|
patterns: [],
|
|
});
|
|
resolveExecHostApprovalContextMock.mockReturnValue({
|
|
approvals: { allowlist: [], file: { version: 1, agents: {} } },
|
|
hostSecurity: "allowlist",
|
|
hostAsk: "on-miss",
|
|
askFallback: "deny",
|
|
});
|
|
resolveApprovalDecisionOrUndefinedMock.mockResolvedValue(undefined);
|
|
|
|
const result = await executeNodeHostCommand({
|
|
command: "tool --version",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "allowlist",
|
|
ask: "on-miss",
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
});
|
|
|
|
expect(result.details?.status).toBe("approval-pending");
|
|
expect(registerExecApprovalRequestForHostOrThrowMock).toHaveBeenCalledTimes(1);
|
|
expect(requiresExecApprovalMock).toHaveBeenLastCalledWith(
|
|
expect.objectContaining({
|
|
allowlistSatisfied: false,
|
|
durableApprovalSatisfied: false,
|
|
}),
|
|
);
|
|
});
|
|
|
|
it("reuses current node-reported coverage when gateway analysis cannot resolve node paths", async () => {
|
|
const commandMarker = { pattern: nodeCommandMarker, source: "allow-always" as const };
|
|
const allowlistEntry = {
|
|
pattern: "/node/bin/tool",
|
|
source: "allow-always" as const,
|
|
};
|
|
mockGatewayInvokesWithNodeApprovals({ version: 1, agents: {} });
|
|
usePolicyApprovalRequirementMock();
|
|
parsePreparedSystemRunPayloadMock.mockReturnValueOnce({
|
|
plan: preparedPlan,
|
|
execPolicy: { security: "full", ask: "off" },
|
|
allowAlwaysCoverage: {
|
|
complete: true,
|
|
patterns: [{ pattern: "/node/bin/tool" }],
|
|
},
|
|
});
|
|
resolveExecApprovalsFromFileMock.mockReturnValue({
|
|
agent: { security: "allowlist", ask: "on-miss" },
|
|
allowlist: [commandMarker, allowlistEntry],
|
|
file: { version: 1, agents: {} },
|
|
});
|
|
evaluateShellAllowlistMock.mockReturnValue({
|
|
allowlistMatches: [],
|
|
analysisOk: true,
|
|
allowlistSatisfied: false,
|
|
segments: [{ resolution: null, argv: ["tool", "--version"] }],
|
|
segmentAllowlistEntries: [null],
|
|
});
|
|
resolveAllowAlwaysPatternCoverageMock.mockReturnValue({
|
|
complete: false,
|
|
patterns: [],
|
|
});
|
|
resolveExecHostApprovalContextMock.mockReturnValue({
|
|
approvals: { allowlist: [], file: { version: 1, agents: {} } },
|
|
hostSecurity: "allowlist",
|
|
hostAsk: "on-miss",
|
|
askFallback: "deny",
|
|
});
|
|
|
|
const result = await executeNodeHostCommand({
|
|
command: "tool --version",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "allowlist",
|
|
ask: "on-miss",
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
});
|
|
|
|
expect(result.details?.status).toBe("completed");
|
|
expect(registerExecApprovalRequestForHostOrThrowMock).not.toHaveBeenCalled();
|
|
expect(requiresExecApprovalMock).toHaveBeenLastCalledWith(
|
|
expect.objectContaining({
|
|
allowlistSatisfied: false,
|
|
durableApprovalSatisfied: true,
|
|
}),
|
|
);
|
|
});
|
|
|
|
it("does not reuse last-used node metadata without an exact command marker", async () => {
|
|
const allowlistEntries = [
|
|
{
|
|
pattern: "/trusted/bin/foo",
|
|
argPattern: "^a\x00$",
|
|
source: "allow-always" as const,
|
|
lastUsedCommand: preparedPlan.commandText,
|
|
},
|
|
{
|
|
pattern: "/trusted/bin/foo",
|
|
argPattern: "^b\x00$",
|
|
source: "allow-always" as const,
|
|
lastUsedCommand: preparedPlan.commandText,
|
|
},
|
|
];
|
|
mockGatewayInvokesWithNodeApprovals({ version: 1, agents: {} });
|
|
usePolicyApprovalRequirementMock();
|
|
resolveExecApprovalsFromFileMock.mockReturnValue({
|
|
agent: { security: "allowlist", ask: "on-miss" },
|
|
allowlist: allowlistEntries,
|
|
file: { version: 1, agents: {} },
|
|
});
|
|
evaluateShellAllowlistMock.mockReturnValue({
|
|
allowlistMatches: [],
|
|
analysisOk: true,
|
|
allowlistSatisfied: false,
|
|
segments: [
|
|
{ resolution: null, argv: ["foo", "a"] },
|
|
{ resolution: null, argv: ["foo", "b"] },
|
|
{ resolution: null, argv: ["missingcmd"] },
|
|
],
|
|
segmentAllowlistEntries: [null, null, null],
|
|
});
|
|
resolveAllowAlwaysPatternCoverageMock.mockReturnValue({ complete: false, patterns: [] });
|
|
resolveExecHostApprovalContextMock.mockReturnValue({
|
|
approvals: { allowlist: [], file: { version: 1, agents: {} } },
|
|
hostSecurity: "allowlist",
|
|
hostAsk: "on-miss",
|
|
askFallback: "deny",
|
|
});
|
|
resolveApprovalDecisionOrUndefinedMock.mockResolvedValue(undefined);
|
|
|
|
const result = await executeNodeHostCommand({
|
|
command: "foo a && foo b && missingcmd",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "allowlist",
|
|
ask: "on-miss",
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
});
|
|
|
|
expect(result.details?.status).toBe("approval-pending");
|
|
expect(registerExecApprovalRequestForHostOrThrowMock).toHaveBeenCalledTimes(1);
|
|
expect(requiresExecApprovalMock).toHaveBeenLastCalledWith(
|
|
expect.objectContaining({
|
|
allowlistSatisfied: false,
|
|
durableApprovalSatisfied: false,
|
|
}),
|
|
);
|
|
});
|
|
|
|
it("does not reuse node allow-always metadata when only representable segments match", async () => {
|
|
const allowlistEntries = [
|
|
{
|
|
pattern: "/bin/echo",
|
|
source: "allow-always" as const,
|
|
},
|
|
{
|
|
pattern: "/bin/date",
|
|
source: "allow-always" as const,
|
|
},
|
|
];
|
|
const commandMarker = { pattern: nodeCommandMarker, source: "allow-always" as const };
|
|
mockGatewayInvokesWithNodeApprovals({ version: 1, agents: {} });
|
|
usePolicyApprovalRequirementMock();
|
|
resolveExecApprovalsFromFileMock.mockReturnValue({
|
|
agent: { security: "allowlist", ask: "on-miss" },
|
|
allowlist: [commandMarker, ...allowlistEntries],
|
|
file: { version: 1, agents: {} },
|
|
});
|
|
evaluateShellAllowlistMock.mockReturnValue({
|
|
allowlistMatches: [],
|
|
analysisOk: true,
|
|
allowlistSatisfied: false,
|
|
segments: [
|
|
{ resolution: null, argv: ["sh", "-c", "/bin/echo ok && /bin/date"] },
|
|
{ resolution: null, argv: ["missingcmd"] },
|
|
],
|
|
segmentAllowlistEntries: [null, null],
|
|
});
|
|
resolveAllowAlwaysPatternCoverageMock.mockReturnValue({
|
|
complete: false,
|
|
patterns: [{ pattern: "/bin/echo" }, { pattern: "/bin/date" }],
|
|
});
|
|
resolveExecHostApprovalContextMock.mockReturnValue({
|
|
approvals: { allowlist: [], file: { version: 1, agents: {} } },
|
|
hostSecurity: "allowlist",
|
|
hostAsk: "on-miss",
|
|
askFallback: "deny",
|
|
});
|
|
resolveApprovalDecisionOrUndefinedMock.mockResolvedValue(undefined);
|
|
|
|
const result = await executeNodeHostCommand({
|
|
command: 'sh -c "/bin/echo ok && /bin/date" && missingcmd',
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "allowlist",
|
|
ask: "on-miss",
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
});
|
|
|
|
expect(result.details?.status).toBe("approval-pending");
|
|
expect(registerExecApprovalRequestForHostOrThrowMock).toHaveBeenCalledTimes(1);
|
|
expect(requiresExecApprovalMock).toHaveBeenLastCalledWith(
|
|
expect.objectContaining({
|
|
allowlistSatisfied: false,
|
|
durableApprovalSatisfied: false,
|
|
}),
|
|
);
|
|
});
|
|
|
|
it("does not use unresolved node allow-always fallback for shell wrappers", async () => {
|
|
const allowlistEntry = {
|
|
pattern: "/trusted/bin/foo",
|
|
source: "allow-always" as const,
|
|
};
|
|
mockGatewayInvokesWithNodeApprovals({ version: 1, agents: {} });
|
|
usePolicyApprovalRequirementMock();
|
|
resolveExecApprovalsFromFileMock.mockReturnValue({
|
|
agent: { security: "allowlist", ask: "on-miss" },
|
|
allowlist: [allowlistEntry],
|
|
file: { version: 1, agents: {} },
|
|
});
|
|
evaluateShellAllowlistMock.mockReturnValue({
|
|
allowlistMatches: [],
|
|
analysisOk: true,
|
|
allowlistSatisfied: false,
|
|
segments: [{ resolution: null, argv: ["bash", "-lc", "foo && missingcmd"] }],
|
|
segmentAllowlistEntries: [null],
|
|
});
|
|
resolveAllowAlwaysPatternCoverageMock.mockReturnValue({ complete: false, patterns: [] });
|
|
resolveExecHostApprovalContextMock.mockReturnValue({
|
|
approvals: { allowlist: [], file: { version: 1, agents: {} } },
|
|
hostSecurity: "allowlist",
|
|
hostAsk: "on-miss",
|
|
askFallback: "deny",
|
|
});
|
|
resolveApprovalDecisionOrUndefinedMock.mockResolvedValue(undefined);
|
|
|
|
const result = await executeNodeHostCommand({
|
|
command: 'bash -lc "foo && missingcmd"',
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "allowlist",
|
|
ask: "on-miss",
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
});
|
|
|
|
expect(result.details?.status).toBe("approval-pending");
|
|
expect(registerExecApprovalRequestForHostOrThrowMock).toHaveBeenCalledTimes(1);
|
|
expect(requiresExecApprovalMock).toHaveBeenLastCalledWith(
|
|
expect.objectContaining({
|
|
allowlistSatisfied: false,
|
|
durableApprovalSatisfied: false,
|
|
}),
|
|
);
|
|
});
|
|
|
|
it("uses forwarded node env overrides for node approval prechecks", async () => {
|
|
const allowlistEntry = { pattern: "/trusted/bin/tool" };
|
|
mockGatewayInvokesWithNodeApprovals({ version: 1, agents: {} });
|
|
usePolicyApprovalRequirementMock();
|
|
resolveExecApprovalsFromFileMock.mockReturnValue({
|
|
agent: { security: "allowlist", ask: "on-miss" },
|
|
allowlist: [allowlistEntry],
|
|
file: { version: 1, agents: {} },
|
|
});
|
|
evaluateShellAllowlistMock.mockImplementation((raw: unknown) => {
|
|
const params = raw as ShellAllowlistMockParams;
|
|
const hasNodeAllowlist = (params.allowlist ?? []).length > 0;
|
|
return buildAllowlistEvalResult({
|
|
allowlistSatisfied:
|
|
hasNodeAllowlist &&
|
|
params.env != null &&
|
|
params.env.FOO === "bar" &&
|
|
params.env.PATH === "",
|
|
segmentAllowlistEntry: allowlistEntry,
|
|
});
|
|
});
|
|
resolveExecHostApprovalContextMock.mockReturnValue({
|
|
approvals: { allowlist: [], file: { version: 1, agents: {} } },
|
|
hostSecurity: "allowlist",
|
|
hostAsk: "on-miss",
|
|
askFallback: "deny",
|
|
});
|
|
|
|
const result = await executeNodeHostCommand({
|
|
command: "tool --version",
|
|
workdir: "/tmp/work",
|
|
env: { PATH: "/gateway/bin:/usr/bin" },
|
|
requestedEnv: { FOO: "bar" },
|
|
security: "allowlist",
|
|
ask: "on-miss",
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
});
|
|
|
|
expect(result.details?.status).toBe("completed");
|
|
expect(registerExecApprovalRequestForHostOrThrowMock).not.toHaveBeenCalled();
|
|
expect(requiresExecApprovalMock).toHaveBeenLastCalledWith(
|
|
expect.objectContaining({
|
|
analysisOk: true,
|
|
allowlistSatisfied: true,
|
|
durableApprovalSatisfied: false,
|
|
}),
|
|
);
|
|
expect(requireGatewayCommand("system.run.prepare").params?.params?.env).toEqual({
|
|
FOO: "bar",
|
|
});
|
|
expect(requireRunParams(requireGatewayCommand("system.run")).env).toEqual({ FOO: "bar" });
|
|
const evalEnvs = evaluateShellAllowlistMock.mock.calls.map(
|
|
([raw]) => (raw as ShellAllowlistMockParams).env,
|
|
);
|
|
expect(evalEnvs.length).toBeGreaterThanOrEqual(2);
|
|
expect(evalEnvs.every((env) => env != null && env.FOO === "bar" && env.PATH === "")).toBe(true);
|
|
});
|
|
|
|
it("skips approval prepare in full/off mode", async () => {
|
|
await executeNodeHostCommand({
|
|
command: "bun ./script.ts",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "full",
|
|
ask: "off",
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
notifyOnExit: false,
|
|
});
|
|
|
|
expect(callGatewayToolMock).toHaveBeenCalledTimes(1);
|
|
const call = requireGatewayCall(0);
|
|
expect(call.options.timeoutMs).toBe(35_000);
|
|
const runParams = requireRunParams(call);
|
|
expect(runParams.command).toEqual(["/bin/sh", "-lc", "bun ./script.ts"]);
|
|
expect(runParams.rawCommand).toBe("bun ./script.ts");
|
|
expect(typeof runParams.runId).toBe("string");
|
|
expect(runParams.suppressNotifyOnExit).toBe(true);
|
|
expect(runParams.timeoutMs).toBe(30_000);
|
|
expect(Object.hasOwn(runParams, "systemRunPlan")).toBe(false);
|
|
});
|
|
|
|
it("rejects disconnected node targets before invoking system.run", async () => {
|
|
listNodesMock.mockResolvedValueOnce([
|
|
{
|
|
nodeId: "node-1",
|
|
commands: ["system.run", "system.run.prepare"],
|
|
connected: false,
|
|
platform: process.platform,
|
|
},
|
|
]);
|
|
|
|
await expect(
|
|
executeNodeHostCommand({
|
|
command: "git log --oneline -5",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "allowlist",
|
|
ask: "off",
|
|
requestedNode: "node-1",
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
}),
|
|
).rejects.toThrow(
|
|
"exec host=node requires a connected node (node-1 is currently disconnected)",
|
|
);
|
|
expect(callGatewayToolMock).not.toHaveBeenCalled();
|
|
});
|
|
|
|
it("returns a non-empty placeholder for silent node exec results", async () => {
|
|
callGatewayToolMock.mockImplementationOnce(
|
|
async (method: string, _options: unknown, params: MockNodeInvokeParams | undefined) => {
|
|
if (method === "node.invoke" && params?.command === "system.run") {
|
|
return {
|
|
payload: {
|
|
success: true,
|
|
stdout: "",
|
|
stderr: "",
|
|
exitCode: 0,
|
|
timedOut: false,
|
|
},
|
|
};
|
|
}
|
|
throw new Error(`unexpected node invoke command: ${String(params?.command)}`);
|
|
},
|
|
);
|
|
|
|
const result = await executeNodeHostCommand({
|
|
command: "mkdir /tmp/quiet",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "full",
|
|
ask: "off",
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
});
|
|
|
|
expect(result.content).toEqual([{ type: "text", text: "(no output)" }]);
|
|
const details = result.details;
|
|
expect(details?.status).toBe("completed");
|
|
if (details?.status !== "completed") {
|
|
throw new Error(`expected completed details, got ${details?.status ?? "missing"}`);
|
|
}
|
|
expect(details.exitCode).toBe(0);
|
|
expect(details.aggregated).toBe("");
|
|
expect(details.cwd).toBe("/tmp/work");
|
|
});
|
|
|
|
it("forwards explicit timeouts to node system.run", async () => {
|
|
await executeNodeHostCommand({
|
|
command: "bun ./script.ts",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "full",
|
|
ask: "off",
|
|
timeoutSec: 12,
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
});
|
|
|
|
expectSystemRunInvoke({ invokeTimeoutMs: 17_000, runTimeoutMs: 12_000 });
|
|
});
|
|
|
|
it("normalizes unsafe explicit timeouts before invoking node system.run", async () => {
|
|
await executeNodeHostCommand({
|
|
command: "bun ./script.ts",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "full",
|
|
ask: "off",
|
|
timeoutSec: Number.POSITIVE_INFINITY,
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
});
|
|
|
|
expectSystemRunInvoke({ invokeTimeoutMs: 35_000, runTimeoutMs: 30_000 });
|
|
|
|
callGatewayToolMock.mockClear();
|
|
|
|
await executeNodeHostCommand({
|
|
command: "bun ./script.ts",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "full",
|
|
ask: "off",
|
|
timeoutSec: 3_000_000,
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
});
|
|
|
|
expectSystemRunInvoke({
|
|
invokeTimeoutMs: MAX_SAFE_TIMEOUT_DELAY_MS,
|
|
runTimeoutMs: MAX_SAFE_TIMEOUT_DELAY_MS,
|
|
});
|
|
|
|
callGatewayToolMock.mockClear();
|
|
|
|
await executeNodeHostCommand({
|
|
command: "bun ./script.ts",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "full",
|
|
ask: "off",
|
|
timeoutSec: Number.MAX_VALUE,
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
});
|
|
|
|
expectSystemRunInvoke({
|
|
invokeTimeoutMs: MAX_SAFE_TIMEOUT_DELAY_MS,
|
|
runTimeoutMs: MAX_SAFE_TIMEOUT_DELAY_MS,
|
|
});
|
|
});
|
|
|
|
it("forwards timeout zero to node system.run and keeps the invoke wait bounded", async () => {
|
|
await executeNodeHostCommand({
|
|
command: "bun ./script.ts",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "full",
|
|
ask: "off",
|
|
timeoutSec: 0,
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
});
|
|
|
|
expectSystemRunInvoke({ invokeTimeoutMs: 35_000, runTimeoutMs: 0 });
|
|
});
|
|
|
|
it("allows exec when requestedNode is display name matching boundNode's device", async () => {
|
|
listNodesMock.mockResolvedValue([
|
|
{
|
|
nodeId: "f2396b588d391d30a79d300e196a17cf197f34969b5e2485d2734c953567f44e",
|
|
displayName: "home-wsl-debian",
|
|
commands: ["system.run"],
|
|
platform: process.platform,
|
|
},
|
|
]);
|
|
const result = await executeNodeHostCommand({
|
|
command: "echo hello",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "full",
|
|
ask: "off",
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "test-agent",
|
|
sessionKey: "test-session",
|
|
boundNode: "f2396b588d391d30a79d300e196a17cf197f34969b5e2485d2734c953567f44e",
|
|
requestedNode: "home-wsl-debian",
|
|
});
|
|
expect(result.details?.status).toBeDefined();
|
|
});
|
|
|
|
it("allows exec when requestedNode is partial ID matching boundNode's device", async () => {
|
|
listNodesMock.mockResolvedValue([
|
|
{
|
|
nodeId: "f2396b588d391d30a79d300e196a17cf197f34969b5e2485d2734c953567f44e",
|
|
displayName: "home-wsl-debian",
|
|
commands: ["system.run"],
|
|
platform: process.platform,
|
|
},
|
|
]);
|
|
const result = await executeNodeHostCommand({
|
|
command: "echo hello",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "full",
|
|
ask: "off",
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "test-agent",
|
|
sessionKey: "test-session",
|
|
boundNode: "f2396b588d391d30a79d300e196a17cf197f34969b5e2485d2734c953567f44e",
|
|
requestedNode: "f2396b588d391d",
|
|
});
|
|
expect(result.details?.status).toBeDefined();
|
|
});
|
|
|
|
it("rejects exec when requestedNode resolves to a different node than boundNode", async () => {
|
|
listNodesMock.mockResolvedValue([
|
|
{
|
|
nodeId: "f2396b588d391d30a79d300e196a17cf197f34969b5e2485d2734c953567f44e",
|
|
displayName: "home-wsl-debian",
|
|
commands: ["system.run"],
|
|
platform: process.platform,
|
|
},
|
|
{
|
|
nodeId: "aaaa1111bbbb2222cccc3333dddd4444eeee5555ffff6666aaa7777bbb88889999",
|
|
displayName: "other-node",
|
|
commands: ["system.run"],
|
|
platform: process.platform,
|
|
},
|
|
]);
|
|
await expect(
|
|
executeNodeHostCommand({
|
|
command: "echo hello",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "full",
|
|
ask: "off",
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "test-agent",
|
|
sessionKey: "test-session",
|
|
boundNode: "f2396b588d391d30a79d300e196a17cf197f34969b5e2485d2734c953567f44e",
|
|
requestedNode: "other-node",
|
|
}),
|
|
).rejects.toThrow("exec node not allowed (bound to f2396b588d391d30");
|
|
});
|
|
|
|
it("preserves original error when requestedNode matches no known node", async () => {
|
|
listNodesMock.mockResolvedValue([
|
|
{
|
|
nodeId: "f2396b588d391d30a79d300e196a17cf197f34969b5e2485d2734c953567f44e",
|
|
displayName: "home-wsl-debian",
|
|
commands: ["system.run"],
|
|
platform: process.platform,
|
|
},
|
|
]);
|
|
await expect(
|
|
executeNodeHostCommand({
|
|
command: "echo hello",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "full",
|
|
ask: "off",
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "test-agent",
|
|
sessionKey: "test-session",
|
|
requestedNode: "nonexistent-node",
|
|
}),
|
|
).rejects.toThrow(
|
|
"requested node not found: nonexistent-node (unknown node: nonexistent-node)",
|
|
);
|
|
});
|
|
|
|
it("allows exec when boundNode is a display name matching the same device as requestedNode", async () => {
|
|
listNodesMock.mockResolvedValue([
|
|
{
|
|
nodeId: "f2396b588d391d30a79d300e196a17cf197f34969b5e2485d2734c953567f44e",
|
|
displayName: "home-wsl-debian",
|
|
commands: ["system.run"],
|
|
platform: process.platform,
|
|
},
|
|
]);
|
|
const result = await executeNodeHostCommand({
|
|
command: "echo hello",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "full",
|
|
ask: "off",
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "test-agent",
|
|
sessionKey: "test-session",
|
|
boundNode: "home-wsl-debian",
|
|
requestedNode: "home-wsl-debian",
|
|
});
|
|
expect(result.details?.status).toBeDefined();
|
|
});
|
|
|
|
it("auto-reviews strict inline-eval commands with full/off host policy when node policy is available", async () => {
|
|
const inlinePlan = {
|
|
argv: ["python3", "-c", "print(1)"],
|
|
cwd: "/tmp/work",
|
|
commandText: "python3 -c 'print(1)'",
|
|
commandPreview: null,
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
};
|
|
parsePreparedSystemRunPayloadMock.mockReturnValue({
|
|
plan: inlinePlan,
|
|
execPolicy: { security: "full", ask: "off" },
|
|
});
|
|
const autoReviewer = vi.fn<ExecAutoReviewer>(async () => ({
|
|
decision: "allow-once",
|
|
risk: "low",
|
|
rationale: "safe inline eval",
|
|
}));
|
|
detectInterpreterInlineEvalArgvMock.mockReturnValue(INLINE_EVAL_HIT);
|
|
evaluateShellAllowlistMock.mockReturnValue({
|
|
allowlistMatches: [],
|
|
analysisOk: true,
|
|
allowlistSatisfied: false,
|
|
segments: [
|
|
{
|
|
resolution: null,
|
|
argv: ["python3", "-c", "print(1)"],
|
|
raw: "python3 -c 'print(1)'",
|
|
},
|
|
],
|
|
segmentAllowlistEntries: [],
|
|
});
|
|
resolveExecHostApprovalContextMock.mockReturnValue({
|
|
approvals: { allowlist: [], file: { version: 1, agents: {} } },
|
|
hostSecurity: "full",
|
|
hostAsk: "off",
|
|
askFallback: "deny",
|
|
});
|
|
|
|
const result = await executeNodeHostCommand({
|
|
command: "python3 -c 'print(1)'",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "full",
|
|
ask: "off",
|
|
autoReview: true,
|
|
autoReviewer,
|
|
strictInlineEval: true,
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
});
|
|
|
|
expect(result.details?.status).toBe("completed");
|
|
expect(autoReviewer).toHaveBeenCalledWith(
|
|
expect.objectContaining({
|
|
command: "python3 -c 'print(1)'",
|
|
argv: ["python3", "-c", "print(1)"],
|
|
host: "node",
|
|
reason: "strict-inline-eval",
|
|
}),
|
|
);
|
|
expect(callGatewayToolMock).toHaveBeenCalledWith(
|
|
"exec.approvals.node.get",
|
|
{ timeoutMs: 10_000 },
|
|
{ nodeId: "node-1" },
|
|
);
|
|
});
|
|
|
|
it("denies timed-out inline-eval requests instead of invoking the node", async () => {
|
|
detectInterpreterInlineEvalArgvMock.mockReturnValue(INLINE_EVAL_HIT);
|
|
resolveApprovalDecisionOrUndefinedMock.mockResolvedValue(null);
|
|
createExecApprovalDecisionStateMock.mockReturnValue({
|
|
baseDecision: { timedOut: true },
|
|
approvedByAsk: true,
|
|
deniedReason: null,
|
|
});
|
|
enforceStrictInlineEvalApprovalBoundaryMock.mockReturnValue({
|
|
approvedByAsk: false,
|
|
deniedReason: "approval-timeout",
|
|
});
|
|
resolveExecHostApprovalContextMock.mockReturnValue({
|
|
approvals: { allowlist: [], file: { version: 1, agents: {} } },
|
|
hostSecurity: "full",
|
|
hostAsk: "off",
|
|
askFallback: "full",
|
|
});
|
|
|
|
const result = await executeNodeHostCommand({
|
|
command: "python3 -c 'print(1)'",
|
|
workdir: "/tmp/work",
|
|
env: {},
|
|
security: "full",
|
|
ask: "off",
|
|
strictInlineEval: true,
|
|
defaultTimeoutSec: 30,
|
|
approvalRunningNoticeMs: 0,
|
|
warnings: [],
|
|
agentId: "requested-agent",
|
|
sessionKey: "requested-session",
|
|
});
|
|
|
|
expect(result.details?.status).toBe("approval-pending");
|
|
await vi.waitFor(() => {
|
|
expect(sendExecApprovalFollowupResultMock).toHaveBeenCalledWith(
|
|
expect.objectContaining({
|
|
approvalId: "approval-1",
|
|
sessionKey: "requested-session",
|
|
}),
|
|
"Exec denied (node=node-1 id=approval-1, approval-timeout): python3 -c 'print(1)'",
|
|
);
|
|
});
|
|
expect(callGatewayToolMock).toHaveBeenCalledTimes(1);
|
|
});
|
|
});
|