Add AST-based security middleware and enforcement wiring

2026-02-23 14:21:22 -05:00
parent 9b4216dda9
commit ef2a25b5fb
28 changed files with 1936 additions and 37 deletions
--- a/tests/config.test.ts
+++ b/tests/config.test.ts
@@ -9,6 +9,8 @@ test("loads defaults and freezes config", () => {
  assert.equal(config.orchestration.maxDepth, 4);
  assert.equal(config.provisioning.portRange.basePort, 36000);
  assert.equal(config.discovery.fileRelativePath, ".agent-context/resources.json");
+  assert.equal(config.security.violationHandling, "hard_abort");
+  assert.equal(config.security.commandTimeoutMs, 120000);
  assert.equal(Object.isFrozen(config), true);
  assert.equal(Object.isFrozen(config.orchestration), true);
 });
@@ -20,3 +22,9 @@ test("validates boolean env values", () => {
  );
 });

+test("validates security violation mode", () => {
+  assert.throws(
+    () => loadConfig({ AGENT_SECURITY_VIOLATION_MODE: "retry_forever" }),
+    /invalid_union|Invalid input/i,
+  );
+});
--- a/tests/mcp-registry.test.ts
+++ b/tests/mcp-registry.test.ts
@@ -63,3 +63,34 @@ test("mcp registry rejects unknown explicit handlers", () => {
    /Unknown MCP handler/,
  );
 });
+
+test("mcp registry enforces tool clearance on resolved codex tool lists", () => {
+  const registry = createDefaultMcpRegistry();
+
+  const resolved = registry.resolveServerWithHandler({
+    serverName: "sandbox-tools",
+    server: {
+      type: "stdio",
+      command: "node",
+      args: ["server.js"],
+      enabled_tools: ["read_file", "write_file", "search"],
+      disabled_tools: ["legacy_tool"],
+    },
+    context: {},
+    fullConfig: {
+      servers: {},
+    },
+    toolClearance: {
+      allowlist: ["read_file", "search"],
+      banlist: ["search", "write_file"],
+    },
+  });
+
+  assert.ok(resolved.codex);
+  assert.deepEqual(resolved.codex.enabled_tools, ["read_file"]);
+  assert.deepEqual(resolved.codex.disabled_tools, [
+    "legacy_tool",
+    "search",
+    "write_file",
+  ]);
+});
--- a/tests/orchestration-engine.test.ts
+++ b/tests/orchestration-engine.test.ts
@@ -5,6 +5,7 @@ import { tmpdir } from "node:os";
 import { resolve } from "node:path";
 import { SchemaDrivenExecutionEngine } from "../src/agents/orchestration.js";
 import type { ActorExecutionResult } from "../src/agents/pipeline.js";
+import { SecurityViolationError } from "../src/security/index.js";

 function createManifest(): unknown {
  return {
@@ -191,6 +192,7 @@ test("runs DAG pipeline with state-dependent routing and retry behavior", async
      coder: async (input): Promise<ActorExecutionResult> => {
        assert.match(input.prompt, /AIOPS-123/);
        assert.deepEqual(input.toolClearance.allowlist, ["read_file", "write_file"]);
+        assert.ok(input.security);
        coderAttempts += 1;
        if (coderAttempts === 1) {
          return {
@@ -759,3 +761,158 @@ test("propagates abort signal into actor execution and stops the run", async ()
  await assert.rejects(() => runPromise, /(AbortError|manual-abort|aborted)/i);
  assert.equal(observedAbort, true);
 });
+
+test("hard-aborts pipeline on security violations by default", async () => {
+  const workspaceRoot = await mkdtemp(resolve(tmpdir(), "ai-ops-workspace-"));
+  const stateRoot = await mkdtemp(resolve(tmpdir(), "ai-ops-session-state-"));
+  const projectContextPath = resolve(stateRoot, "project-context.json");
+
+  const manifest = {
+    schemaVersion: "1",
+    topologies: ["retry-unrolled", "sequential"],
+    personas: [
+      {
+        id: "coder",
+        displayName: "Coder",
+        systemPromptTemplate: "Coder",
+        toolClearance: {
+          allowlist: ["git"],
+          banlist: [],
+        },
+      },
+    ],
+    relationships: [],
+    topologyConstraints: {
+      maxDepth: 3,
+      maxRetries: 2,
+    },
+    pipeline: {
+      entryNodeId: "secure-node",
+      nodes: [
+        {
+          id: "secure-node",
+          actorId: "secure_actor",
+          personaId: "coder",
+        },
+      ],
+      edges: [],
+    },
+  } as const;
+
+  const engine = new SchemaDrivenExecutionEngine({
+    manifest,
+    settings: {
+      workspaceRoot,
+      stateRoot,
+      projectContextPath,
+      maxDepth: 3,
+      maxRetries: 2,
+      maxChildren: 2,
+      runtimeContext: {},
+    },
+    actorExecutors: {
+      secure_actor: async () => {
+        throw new SecurityViolationError("blocked by policy", {
+          code: "TOOL_NOT_ALLOWED",
+        });
+      },
+    },
+  });
+
+  await assert.rejects(
+    () =>
+      engine.runSession({
+        sessionId: "session-security-hard-abort",
+        initialPayload: {
+          task: "Security hard abort",
+        },
+      }),
+    /blocked by policy/,
+  );
+});
+
+test("can map security violations to validation_fail for retry-unrolled remediation", async () => {
+  const workspaceRoot = await mkdtemp(resolve(tmpdir(), "ai-ops-workspace-"));
+  const stateRoot = await mkdtemp(resolve(tmpdir(), "ai-ops-session-state-"));
+  const projectContextPath = resolve(stateRoot, "project-context.json");
+
+  const manifest = {
+    schemaVersion: "1",
+    topologies: ["retry-unrolled", "sequential"],
+    personas: [
+      {
+        id: "coder",
+        displayName: "Coder",
+        systemPromptTemplate: "Coder",
+        toolClearance: {
+          allowlist: ["git"],
+          banlist: [],
+        },
+      },
+    ],
+    relationships: [],
+    topologyConstraints: {
+      maxDepth: 3,
+      maxRetries: 2,
+    },
+    pipeline: {
+      entryNodeId: "secure-node",
+      nodes: [
+        {
+          id: "secure-node",
+          actorId: "secure_actor",
+          personaId: "coder",
+          constraints: {
+            maxRetries: 1,
+          },
+        },
+      ],
+      edges: [],
+    },
+  } as const;
+
+  let attempts = 0;
+  const engine = new SchemaDrivenExecutionEngine({
+    manifest,
+    settings: {
+      workspaceRoot,
+      stateRoot,
+      projectContextPath,
+      maxDepth: 3,
+      maxRetries: 2,
+      maxChildren: 2,
+      securityViolationHandling: "validation_fail",
+      runtimeContext: {},
+    },
+    actorExecutors: {
+      secure_actor: async () => {
+        attempts += 1;
+        if (attempts === 1) {
+          throw new SecurityViolationError("first attempt blocked", {
+            code: "PATH_TRAVERSAL_BLOCKED",
+          });
+        }
+
+        return {
+          status: "success",
+          payload: {
+            fixed: true,
+          },
+        };
+      },
+    },
+  });
+
+  const result = await engine.runSession({
+    sessionId: "session-security-validation-retry",
+    initialPayload: {
+      task: "Security retry path",
+    },
+  });
+
+  assert.equal(result.status, "success");
+  assert.deepEqual(
+    result.records.map((record) => `${record.nodeId}:${record.status}:${String(record.attempt)}`),
+    ["secure-node:validation_fail:1", "secure-node:success:2"],
+  );
+});
--- a/tests/security-middleware.test.ts
+++ b/tests/security-middleware.test.ts
@@ -0,0 +1,125 @@
+import test from "node:test";
+import assert from "node:assert/strict";
+import { mkdtemp } from "node:fs/promises";
+import { tmpdir } from "node:os";
+import { resolve } from "node:path";
+import {
+  SecurityRulesEngine,
+  SecureCommandExecutor,
+  SecurityViolationError,
+  parseShellScript,
+} from "../src/security/index.js";
+
+test("shell parser extracts Command and Word nodes across chained expressions", () => {
+  const parsed = parseShellScript("FOO=bar git status && npm test | cat > logs/output.txt");
+
+  assert.equal(parsed.commandCount, 3);
+  assert.deepEqual(
+    parsed.commands.map((command) => command.binary),
+    ["git", "npm", "cat"],
+  );
+
+  const gitCommand = parsed.commands[0];
+  assert.ok(gitCommand);
+  assert.equal(gitCommand.assignments[0]?.key, "FOO");
+  assert.deepEqual(gitCommand.args, ["status"]);
+
+  const catCommand = parsed.commands[2];
+  assert.ok(catCommand);
+  assert.deepEqual(catCommand.redirects, ["logs/output.txt"]);
+});
+
+test("rules engine enforces binary allowlist, tool policy, and path boundaries", async () => {
+  const worktreeRoot = await mkdtemp(resolve(tmpdir(), "ai-ops-security-worktree-"));
+  const stateRoot = await mkdtemp(resolve(tmpdir(), "ai-ops-security-state-"));
+  const projectContextPath = resolve(stateRoot, "project-context.json");
+
+  const rules = new SecurityRulesEngine({
+    allowedBinaries: ["git", "npm", "cat"],
+    worktreeRoot,
+    protectedPaths: [stateRoot, projectContextPath],
+    requireCwdWithinWorktree: true,
+    rejectRelativePathTraversal: true,
+    enforcePathBoundaryOnArguments: true,
+    allowedEnvAssignments: [],
+    blockedEnvAssignments: [],
+  });
+
+  const allowed = rules.validateShellCommand({
+    command: "git status && npm test | cat > logs/output.txt",
+    cwd: worktreeRoot,
+    toolClearance: {
+      allowlist: ["git", "npm", "cat"],
+      banlist: [],
+    },
+  });
+
+  assert.equal(allowed.parsed.commandCount, 3);
+
+  assert.throws(
+    () =>
+      rules.validateShellCommand({
+        command: "cat ../secrets.txt",
+        cwd: worktreeRoot,
+      }),
+    (error) =>
+      error instanceof SecurityViolationError &&
+      error.code === "PATH_TRAVERSAL_BLOCKED",
+  );
+
+  assert.throws(
+    () =>
+      rules.validateShellCommand({
+        command: "git status",
+        cwd: stateRoot,
+      }),
+    (error) =>
+      error instanceof SecurityViolationError &&
+      error.code === "CWD_OUTSIDE_WORKTREE",
+  );
+});
+
+test("secure executor runs with explicit env policy", async () => {
+  const worktreeRoot = await mkdtemp(resolve(tmpdir(), "ai-ops-security-exec-"));
+
+  const rules = new SecurityRulesEngine({
+    allowedBinaries: ["echo"],
+    worktreeRoot,
+    protectedPaths: [],
+    requireCwdWithinWorktree: true,
+    rejectRelativePathTraversal: true,
+    enforcePathBoundaryOnArguments: true,
+    allowedEnvAssignments: [],
+    blockedEnvAssignments: [],
+  });
+
+  const executor = new SecureCommandExecutor({
+    rulesEngine: rules,
+    timeoutMs: 2000,
+    envPolicy: {
+      inherit: ["PATH", "HOME"],
+      scrub: ["SECRET_VALUE"],
+      inject: {
+        SAFE_VALUE: "ok",
+      },
+    },
+  });
+
+  let streamedStdout = "";
+  const result = await executor.execute({
+    command: "echo \"$SAFE_VALUE|$SECRET_VALUE\"",
+    cwd: worktreeRoot,
+    baseEnv: {
+      PATH: process.env.PATH,
+      HOME: process.env.HOME,
+      SECRET_VALUE: "hidden",
+    },
+    onStdoutChunk: (chunk) => {
+      streamedStdout += chunk;
+    },
+  });
+
+  assert.equal(result.exitCode, 0);
+  assert.equal(result.stdout, "ok|\n");
+  assert.equal(streamedStdout, result.stdout);
+});