Changes from 4 commits
4 changes: 4 additions & 0 deletions .env.example
@@ -35,6 +35,10 @@
# Development (optional)
# AGENT_VAULT_DEV_MODE=false # when true, allows internal/localhost hosts in proposals

# Sandbox mode for `agent-vault vault run` (optional)
# process (default, cooperative) | container (non-cooperative Docker sandbox with iptables egress lock)
# AGENT_VAULT_SANDBOX=process

# Observability (optional)
# AGENT_VAULT_LOG_LEVEL=info # info (default) | debug — debug emits one line per proxied request (no secret values)

1 change: 1 addition & 0 deletions CLAUDE.md
@@ -31,6 +31,7 @@ make docker # Multi-stage Docker image; data persisted at /data/.agent-vau
- Vault role: `proxy` < `member` < `admin`. Proxy can use the proxy and raise proposals; member can manage credentials/services; admin can invite humans.
- **KEK/DEK key wrapping**: A random DEK (Data Encryption Key) encrypts credentials and the CA key at rest (AES-256-GCM). If a master password is set, Argon2id derives a KEK (Key Encryption Key) that wraps the DEK; changing the password re-wraps the DEK without re-encrypting credentials. If no password is set (passwordless mode), the DEK is stored in plaintext — suitable for PaaS deploys where volume security is the trust boundary. Login uses email+password or Google OAuth. The first user to register becomes the instance owner and is auto-granted vault admin on `default`.
- **Agent skills are the agent-facing contract.** [cmd/skill_cli.md](cmd/skill_cli.md) and [cmd/skill_http.md](cmd/skill_http.md) are embedded into the binary, installed by `vault run`, and served publicly at `/v1/skills/{cli,http}`. They are the authoritative reference for what agents can do.
- **Two sandbox modes for `vault run`** (selected via `--sandbox` or `AGENT_VAULT_SANDBOX`): `process` (default, cooperative — fork+exec with `HTTPS_PROXY` envvars) and `container` (non-cooperative — Docker container with iptables egress locked to the Agent Vault proxy). Container mode lives in [internal/sandbox/](internal/sandbox/) with an embedded Dockerfile + init-firewall.sh + entrypoint.sh, built on first use and cached by content hash.

## Where to look for details

8 changes: 8 additions & 0 deletions README.md
@@ -87,6 +87,14 @@ agent-vault vault run -- claude

The agent calls APIs normally (e.g. `fetch("https://api.github.com/...")`). Agent Vault intercepts the request, injects the credential, and forwards it upstream. The agent never sees secrets.

For **non-cooperative** sandboxing — where the child physically cannot reach anything except the Agent Vault proxy, regardless of what it tries — launch it in a Docker container with egress locked down by iptables:

```bash
agent-vault vault run --sandbox=container -- claude
```

See [Container sandbox](https://docs.agent-vault.dev/guides/container-sandbox) for the threat model and flags.

### SDK — sandboxed agents (Docker, Daytona, E2B)

For agents running inside containers, use the SDK from your orchestrator to mint a session and pass proxy config into the sandbox:
94 changes: 55 additions & 39 deletions cmd/run.go
@@ -13,6 +13,7 @@ import (
"strings"
"syscall"

"github.com/Infisical/agent-vault/internal/sandbox"
"github.com/Infisical/agent-vault/internal/session"
"github.com/Infisical/agent-vault/internal/store"
"github.com/charmbracelet/huh"
@@ -25,6 +26,10 @@ var skillCLI string
//go:embed skill_http.md
var skillHTTP string

// sandboxMode is enum-typed so `--sandbox=foo` fails at flag-parse time
// with the allowed set, rather than deep inside RunE.
var sandboxMode SandboxMode
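
The `SandboxMode` definition is not part of this diff; a sketch of what such an enum-typed flag typically looks like, assuming a pflag.Value-style `String`/`Set`/`Type` implementation (names and error text are illustrative):

```go
package main

import "fmt"

// SandboxMode implements the three methods of pflag's Value interface,
// which is what lets cobra reject a bad --sandbox value at parse time.
type SandboxMode string

const (
	SandboxProcess   SandboxMode = "process"
	SandboxContainer SandboxMode = "container"
)

func (m *SandboxMode) String() string { return string(*m) }

// Set validates against the allowed set; cobra surfaces the error
// during flag parsing, before RunE ever executes.
func (m *SandboxMode) Set(v string) error {
	switch SandboxMode(v) {
	case SandboxProcess, SandboxContainer:
		*m = SandboxMode(v)
		return nil
	}
	return fmt.Errorf("must be one of: process, container (got %q)", v)
}

func (m *SandboxMode) Type() string { return "mode" }

func main() {
	var mode SandboxMode
	fmt.Println(mode.Set("container"), mode)
	fmt.Println(mode.Set("foo"))
}
```

The same `Set` method is what the `AGENT_VAULT_SANDBOX` fallback below reuses, so the env var gets identical validation to the flag.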

var runCmd = &cobra.Command{
Use: "run [flags] -- <command> [args...]",
Short: "Wrap an agent process with Agent Vault access",
@@ -53,6 +58,24 @@ Example:
Args: cobra.MinimumNArgs(1),
DisableFlagsInUseLine: true,
RunE: func(cmd *cobra.Command, args []string) error {
// 0. Resolve sandbox mode and validate flag compatibility before any
// network I/O — the user sees conflicts immediately, not after
// a slow session-mint round-trip.
mode := sandboxMode
if mode == "" {
if v := os.Getenv("AGENT_VAULT_SANDBOX"); v != "" {
if err := mode.Set(v); err != nil {
return fmt.Errorf("AGENT_VAULT_SANDBOX: %w", err)
}
}
}
if mode == "" {
mode = SandboxProcess
}
if err := validateSandboxFlagConflicts(cmd, mode); err != nil {
return err
}

// 1. Load the admin session from agent-vault auth login.
sess, err := ensureSession()
if err != nil {
@@ -78,6 +101,10 @@
return err
}

if mode == SandboxContainer {
return runContainer(cmd, args, scopedToken, addr, vault)
}

// 4. Resolve the target binary.
binary, err := exec.LookPath(args[0])
if err != nil {
@@ -276,23 +303,19 @@ func fetchUserVaults(addr, token string) ([]string, error) {
return names, nil
}

// mitmInjectedKeys is the set of env keys augmentEnvWithMITM manages on
// the child. Any pre-existing occurrence inherited from os.Environ() must
// be stripped before the new values are appended — POSIX getenv returns
// the *first* match in C code paths (glibc, curl, libcurl-backed Python),
// so a stale corporate HTTPS_PROXY from the parent shell would otherwise
// silently win and the MITM route would be bypassed entirely.
var mitmInjectedKeys = map[string]struct{}{
"HTTPS_PROXY": {},
"NO_PROXY": {},
"NODE_USE_ENV_PROXY": {},
"SSL_CERT_FILE": {},
"NODE_EXTRA_CA_CERTS": {},
"REQUESTS_CA_BUNDLE": {},
"CURL_CA_BUNDLE": {},
"GIT_SSL_CAINFO": {},
"DENO_CERT": {},
}
// mitmInjectedKeys is the keyset that BuildProxyEnv emits. Any
// pre-existing occurrence inherited from os.Environ() must be stripped
// before the new values are appended — POSIX getenv returns the *first*
// match in C code paths (glibc, curl, libcurl-backed Python), so a stale
// corporate HTTPS_PROXY from the parent shell would otherwise silently
// win and the MITM route would be bypassed entirely.
var mitmInjectedKeys = func() map[string]struct{} {
m := make(map[string]struct{}, len(sandbox.ProxyEnvKeys))
for _, k := range sandbox.ProxyEnvKeys {
m[k] = struct{}{}
}
return m
}()

// stripEnvKeys returns env with every entry whose key (the part before
// '=') appears in keys removed. Case-sensitive, matching how the kernel
@@ -359,30 +382,16 @@ func augmentEnvWithMITM(env []string, addr, token, vault, caPath string) ([]stri
mitmHost = h
}
}
scheme := "http"
if mitmTLS {
scheme = "https"
}
proxyURL := (&url.URL{
Scheme: scheme,
User: url.UserPassword(token, vault),
Host: fmt.Sprintf("%s:%d", mitmHost, port),
}).String()

env = stripEnvKeys(env, mitmInjectedKeys)
// CA trust variables must stay in sync with buildProxyEnv() in
// sdks/sdk-typescript/src/resources/sessions.ts.
env = append(env,
"HTTPS_PROXY="+proxyURL,
"NO_PROXY=localhost,127.0.0.1",
"NODE_USE_ENV_PROXY=1",
"SSL_CERT_FILE="+caPath,
"NODE_EXTRA_CA_CERTS="+caPath,
"REQUESTS_CA_BUNDLE="+caPath,
"CURL_CA_BUNDLE="+caPath,
"GIT_SSL_CAINFO="+caPath,
"DENO_CERT="+caPath,
)
env = append(env, sandbox.BuildProxyEnv(sandbox.ProxyEnvParams{
Host: mitmHost,
Port: port,
Token: token,
Vault: vault,
CAPath: caPath,
MITMTLS: mitmTLS,
})...)
return env, port, true, nil
}

@@ -440,5 +449,12 @@ func init() {
runCmd.Flags().Int("ttl", 0, "Session TTL in seconds (300–604800; default: server default 24h)")
runCmd.Flags().Bool("no-mitm", false, "Skip HTTPS_PROXY/CA env injection for the child (explicit /proxy only)")

runCmd.Flags().Var(&sandboxMode, "sandbox", "Sandbox mode: process (default) or container")
runCmd.Flags().String("image", "", "Container image override (requires --sandbox=container)")
runCmd.Flags().StringArray("mount", nil, "Extra bind mount src:dst[:ro] (repeatable; requires --sandbox=container)")
runCmd.Flags().Bool("keep", false, "Don't pass --rm to docker (requires --sandbox=container)")
runCmd.Flags().Bool("no-firewall", false, "Skip iptables egress rules inside the container (requires --sandbox=container; debug only)")
runCmd.Flags().Bool("home-volume-shared", false, "Share /home/claude/.claude across invocations (requires --sandbox=container); default is a per-invocation volume, losing auth state but avoiding concurrency corruption")

vaultCmd.AddCommand(runCmd)
}
171 changes: 171 additions & 0 deletions cmd/run_container.go
@@ -0,0 +1,171 @@
package cmd

import (
"context"
"errors"
"fmt"
"net/url"
"os"
"os/exec"
"runtime"
"strconv"
"syscall"
"time"

"github.com/spf13/cobra"
"golang.org/x/term"

"github.com/Infisical/agent-vault/internal/sandbox"
)

// containerOnlyFlags are no-ops in process mode; we reject them explicitly
// rather than silently ignoring them, which would be a foot-gun.
var containerOnlyFlags = []string{"image", "mount", "keep", "no-firewall", "home-volume-shared"}

func validateSandboxFlagConflicts(cmd *cobra.Command, mode SandboxMode) error {
if mode == SandboxContainer {
return nil
}
for _, name := range containerOnlyFlags {
f := cmd.Flags().Lookup(name)
if f == nil {
continue
}
if f.Changed {
return fmt.Errorf("--%s requires --sandbox=container", name)
}
}
return nil
Comment on lines +31 to +48

🟡 The --no-mitm flag is silently accepted and ignored when --sandbox=container is used, even though container mode always routes through MITM and cannot bypass it. This is inconsistent with the design principle stated in the adjacent code, which rejects container-only flags in process mode "rather than silently ignoring them, which would be a foot-gun"; the same principle should apply symmetrically to process-only flags in container mode.

Extended reasoning...

What the bug is and how it manifests

validateSandboxFlagConflicts (cmd/run_container.go:25-38) returns nil immediately when mode == SandboxContainer, skipping any validation of process-only flags. As a result, agent-vault vault run --no-mitm --sandbox=container -- claude accepts the flag without error or warning, even though --no-mitm has absolutely zero effect in container mode — the container path always calls fetchMITMCA and always routes all traffic through the MITM proxy.

The specific code path that triggers it

When the user passes --no-mitm --sandbox=container, validateSandboxFlagConflicts is called at cmd/run.go:75, but returns immediately at the if mode == SandboxContainer { return nil } branch on run_container.go:27. runContainer never calls cmd.Flags().GetBool("no-mitm") at any point — the flag is simply never consulted. The code even documents this on run_container.go:62: "Container mode always routes through MITM — --no-mitm is a process-mode-only escape hatch."

Why existing code doesn't prevent it

The containerOnlyFlags list only enumerates flags that are container-only (image, mount, keep, no-firewall, home-volume-shared). There is no corresponding list of process-only flags (like --no-mitm) that should be rejected in container mode. The validation function is asymmetric by construction.

Why the design principle demands symmetry

The comment on lines 21-23 explicitly states the governing rule: "containerOnlyFlags are no-ops in process mode; we reject them explicitly rather than silently ignoring them, which would be a foot-gun." This exact principle applies in reverse: --no-mitm is a no-op in container mode. A user who passes it may reasonably believe the MITM proxy is bypassed — particularly because --no-mitm is a meaningful, effective escape hatch in process mode (it disables all HTTPS_PROXY injection entirely).

Impact

No security regression: container mode enforces MITM at the iptables level regardless of what flags are passed, so the MITM is never actually bypassed. The impact is purely UX/correctness — a user who passes --no-mitm --sandbox=container gets no feedback that their flag is a no-op, which contradicts the stated design principle and could mislead the operator about the sandbox's actual network behavior.

Step-by-step proof

  1. User runs: agent-vault vault run --no-mitm --sandbox=container -- claude
  2. RunE resolves mode = SandboxContainer and calls validateSandboxFlagConflicts(cmd, SandboxContainer)
  3. validateSandboxFlagConflicts hits line 27: if mode == SandboxContainer { return nil } — returns immediately with no error
  4. RunE proceeds to runContainer(cmd, args, ...) (cmd/run.go:101-103)
  5. runContainer calls fetchMITMCA unconditionally (line ~60) and routes all HTTPS through MITM — --no-mitm is never read
  6. User believes MITM is disabled; MITM is fully active

How to fix

Add a processOnlyFlags list (e.g. ["no-mitm"]) and check it symmetrically inside validateSandboxFlagConflicts when mode == SandboxContainer, returning an error such as "--no-mitm is not supported in container mode (MITM is always active)". Alternatively, emit a fmt.Fprintf(os.Stderr, "warning: --no-mitm has no effect in container mode") instead of a hard error, matching the pattern used by --no-firewall.
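
A minimal sketch of that symmetric check, with cobra's `Flags().Changed` lookups stood in by a plain map; the `processOnlyFlags` list and error texts are assumptions, while `containerOnlyFlags` matches the list in the diff:

```go
package main

import "fmt"

// Flags meaningful in only one sandbox mode.
var containerOnlyFlags = []string{"image", "mount", "keep", "no-firewall", "home-volume-shared"}
var processOnlyFlags = []string{"no-mitm"} // hypothetical, per the suggested fix

// validate rejects mode-incompatible flags in both directions.
// `changed` stands in for cobra's FlagSet.Changed; mode is
// "process" or "container".
func validate(mode string, changed map[string]bool) error {
	deny, reason := containerOnlyFlags, "requires --sandbox=container"
	if mode == "container" {
		deny, reason = processOnlyFlags, "has no effect in container mode (MITM is always active)"
	}
	for _, name := range deny {
		if changed[name] {
			return fmt.Errorf("--%s %s", name, reason)
		}
	}
	return nil
}

func main() {
	fmt.Println(validate("container", map[string]bool{"no-mitm": true}))
	fmt.Println(validate("process", map[string]bool{"keep": true}))
	fmt.Println(validate("process", map[string]bool{"no-mitm": true}))
}
```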

}

// runContainer launches the target agent inside a Docker container with
// egress locked to the agent-vault proxy via iptables.
func runContainer(cmd *cobra.Command, args []string, scopedToken, addr, vault string) error {
if runtime.GOOS != "linux" && runtime.GOOS != "darwin" {
return fmt.Errorf("--sandbox=container: only linux and darwin are supported in v1 (got %s)", runtime.GOOS)
}
if _, err := exec.LookPath("docker"); err != nil {
return errors.New("--sandbox=container: `docker` not found in PATH")
}

ctx := cmd.Context()
if ctx == nil {
ctx = context.Background()
}

// Housekeeping: trim old CA tempfiles and networks from crashed runs
// before we create new ones. Both are best-effort.
sandbox.PruneHostCAFiles()
_ = sandbox.PruneStaleNetworks(ctx, sandbox.DefaultPruneGrace)

// Pull the MITM CA from the server. Container mode always routes
// through MITM — --no-mitm is a process-mode-only escape hatch.
pem, mitmPort, mitmEnabled, mitmTLS, err := fetchMITMCA(addr)
if err != nil {
return fmt.Errorf("fetch MITM CA: %w", err)
}
if !mitmEnabled {
return errors.New("--sandbox=container requires the MITM proxy; server has it disabled")
}
if mitmPort == 0 {
mitmPort = DefaultMITMPort
}

// Upstream agent-vault HTTP port for the forwarder. Parsed from
// --address / session address, with DefaultPort as a fallback.
upstreamHTTPPort := DefaultPort
if u, perr := url.Parse(addr); perr == nil {
if p, cerr := strconv.Atoi(u.Port()); cerr == nil && p > 0 {
upstreamHTTPPort = p
}
}

sessionID, err := sandbox.NewSessionID()
if err != nil {
return err
}

hostCAPath, err := sandbox.WriteHostCAFile(pem, sessionID)
if err != nil {
return fmt.Errorf("write CA: %w", err)
}

network, err := sandbox.CreatePerInvocationNetwork(ctx, sessionID)
if err != nil {
return fmt.Errorf("create docker network: %w", err)
}
defer func() {
// Only runs on error arms — syscall.Exec below replaces the
// process, bypassing defers. Use a detached context so a
// parent ctx cancel doesn't skip the cleanup exec itself.
cleanup, cancel := context.WithTimeout(context.Background(), 5*time.Second)
defer cancel()
_ = sandbox.RemoveNetwork(cleanup, network.Name)
}()

bindIP := sandbox.HostBindIP(network)
if bindIP == nil {
return errors.New("could not determine host bind IP for forwarder")
}

fwd, err := sandbox.StartForwarder(ctx, bindIP, upstreamHTTPPort, mitmPort)
if err != nil {
return fmt.Errorf("start forwarder: %w", err)
}
defer func() { _ = fwd.Close() }()

image, _ := cmd.Flags().GetString("image")
imageRef, err := sandbox.EnsureImage(ctx, image, os.Stderr)
if err != nil {
return err
}

workDir, err := os.Getwd()
if err != nil {
return fmt.Errorf("getwd: %w", err)
}

Comment on lines +146 to +150

🔴 The current working directory is bind-mounted read-write at /workspace without the same ~/.agent-vault protection applied to user-supplied --mount flags. If a user runs vault run --sandbox=container while CWD is inside ~/.agent-vault (or a symlink resolving there), the vault directory — containing the encrypted credential database, the MITM CA private key, and session tokens — is exposed read-write to the container. The fix is to call validateHostSrc(workDir, home) on the os.Getwd() result before passing it to BuildRunArgs, mirroring the protection already applied to --mount entries.

Extended reasoning...

The bug

In cmd/run_container.go (lines 123–138), workDir is obtained via os.Getwd() and passed directly as Config.WorkDir to sandbox.BuildRunArgs. Inside BuildRunArgs (docker.go:103), it is added unconditionally as -v cfg.WorkDir:/workspace with no path validation whatsoever.

Existing protection is asymmetric

User-supplied --mount values flow through parseAndValidateMount → validateHostSrc (docker.go:152–175), which calls filepath.EvalSymlinks to resolve symlinks and then checks whether the resolved path equals or is nested under ~/.agent-vault. The workDir path skips this check entirely. The protection intent is explicit and deliberate in the --mount path; its absence on the workspace mount is an oversight.

Step-by-step proof

  1. Developer has agent-vault installed locally with a vault at ~/.agent-vault/.
  2. Developer navigates: cd ~/.agent-vault
  3. Developer runs: agent-vault vault run --sandbox=container -- claude
  4. os.Getwd() returns /home/user/.agent-vault
  5. BuildRunArgs appends -v /home/user/.agent-vault:/workspace to the docker argv
  6. The container starts with the entire vault directory mounted read-write at /workspace
  7. The container agent can now: read ca/ca.pem (MITM CA private key used to sign TLS leaves for all intercepted HTTPS traffic), read vault.db (credential database), and overwrite any of these files (key replacement attack)

The same scenario triggers if CWD is any subdirectory of ~/.agent-vault, or if a symlink in a normal-looking path resolves to somewhere under ~/.agent-vault.

Impact

In passwordless mode (DEK stored in plaintext — the documented default for local/PaaS use), the CA private key stored under ~/.agent-vault/ca/ is directly readable and the database is decryptable. In password-protected mode, write access allows an attacker to replace the CA key so future MITM intercepts use an attacker-controlled key. Both scenarios violate the core sandbox guarantee. The iptables egress lock is not relevant here — the attacker reads/writes the host filesystem via the bind mount, not the network.

Fix

Before passing workDir to BuildRunArgs, call the already-existing validateHostSrc (or an exported wrapper) with the os.UserHomeDir() result. This brings the workspace mount in line with the protection already applied to user-supplied mounts. Alternatively, BuildRunArgs itself could apply the check when cfg.WorkDir is set, since it already calls os.UserHomeDir() for the --mount path.

env := sandbox.BuildContainerEnv(scopedToken, vault, fwd.HTTPPort, fwd.MITMPort, mitmTLS)

mounts, _ := cmd.Flags().GetStringArray("mount")
keep, _ := cmd.Flags().GetBool("keep")
noFirewall, _ := cmd.Flags().GetBool("no-firewall")
homeShared, _ := cmd.Flags().GetBool("home-volume-shared")

dockerArgs, err := sandbox.BuildRunArgs(sandbox.Config{
ImageRef: imageRef,
SessionID: sessionID,
WorkDir: workDir,
HostCAPath: hostCAPath,
NetworkName: network.Name,
AttachTTY: term.IsTerminal(int(os.Stdin.Fd())),
Keep: keep,
NoFirewall: noFirewall,
HomeVolumeShared: homeShared,
Mounts: mounts,
Env: env,
CommandArgs: args,
})
if err != nil {
return err
}

dockerBin, err := exec.LookPath("docker")
if err != nil {
return err
}

if noFirewall {
fmt.Fprintln(os.Stderr, "agent-vault: WARNING --no-firewall active, container egress is unrestricted")
}
fmt.Fprintf(os.Stderr, "%s routing container HTTPS through MITM on %s:%d (container view: host.docker.internal:%d)\n",
successText("agent-vault:"), bindIP, fwd.MITMPort, fwd.MITMPort)
fmt.Fprintf(os.Stderr, "%s starting %s in sandbox (%s)...\n\n",
successText("agent-vault:"), boldText(args[0]), network.Name)

// Exec docker directly so the controlling TTY, SIGINT, SIGWINCH
// propagate naturally. Listeners are FD_CLOEXEC so they close at
// exec; per-conn forwarder goroutines die with the replaced process
// image. On success this never returns.
return syscall.Exec(dockerBin, append([]string{"docker"}, dockerArgs...), os.Environ())
}