From d70b4392a0e426ff3d94de2fc37ca0744370b937 Mon Sep 17 00:00:00 2001
From: Jeonghwan Lee <jhlee@cryptolab.co.kr>
Date: Mon, 27 Apr 2026 12:02:08 +0900
Subject: [PATCH 01/27] feat: migrate vault to Go gRPC service (runevault)
 (#61)

---
 .gitignore                                    |   8 +
 .mise.ci.toml                                 |  15 +-
 .mise.toml                                    | 152 ++---
 AGENTS.md                                     |  46 +-
 CLAUDE.md                                     |  48 +-
 CONTRIBUTING.md                               |  59 +-
 pyproject.toml                                |  14 -
 requirements.txt                              |  24 -
 tests/integration/__init__.py                 |   1 -
 tests/integration/test_decrypt_pipeline.py    | 155 -----
 tests/requirements.txt                        |  10 -
 tests/unit/__init__.py                        |   1 -
 tests/unit/test_admin_server.py               | 209 ------
 tests/unit/test_audit.py                      | 250 -------
 tests/unit/test_auth.py                       | 147 -----
 tests/unit/test_decrypt_scores.py             | 226 -------
 tests/unit/test_metadata_dek.py               | 164 -----
 tests/unit/test_protovalidate.py              | 141 ----
 tests/unit/test_public_key.py                 |  96 ---
 tests/unit/test_request_validator.py          | 101 ---
 tests/unit/test_token_store.py                | 316 ---------
 tests/unit/test_validation_interceptor.py     | 196 ------
 vault/.env.example                            |  62 --
 vault/Dockerfile                              |  55 --
 vault/admin_server.py                         | 232 -------
 vault/audit.py                                | 153 -----
 vault/buf.gen.yaml                            |  13 +
 vault/docker-compose.yml                      |  62 --
 vault/docker-entrypoint.sh                    |  80 ---
 vault/go.mod                                  |  29 +
 vault/go.sum                                  |  71 ++
 vault/internal/commands/adminclient.go        | 119 ++++
 vault/internal/commands/adminclient_test.go   | 120 ++++
 vault/internal/commands/duration.go           |  27 +
 vault/internal/commands/role.go               | 172 +++++
 vault/internal/commands/token.go              | 192 ++++++
 vault/internal/commands/version.go            |  28 +
 vault/internal/crypto/keys.go                 | 118 ++++
 vault/internal/crypto/keys_test.go            |  49 ++
 vault/internal/crypto/metadata.go             | 105 +++
 vault/internal/crypto/metadata_test.go        | 223 +++++++
 vault/internal/server/audit.go                | 181 ++++++
 vault/internal/server/audit_test.go           | 156 +++++
 vault/internal/server/grpc_test.go            | 205 ++++++
 vault/internal/server/helpers_test.go         |  25 +
 vault/internal/server/interceptors.go         |  85 +++
 vault/internal/server/interceptors_test.go    | 105 +++
 vault/internal/tests/decrypt_pipeline_test.go | 316 +++++++++
 vault/internal/tests/fixtures.go              |  36 ++
 vault/internal/tokens/errors.go               |  43 ++
 vault/internal/tokens/ratelimit.go            |  72 +++
 vault/internal/tokens/ratelimit_test.go       |  88 +++
 vault/internal/tokens/role.go                 |  66 ++
 vault/internal/tokens/store.go                | 612 ++++++++++++++++++
 vault/internal/tokens/store_test.go           | 563 ++++++++++++++++
 vault/internal/tokens/token.go                |  29 +
 vault/pkg/vaultpb/vault_service.pb.go         | 499 ++++++++++++++
 vault/pkg/vaultpb/vault_service_grpc.pb.go    | 209 ++++++
 vault/proto/__init__.py                       |   0
 vault/request_validator.py                    |  96 ---
 vault/requirements.txt                        |  20 -
 vault/scripts/proto-gen.sh                    |  52 --
 vault/token_store.py                          | 580 -----------------
 vault/validation_interceptor.py               |  65 --
 vault/vault_admin_cli.py                      | 250 -------
 vault/vault_core.py                           | 326 ----------
 vault/vault_grpc_server.py                    | 375 -----------
 vault/verify_crypto_flow.py                   |  93 ---
 68 files changed, 4711 insertions(+), 4725 deletions(-)
 delete mode 100644 pyproject.toml
 delete mode 100644 requirements.txt
 delete mode 100644 tests/integration/__init__.py
 delete mode 100644 tests/integration/test_decrypt_pipeline.py
 delete mode 100644 tests/requirements.txt
 delete mode 100644 tests/unit/__init__.py
 delete mode 100644 tests/unit/test_admin_server.py
 delete mode 100644 tests/unit/test_audit.py
 delete mode 100644 tests/unit/test_auth.py
 delete mode 100644 tests/unit/test_decrypt_scores.py
 delete mode 100644 tests/unit/test_metadata_dek.py
 delete mode 100644 tests/unit/test_protovalidate.py
 delete mode 100644 tests/unit/test_public_key.py
 delete mode 100644 tests/unit/test_request_validator.py
 delete mode 100644 tests/unit/test_token_store.py
 delete mode 100644 tests/unit/test_validation_interceptor.py
 delete mode 100644 vault/.env.example
 delete mode 100644 vault/Dockerfile
 delete mode 100644 vault/admin_server.py
 delete mode 100644 vault/audit.py
 create mode 100644 vault/buf.gen.yaml
 delete mode 100644 vault/docker-compose.yml
 delete mode 100755 vault/docker-entrypoint.sh
 create mode 100644 vault/go.mod
 create mode 100644 vault/go.sum
 create mode 100644 vault/internal/commands/adminclient.go
 create mode 100644 vault/internal/commands/adminclient_test.go
 create mode 100644 vault/internal/commands/duration.go
 create mode 100644 vault/internal/commands/role.go
 create mode 100644 vault/internal/commands/token.go
 create mode 100644 vault/internal/commands/version.go
 create mode 100644 vault/internal/crypto/keys.go
 create mode 100644 vault/internal/crypto/keys_test.go
 create mode 100644 vault/internal/crypto/metadata.go
 create mode 100644 vault/internal/crypto/metadata_test.go
 create mode 100644 vault/internal/server/audit.go
 create mode 100644 vault/internal/server/audit_test.go
 create mode 100644 vault/internal/server/grpc_test.go
 create mode 100644 vault/internal/server/helpers_test.go
 create mode 100644 vault/internal/server/interceptors.go
 create mode 100644 vault/internal/server/interceptors_test.go
 create mode 100644 vault/internal/tests/decrypt_pipeline_test.go
 create mode 100644 vault/internal/tests/fixtures.go
 create mode 100644 vault/internal/tokens/errors.go
 create mode 100644 vault/internal/tokens/ratelimit.go
 create mode 100644 vault/internal/tokens/ratelimit_test.go
 create mode 100644 vault/internal/tokens/role.go
 create mode 100644 vault/internal/tokens/store.go
 create mode 100644 vault/internal/tokens/store_test.go
 create mode 100644 vault/internal/tokens/token.go
 create mode 100644 vault/pkg/vaultpb/vault_service.pb.go
 create mode 100644 vault/pkg/vaultpb/vault_service_grpc.pb.go
 delete mode 100644 vault/proto/__init__.py
 delete mode 100644 vault/request_validator.py
 delete mode 100644 vault/requirements.txt
 delete mode 100755 vault/scripts/proto-gen.sh
 delete mode 100644 vault/token_store.py
 delete mode 100644 vault/validation_interceptor.py
 delete mode 100644 vault/vault_admin_cli.py
 delete mode 100644 vault/vault_core.py
 delete mode 100644 vault/vault_grpc_server.py
 delete mode 100644 vault/verify_crypto_flow.py

diff --git a/.gitignore b/.gitignore
index ab447f1..11762c3 100644
--- a/.gitignore
+++ b/.gitignore
@@ -96,6 +96,11 @@ Thumbs.db
 *.dll
 *.dylib
 
+# Go build artifacts
+vault/bin/
+vault/**/*.test
+vault/**/*.out
+
 # Database
 *.db
 *.sqlite
@@ -114,3 +119,6 @@ test-results/
 
 # Test fixtures (plaintext — decrypted from fixtures.tar.gz.gpg)
 tests/fixtures/
+
+# Local dev runtime files (config, socket, keys, pid)
+vault/dev/
diff --git a/.mise.ci.toml b/.mise.ci.toml
index 38b2877..c539fbb 100644
--- a/.mise.ci.toml
+++ b/.mise.ci.toml
@@ -1,11 +1,6 @@
-# CI-only tool configuration
-# Used by setting MISE_ENV=ci in GitHub Actions workflows
+# CI environment overrides — merged on top of .mise.toml when MISE_ENV=ci.
+# Tasks are inherited from .mise.toml; only CI-specific settings go here.
 
-[tools]
-python = "3.12"
-buf = "1.66"
-ruff = "0.15"
-
-[env]
-_.python.venv = { path = ".venv", create = true }
-PYTHONPATH = "{{config_root}}/vault/proto:{{config_root}}/vault"
+# Only install tools required for build and test; skip deployment tools.
+[settings]
+enable_tools = ["go", "buf"]
diff --git a/.mise.toml b/.mise.toml
index c2bbd3f..267684b 100644
--- a/.mise.toml
+++ b/.mise.toml
@@ -1,12 +1,11 @@
 # Rune-Vault Development Environment
 # Run `mise install` to set up all tools, then `mise run setup` to bootstrap.
-# Prerequisites: mise (https://mise.jdx.dev), Docker (https://docs.docker.com/get-docker)
+# Prerequisites: mise (https://mise.jdx.dev)
 
 # ── Core development tools ───────────────────────────────────────────
 [tools]
-python = "3.12"
+go = "1.25"
 buf = "1.66"
-ruff = "0.15"
 
 # ── Deployment tools (install with: mise install) ────────────────────
 # These are needed only for cloud deployment, not for local development.
@@ -15,127 +14,118 @@ terraform = "1.14"
 gcloud = "562"
 oci = "3"
 
-# ── Environment variables ────────────────────────────────────────────
 [env]
-_.python.venv = { path = ".venv", create = true }
-PYTHONPATH = "{{config_root}}/vault/proto:{{config_root}}/vault"
-
-# ── Docker image settings ───────────────────────────────────────────
-[vars]
-docker_image = "ghcr.io/cryptolabinc/rune-vault"
-docker_builder = "rune-vault-builder"
-docker_platforms = "linux/amd64,linux/arm64"
+CGO_ENABLED = "1"
 
 # ── Tasks ────────────────────────────────────────────────────────────
 
 [tasks.setup]
-description = "Bootstrap development environment (venv + dependencies)"
+description = "Bootstrap development environment (Go modules + proto stubs)"
 run = """
 #!/usr/bin/env bash
 set -euo pipefail
 
-echo "==> Installing vault dependencies..."
-pip install -q -r vault/requirements.txt
-
-echo "==> Installing test dependencies..."
-pip install -q -r tests/requirements.txt
+echo "==> Resolving Go modules..."
+cd vault && go mod download && cd ..
 
-echo "==> Generating proto stubs..."
-cd vault && bash scripts/proto-gen.sh && cd ..
+echo "==> Generating Go proto stubs..."
+cd vault && buf generate && cd ..
 
 echo "==> Configuring git hooks..."
 git config core.hooksPath .githooks
 
 echo ""
 echo "Development environment ready."
-echo "Run 'mise run test' to verify."
+echo "Run 'mise run check' to verify."
 """
 
-[tasks.test]
-description = "Run unit and integration tests"
-run = "python -m pytest tests/unit tests/integration -v"
-
-[tasks."test:unit"]
-description = "Run unit tests only"
-run = "python -m pytest tests/unit -v"
-
-[tasks."test:cov"]
-description = "Run tests with coverage report"
-run = "python -m pytest tests/unit tests/integration --cov=vault --cov-report=term-missing -v"
-
-[tasks.lint]
-description = "Run ruff linter"
-run = "ruff check vault/"
-
-[tasks."lint:fix"]
-description = "Run ruff linter with auto-fix"
-run = "ruff check vault/ --fix"
-
-[tasks.format]
-description = "Format code with ruff"
-run = "ruff format vault/"
-
-[tasks."format:check"]
-description = "Check code formatting without modifying"
-run = "ruff format --check vault/"
-
 [tasks.check]
-description = "Run all quality checks (format + lint + test)"
+description = "Run all quality checks (gofmt + go vet + unit tests)"
 run = """
 #!/usr/bin/env bash
 set -euo pipefail
-echo "==> Checking format..."
-ruff format --check vault/
-echo "==> Linting..."
-ruff check vault/
-echo "==> Running tests..."
-python -m pytest tests/unit -v
+cd vault
+echo "==> Checking Go format..."
+diff=$(gofmt -l .)
+if [ -n "$diff" ]; then
+  echo "gofmt found unformatted files:" >&2
+  echo "$diff" >&2
+  exit 1
+fi
+echo "==> go vet..."
+go vet ./...
+echo "==> Running unit tests..."
+go test -race ./...
 echo ""
 echo "All checks passed."
 """
 
-[tasks.proto]
-description = "Regenerate protobuf/gRPC stubs"
-run = "cd vault && bash scripts/proto-gen.sh"
+[tasks."proto:go"]
+description = "Regenerate Go protobuf/gRPC stubs into vault/pkg/vaultpb"
+run = "cd vault && buf generate"
 
-[tasks.build]
-description = "Build Docker image locally (via buildx)"
+[tasks."go:build"]
+description = "Build runevault binary to vault/bin/runevault"
 run = """
 #!/usr/bin/env bash
 set -euo pipefail
-TAG="{{arg(name="tag", default="latest")}}"
+VERSION="${VERSION:-dev}"
+COMMIT=$(git rev-parse --short HEAD 2>/dev/null || echo "none")
+DATE=$(date -u +%Y-%m-%dT%H:%M:%SZ)
+PKG="github.com/CryptoLabInc/rune-admin/vault/internal/commands"
+cd vault && go build \
+  -o bin/runevault \
+  -ldflags "-X '${PKG}.buildVersion=${VERSION}' -X '${PKG}.buildCommit=${COMMIT}' -X '${PKG}.buildDate=${DATE}'" \
+  ./cmd
+"""
 
-docker buildx inspect "{{vars.docker_builder}}" >/dev/null 2>&1 || \
-  docker buildx create --name "{{vars.docker_builder}}" --use --driver docker-container
+[tasks."go:test"]
+description = "Run all tests including E2E (requires pre-built binary via RUNEVAULT_TEST_BINARY)"
+run = "cd vault && go test -race -tags e2e ./..."
 
-cd vault
-docker buildx build --builder "{{vars.docker_builder}}" \
-  -t "{{vars.docker_image}}:$TAG" \
-  --load .
-"""
+[tasks."go:test:unit"]
+description = "Run unit tests only (E2E excluded by build tag)"
+run = "cd vault && go test -race ./..."
 
-[tasks.push]
-description = "Build and push multi-platform Docker image to GHCR"
+[tasks."go:test:e2e"]
+description = "Run E2E tests against the pre-built runevault binary (run go:build first)"
 run = """
 #!/usr/bin/env bash
 set -euo pipefail
-TAG="{{arg(name="tag", default="latest")}}"
+BINARY="${RUNEVAULT_TEST_BINARY:-$(pwd)/vault/bin/runevault}"
+if [ ! -x "$BINARY" ]; then
+  echo "runevault binary not found at $BINARY — run 'mise run go:build' first" >&2
+  exit 1
+fi
+export RUNEVAULT_TEST_BINARY="$BINARY"
+cd vault && go test -race -tags e2e ./internal/tests/...
+"""
 
-gh auth token | docker login ghcr.io -u "$(gh api user -q .login)" --password-stdin
+[tasks."go:vet"]
+description = "Run go vet on all Go packages"
+run = "cd vault && go vet ./..."
 
-docker buildx inspect "{{vars.docker_builder}}" >/dev/null 2>&1 || \
-  docker buildx create --name "{{vars.docker_builder}}" --use --driver docker-container
+[tasks."go:fmt"]
+description = "Format Go source files"
+run = "cd vault && gofmt -w ."
 
+[tasks."go:fmt:check"]
+description = "Check Go formatting without modifying"
+run = """
+#!/usr/bin/env bash
+set -euo pipefail
 cd vault
-docker buildx build --builder "{{vars.docker_builder}}" \
-  --platform "{{vars.docker_platforms}}" \
-  -t "{{vars.docker_image}}:$TAG" \
-  --push .
+diff=$(gofmt -l .)
+if [ -n "$diff" ]; then
+  echo "gofmt found unformatted files:" >&2
+  echo "$diff" >&2
+  exit 1
+fi
 """
 
 [tasks.dev]
-description = "Start local development Vault via Docker Compose"
-run = "cd vault && docker compose up --build -d vault"
+description = "Run runevault daemon in foreground for development"
+run = "cd vault && go run ./cmd/runevault --config dev/runevault.conf daemon start"
 
 [tasks."fixtures:decrypt"]
 description = "Decrypt test fixtures from GPG archive"
diff --git a/AGENTS.md b/AGENTS.md
index 324b633..c86beb2 100644
--- a/AGENTS.md
+++ b/AGENTS.md
@@ -1,7 +1,8 @@
 # Rune-Vault (rune-admin)
 
-Python 3.12 gRPC server for FHE-encrypted organizational memory.
-The secret key never leaves this server.
+Single-binary Go gRPC server (`runevault`) for FHE-encrypted organizational
+memory. Built on `github.com/CryptoLabInc/envector-go-sdk`. The secret key
+never leaves this server.
 
 ## Setup
 
@@ -9,39 +10,40 @@ See [CONTRIBUTING.md](CONTRIBUTING.md#development-setup) for initial setup.
 
 ## Commands
 
-All commands **must** be run via `mise run` to ensure correct tool versions and venv activation.
-Do NOT run python, pytest, or ruff directly.
+All commands **must** be run via `mise run` to ensure correct tool versions.
+Do NOT run go, gofmt, or buf directly.
 
 | Command | Description |
 |---------|-------------|
-| `mise run test` | Unit + integration tests |
-| `mise run test:unit` | Unit tests only |
-| `mise run test:cov` | Tests with coverage report |
-| `mise run lint` | Ruff linter |
-| `mise run lint:fix` | Ruff with auto-fix |
-| `mise run format` | Ruff formatter |
-| `mise run format:check` | Check formatting without modifying |
-| `mise run check` | All checks: format + lint + unit tests |
-| `mise run proto` | Regenerate protobuf/gRPC stubs |
-| `mise run build` | Build Docker image locally |
-| `mise run dev` | Start local Vault via Docker Compose |
+| `mise run setup` | Bootstrap (Go modules + proto stubs) |
+| `mise run check` | All checks: gofmt + go vet + go test (race) |
+| `mise run go:build` | Build the runevault binary |
+| `mise run go:test` | Run Go unit + integration tests with race detector |
+| `mise run go:test:unit` | Run Go unit tests only (skip CLI smoke E2E) |
+| `mise run go:vet` | Run go vet on all Go packages |
+| `mise run go:fmt` | Format Go source files |
+| `mise run go:fmt:check` | Check Go formatting without modifying |
+| `mise run proto:go` | Regenerate Go protobuf/gRPC stubs into `vault/pkg/vaultpb` |
+| `mise run dev` | Run runevault daemon in foreground (uses `vault/dev/runevault.conf`) |
 | `mise run certs` | Generate self-signed TLS certificates |
+| `mise run fixtures:decrypt` | Decrypt test fixtures (requires `FIXTURES_GPG_PASSPHRASE`) |
+| `mise run fixtures:encrypt` | Re-encrypt test fixtures |
 
 ## Rules
 
 - English only in code, commit messages, PR descriptions, and issue bodies
 - Do not amend commits or force-push unless explicitly instructed
-- All public functions need type hints
-- New gRPC methods need corresponding unit tests in `tests/unit/`
-- Token/auth changes must update `tests/unit/test_auth.py`
+- All exported Go identifiers need a doc comment
+- New gRPC methods need corresponding unit tests in `vault/internal/server/grpc_test.go`
+- Token/auth changes must update `vault/internal/tokens/store_test.go`
 - Run `mise run check` before committing
 
 ## Security invariants
 
-- Secret key (`vault_keys/`) must never be logged, returned in API responses, or leave the server process
-- Admin server binds to `127.0.0.1` only — never expose externally
-- Token secrets must come from environment variables, never hardcoded
-- TLS is required for all cloud deployments
+- Secret key (`vault-keys/<key-id>/SecKey.json`) must never be logged, returned in API responses, or leave the server process
+- Admin transport is a Unix domain socket (mode 0600, vault-user owned) — never expose externally
+- Token secrets and FHE keys live in `runevault.conf` (mode 0600); secret YAML fields support `*_file` indirection for KMS-backed deployments
+- TLS is required for all cloud deployments (`server.grpc.tls.disable: true` is dev-only)
 
 ## Worktree setup
 
diff --git a/CLAUDE.md b/CLAUDE.md
index b53a5d9..82f38bd 100644
--- a/CLAUDE.md
+++ b/CLAUDE.md
@@ -1,7 +1,8 @@
 # Rune-Vault (rune-admin)
 
-Python 3.12 gRPC server for FHE-encrypted organizational memory.
-The secret key never leaves this server.
+Single-binary Go gRPC server (`runevault`) for FHE-encrypted organizational
+memory. Built on `github.com/CryptoLabInc/envector-go-sdk`. The secret key
+never leaves this server.
 
 ## Setup
 
@@ -9,40 +10,41 @@ See [CONTRIBUTING.md](CONTRIBUTING.md#development-setup) for initial setup.
 
 ## Commands
 
-All commands **must** be run via `mise run` to ensure correct tool versions and venv activation.
-Do NOT run python, pytest, or ruff directly.
+All commands **must** be run via `mise run` to ensure correct tool versions.
+Do NOT run go, gofmt, or buf directly.
 
 | Command | Description |
 |---------|-------------|
-| `mise run test` | Unit + integration tests |
-| `mise run test:unit` | Unit tests only |
-| `mise run test:cov` | Tests with coverage report |
-| `mise run lint` | Ruff linter |
-| `mise run lint:fix` | Ruff with auto-fix |
-| `mise run format` | Ruff formatter |
-| `mise run format:check` | Check formatting without modifying |
-| `mise run check` | All checks: format + lint + unit tests |
-| `mise run proto` | Regenerate protobuf/gRPC stubs |
-| `mise run build` | Build Docker image locally |
-| `mise run push` | Build and push multi-platform image to GHCR (requires GHCR access) |
-| `mise run dev` | Start local Vault via Docker Compose |
+| `mise run setup` | Bootstrap (Go modules + proto stubs) |
+| `mise run check` | All checks: gofmt + go vet + unit tests (race) |
+| `mise run go:build` | Build the runevault binary to `vault/bin/runevault` |
+| `mise run go:test` | Run all tests including E2E (requires `RUNEVAULT_TEST_BINARY`) |
+| `mise run go:test:unit` | Run unit tests only (E2E excluded by build tag) |
+| `mise run go:test:e2e` | Run E2E tests against pre-built binary (run `go:build` first) |
+| `mise run go:vet` | Run go vet on all Go packages |
+| `mise run go:fmt` | Format Go source files |
+| `mise run go:fmt:check` | Check Go formatting without modifying |
+| `mise run proto:go` | Regenerate Go protobuf/gRPC stubs into `vault/pkg/vaultpb` |
+| `mise run dev` | Run runevault daemon in foreground (uses `vault/dev/runevault.conf`) |
 | `mise run certs` | Generate self-signed TLS certificates |
+| `mise run fixtures:decrypt` | Decrypt test fixtures (requires `FIXTURES_GPG_PASSPHRASE`) |
+| `mise run fixtures:encrypt` | Re-encrypt test fixtures |
 
 ## Rules
 
 - English only in code, commit messages, PR descriptions, and issue bodies
 - Do not amend commits or force-push unless explicitly instructed
-- All public functions need type hints
-- New gRPC methods need corresponding unit tests in `tests/unit/`
-- Token/auth changes must update `tests/unit/test_auth.py`
+- All exported Go identifiers need a doc comment
+- New gRPC methods need corresponding unit tests in `vault/internal/server/grpc_test.go`
+- Token/auth changes must update `vault/internal/tokens/store_test.go`
 - Run `mise run check` before committing
 
 ## Security invariants
 
-- Secret key (`vault_keys/`) must never be logged, returned in API responses, or leave the server process
-- Admin server binds to `127.0.0.1` only — never expose externally
-- Token secrets must come from environment variables, never hardcoded
-- TLS is required for all cloud deployments
+- Secret key (`vault-keys/<key-id>/SecKey.json`) must never be logged, returned in API responses, or leave the server process
+- Admin transport is a Unix domain socket (mode 0600, vault-user owned) — never expose externally
+- Token secrets and FHE keys live in `runevault.conf` (mode 0600); secret YAML fields support `*_file` indirection for KMS-backed deployments
+- TLS is required for all cloud deployments (`server.grpc.tls.disable: true` is dev-only)
 
 ## Worktree setup
 
diff --git a/CONTRIBUTING.md b/CONTRIBUTING.md
index cf56502..209b466 100644
--- a/CONTRIBUTING.md
+++ b/CONTRIBUTING.md
@@ -15,7 +15,7 @@ Before creating an issue:
 2. Collect relevant information:
    - Rune-Admin version
    - Deployment platform (OCI/AWS/GCP)
-   - Python version
+   - Go version (`go version`)
    - Error messages and logs
    - Steps to reproduce
 
@@ -34,7 +34,6 @@ Feature requests should include:
 ### Prerequisites
 
 - [mise](https://mise.jdx.dev): `curl https://mise.jdx.dev/install.sh | sh`
-- [Docker](https://docs.docker.com/get-docker/) (for local Vault and image builds)
 
 **CSP deployment only:**
 - Access to cloud provider (OCI/AWS/GCP)
@@ -50,8 +49,8 @@ Feature requests should include:
 
 2. **Install tools and bootstrap**
    ```bash
-   mise install        # Install Python 3.12, buf, ruff, terraform, cloud CLIs
-   mise run setup      # Create venv, install deps, generate proto stubs
+   mise install        # Install Go 1.25, buf, terraform, cloud CLIs
+   mise run setup      # Resolve Go modules, generate proto stubs
    ```
 
 3. **Verify setup**
@@ -68,47 +67,34 @@ Feature requests should include:
 
 ### Commands
 
-All commands **must** be run via `mise run` to ensure correct tool versions and venv activation.
-
-| Command | Description |
-|---------|-------------|
-| `mise run test` | Unit + integration tests |
-| `mise run test:unit` | Unit tests only |
-| `mise run test:cov` | Tests with coverage report |
-| `mise run lint` | Ruff linter |
-| `mise run lint:fix` | Ruff with auto-fix |
-| `mise run format` | Ruff formatter |
-| `mise run format:check` | Check formatting without modifying |
-| `mise run check` | All checks: format + lint + unit tests |
-| `mise run proto` | Regenerate protobuf/gRPC stubs |
-| `mise run build` | Build Docker image locally |
-| `mise run push` | Build and push multi-platform image to GHCR (requires GHCR access) |
-| `mise run dev` | Start local Vault via Docker Compose |
-| `mise run certs` | Generate self-signed TLS certificates |
+All commands **must** be run via `mise run` to ensure correct tool versions.
+
+See [CLAUDE.md](CLAUDE.md#commands) for the complete task table.
 
 ## Testing
 
 ### Test Structure
 
 ```
-tests/
-├── unit/          # Fast, isolated tests per module
-└── integration/   # End-to-end Vault API tests
+vault/internal/
+├── tokens/        # Token store + role/rate-limit unit tests
+├── crypto/        # HKDF + AES-CTR + envector-go-sdk wrappers
+├── server/        # gRPC handlers, interceptors, audit, admin UDS, pidfile
+├── commands/      # CLI subcommands + admin client
+├── integration/   # E2E: decrypt pipeline (fixture-based) + CLI smoke
+└── testutil/      # Fixture path resolver
 ```
 
 ### Running Tests
 
-All test commands **must** be run via `mise run`:
-
 ```bash
-mise run test         # Unit + integration tests
-mise run test:unit    # Unit tests only
-mise run test:cov     # Tests with coverage report
+mise run go:test          # All tests with race detector
+mise run go:test:unit     # Skip CLI smoke E2E (faster)
 ```
 
 ### Test Fixtures
 
-Integration tests use GPG-encrypted fixtures containing FHE keys and ciphertext blobs. See [tests/FIXTURES.md](tests/FIXTURES.md) for the full update procedure, including passphrase rotation and re-encryption steps.
+Integration tests use GPG-encrypted fixtures containing FHE keys and ciphertext blobs. See [tests/FIXTURES.md](tests/FIXTURES.md) for the full update procedure, including passphrase rotation and re-encryption steps. The fixture-based decrypt-pipeline test under `vault/internal/integration/` skips automatically when `tests/fixtures/` is not decrypted.
 
 ### Test Requirements
 
@@ -116,17 +102,16 @@ Integration tests use GPG-encrypted fixtures containing FHE keys and ciphertext
 - Use fixtures for crypto setup to avoid repeated key generation
 - Mock external dependencies
 - Test both success and error paths
-- New gRPC methods need corresponding unit tests in `tests/unit/`
-- Token/auth changes must update `tests/unit/test_auth.py`
+- New gRPC methods need corresponding unit tests in `vault/internal/server/grpc_test.go`
+- Token/auth changes must update `vault/internal/tokens/store_test.go`
 
 ## Code Style
 
-### Python
+### Go
 
-- Follow PEP 8
-- All public functions need type hints
-- Keep functions focused and testable
-- Format and lint with ruff: `mise run format` and `mise run lint`
+- Run `mise run go:fmt` to format
+- All exported identifiers need a doc comment
+- Tests live alongside the code they test (`*_test.go`)
 - Run `mise run check` before committing
 
 ### Shell Scripts
diff --git a/pyproject.toml b/pyproject.toml
deleted file mode 100644
index b2a9db7..0000000
--- a/pyproject.toml
+++ /dev/null
@@ -1,14 +0,0 @@
-[project]
-name = "rune-vault"
-requires-python = ">=3.12"
-
-[tool.ruff]
-line-length = 100
-target-version = "py312"
-
-[tool.ruff.lint]
-select = ["E", "F", "I", "W"]
-
-[tool.pytest.ini_options]
-testpaths = ["tests"]
-asyncio_mode = "auto"
diff --git a/requirements.txt b/requirements.txt
deleted file mode 100644
index 3f1e84e..0000000
--- a/requirements.txt
+++ /dev/null
@@ -1,24 +0,0 @@
-# Rune-Admin Dependencies
-
-# FHE Encryption SDK
-pyenvector>=1.2.0
-
-# HTTP Client
-httpx>=0.24.0
-
-# JSON handling
-python-json-logger>=2.0.0
-
-# enVector MCP Server Dependencies
-pydantic[email]>=2.11.7
-python-dotenv>=1.2.1
-fastembed>=0.7.4
-langchain-text-splitters>=1.0.0
-pypdf>=6.4.1
-
-# Testing (optional)
-pytest>=7.0.0
-pytest-asyncio>=0.18.0
-
-# NumPy (required by pyenvector)
-numpy>=1.24.0
diff --git a/tests/integration/__init__.py b/tests/integration/__init__.py
deleted file mode 100644
index 2dfbe6f..0000000
--- a/tests/integration/__init__.py
+++ /dev/null
@@ -1 +0,0 @@
-"""Integration tests for Rune-Vault API."""
diff --git a/tests/integration/test_decrypt_pipeline.py b/tests/integration/test_decrypt_pipeline.py
deleted file mode 100644
index fa15e91..0000000
--- a/tests/integration/test_decrypt_pipeline.py
+++ /dev/null
@@ -1,155 +0,0 @@
-"""
-Integration tests for the decrypt pipeline.
-
-Uses pre-generated fixtures from tests/fixtures/ (captured from enVector Cloud)
-to test _decrypt_scores_impl and _decrypt_metadata_impl end-to-end.
-
-Fixtures are generated by: scripts/generate-test-fixtures.py
-"""
-
-import json
-import os
-import sys
-
-import pytest
-
-# Add vault to path
-sys.path.insert(0, os.path.join(os.path.dirname(__file__), "../../vault"))
-
-FIXTURES_DIR = os.path.join(os.path.dirname(__file__), "..", "fixtures")
-
-
-def _load_fixture(name: str) -> str | dict | list:
-    path = os.path.join(FIXTURES_DIR, name)
-    with open(path) as f:
-        if name.endswith(".json"):
-            return json.load(f)
-        return f.read().strip()
-
-
-@pytest.fixture(scope="module")
-def fixtures():
-    """Load all fixtures and patch vault_core for testing."""
-    config = _load_fixture("config.json")
-    keys_dir = os.path.join(FIXTURES_DIR, "keys")
-    return {
-        "config": config,
-        "enc_key_path": os.path.join(keys_dir, "EncKey.json"),
-        "sec_key_path": os.path.join(keys_dir, "SecKey.json"),
-        "score_blob_b64": _load_fixture("ciphertext_score.b64"),
-        "expected_scores": _load_fixture("expected_scores.json"),
-        "envelopes": _load_fixture("metadata_envelopes.json"),
-        "expected_metadata": _load_fixture("expected_metadata.json"),
-    }
-
-
-@pytest.fixture(autouse=True)
-def patch_vault(fixtures, monkeypatch):
-    """Patch vault_core to use fixture keys and config."""
-    import vault_core
-    from pyenvector.crypto import Cipher
-    from token_store import token_store
-
-    config = fixtures["config"]
-
-    monkeypatch.setattr(vault_core, "sec_key_path", fixtures["sec_key_path"])
-    monkeypatch.setattr(vault_core, "VAULT_TEAM_SECRET", config["team_secret"])
-
-    # Reinitialize cipher with fixture SecKey (dim must match fixture FHE dim)
-    # cipher.decrypt_score needs enc_key_path but only uses sec_key_path for decryption
-    # Use a dummy enc_key_path since we only decrypt
-    fixture_cipher = Cipher(enc_key_path=fixtures["enc_key_path"], dim=config["dim"])
-    monkeypatch.setattr(vault_core, "cipher", fixture_cipher)
-
-    token_store._rate_limiters.clear()
-
-
-class TestDecryptScores:
-
-    def test_decrypt_scores(self, fixtures):
-        """Full pipeline: CiphertextScore blob → _decrypt_scores_impl → correct scores."""
-        from vault_core import _decrypt_scores_impl
-
-        config = fixtures["config"]
-        expected = fixtures["expected_scores"]
-        total_scores = sum(len(row) for row in expected["score"])
-
-        result = _decrypt_scores_impl(config["token"], fixtures["score_blob_b64"], top_k=total_scores)
-        data = json.loads(result)
-
-        assert isinstance(data, list)
-        assert len(data) == total_scores
-
-        # Verify scores match expected (FHE decryption is deterministic with same key)
-        expected_flat = []
-        shard_indices = expected["shard_idx"]
-        for i, row in enumerate(expected["score"]):
-            for j, score in enumerate(row):
-                expected_flat.append((shard_indices[i], j, score))
-        expected_flat.sort(key=lambda x: x[2], reverse=True)
-
-        for actual, (exp_shard, exp_row, exp_score) in zip(data, expected_flat):
-            assert actual["shard_idx"] == exp_shard
-            assert actual["row_idx"] == exp_row
-            assert abs(actual["score"] - exp_score) < 1e-6
-
-    def test_decrypt_scores_top_k(self, fixtures):
-        """Top-K filtering returns correct count and highest scores."""
-        from vault_core import _decrypt_scores_impl
-
-        config = fixtures["config"]
-        expected = fixtures["expected_scores"]
-
-        # Get all scores to find the true top-3
-        all_scores = []
-        for i, row in enumerate(expected["score"]):
-            for j, score in enumerate(row):
-                all_scores.append(score)
-        all_scores.sort(reverse=True)
-
-        result = _decrypt_scores_impl(config["token"], fixtures["score_blob_b64"], top_k=3)
-        data = json.loads(result)
-
-        assert len(data) == 3
-        # Returned scores should be the 3 highest
-        returned_scores = [item["score"] for item in data]
-        for actual, expected_score in zip(returned_scores, all_scores[:3]):
-            assert abs(actual - expected_score) < 1e-6
-        # Descending order
-        assert returned_scores == sorted(returned_scores, reverse=True)
-
-
-class TestDecryptMetadata:
-
-    def test_decrypt_metadata_single(self, fixtures):
-        """Single envelope → _decrypt_metadata_impl → correct plaintext."""
-        from vault_core import _decrypt_metadata_impl
-
-        config = fixtures["config"]
-        envelopes = fixtures["envelopes"]
-        expected = fixtures["expected_metadata"]
-
-        result = _decrypt_metadata_impl(config["token"], [envelopes[0]])
-        data = json.loads(result)
-
-        assert isinstance(data, list)
-        assert len(data) == 1
-        # _decrypt_metadata_impl returns JSON strings or already-decoded objects
-        actual = json.loads(data[0]) if isinstance(data[0], str) else data[0]
-        assert actual == expected[0]
-
-    def test_decrypt_metadata_multiple(self, fixtures):
-        """Multiple envelopes → all decrypted correctly."""
-        from vault_core import _decrypt_metadata_impl
-
-        config = fixtures["config"]
-        envelopes = fixtures["envelopes"]
-        expected = fixtures["expected_metadata"]
-
-        result = _decrypt_metadata_impl(config["token"], envelopes)
-        data = json.loads(result)
-
-        assert len(data) == len(expected)
-        for item, exp in zip(data, expected):
-            actual = json.loads(item) if isinstance(item, str) else item
-            assert actual == exp
diff --git a/tests/requirements.txt b/tests/requirements.txt
deleted file mode 100644
index 5a89044..0000000
--- a/tests/requirements.txt
+++ /dev/null
@@ -1,10 +0,0 @@
-# Test dependencies for Rune-Vault
-pytest>=7.4.0
-pytest-asyncio>=0.21.0
-pytest-cov>=4.1.0
-httpx>=0.24.0
-
-# Vault dependencies
-numpy>=1.24.0
-pyenvector>=1.2.0
-
diff --git a/tests/unit/__init__.py b/tests/unit/__init__.py
deleted file mode 100644
index c42a1d7..0000000
--- a/tests/unit/__init__.py
+++ /dev/null
@@ -1 +0,0 @@
-"""Unit tests for Rune-Vault components."""
diff --git a/tests/unit/test_admin_server.py b/tests/unit/test_admin_server.py
deleted file mode 100644
index 5d6ee6f..0000000
--- a/tests/unit/test_admin_server.py
+++ /dev/null
@@ -1,209 +0,0 @@
-"""
-Unit tests for Admin HTTP server.
-"""
-import http.client
-import json
-import os
-import sys
-import time
-
-import pytest
-
-sys.path.insert(0, os.path.join(os.path.dirname(__file__), '../../vault'))
-
-from token_store import TokenStore, DEFAULT_ROLES
-from admin_server import start_admin_server
-
-
-def _request(port, method, path, body=None):
-    conn = http.client.HTTPConnection("127.0.0.1", port)
-    headers = {"Content-Type": "application/json"} if body else {}
-    data = json.dumps(body).encode() if body else None
-    conn.request(method, path, body=data, headers=headers)
-    resp = conn.getresponse()
-    result = json.loads(resp.read().decode())
-    conn.close()
-    return resp.status, result
-
-
-class TestAdminServer:
-    """Integration tests for the admin HTTP API."""
-
-    @pytest.fixture(autouse=True)
-    def setup_server(self):
-        self.store = TokenStore()
-        self.store._roles = dict(DEFAULT_ROLES)
-        # Use port 0 to let OS assign an available ephemeral port
-        self.server = start_admin_server(self.store, "127.0.0.1", 0)
-        self.port = self.server.server_address[1]
-        time.sleep(0.1)  # Give server time to start
-        yield
-        self.server.shutdown()
-
-    # ── Token endpoints ──────────────────────────────────────────────
-
-    def test_issue_token(self):
-        status, data = _request(self.port, "POST", "/tokens", {
-            "user": "alice", "role": "member", "expires_days": 90
-        })
-        assert status == 201
-        assert data["user"] == "alice"
-        assert data["token"].startswith("evt_")
-        assert data["role"] == "member"
-
-    def test_list_tokens(self):
-        _request(self.port, "POST", "/tokens", {
-            "user": "alice", "role": "member"
-        })
-        status, data = _request(self.port, "GET", "/tokens")
-        assert status == 200
-        assert len(data["tokens"]) == 1
-        assert data["tokens"][0]["user"] == "alice"
-
-    def test_revoke_token(self):
-        _request(self.port, "POST", "/tokens", {
-            "user": "alice", "role": "member"
-        })
-        status, data = _request(self.port, "DELETE", "/tokens/alice")
-        assert status == 200
-        assert "Revoked" in data["message"]
-
-        # List should be empty
-        _, data = _request(self.port, "GET", "/tokens")
-        assert len(data["tokens"]) == 0
-
-    def test_revoke_nonexistent_token(self):
-        status, data = _request(self.port, "DELETE", "/tokens/nobody")
-        assert status == 404
-
-    def test_issue_duplicate_user(self):
-        _request(self.port, "POST", "/tokens", {
-            "user": "alice", "role": "member"
-        })
-        status, data = _request(self.port, "POST", "/tokens", {
-            "user": "alice", "role": "member"
-        })
-        assert status == 400
-        assert "already exists" in data["error"]
-
-    def test_issue_token_invalid_role(self):
-        status, data = _request(self.port, "POST", "/tokens", {
-            "user": "alice", "role": "nonexistent"
-        })
-        assert status == 400
-
-    # ── Rotate endpoints ──────────────────────────────────────────────
-
-    def test_rotate_token(self):
-        _, issue_data = _request(self.port, "POST", "/tokens", {
-            "user": "alice", "role": "member"
-        })
-        status, data = _request(self.port, "POST", "/tokens/alice/rotate", {})
-        assert status == 200
-        assert data["user"] == "alice"
-        assert data["token"].startswith("evt_")
-        assert data["token"] != issue_data["token"]
-        assert data["role"] == "member"
-
-    def test_rotate_nonexistent_user(self):
-        status, data = _request(self.port, "POST", "/tokens/nobody/rotate", {})
-        assert status == 400
-        assert "No token found" in data["error"]
-
-    def test_rotate_all(self):
-        _request(self.port, "POST", "/tokens", {"user": "alice", "role": "member"})
-        _request(self.port, "POST", "/tokens", {"user": "bob", "role": "admin"})
-        status, data = _request(self.port, "POST", "/tokens/_rotate_all", {})
-        assert status == 200
-        assert data["rotated"] == 2
-        assert len(data["tokens"]) == 2
-
-    # ── Role endpoints ───────────────────────────────────────────────
-
-    def test_list_roles(self):
-        status, data = _request(self.port, "GET", "/roles")
-        assert status == 200
-        names = [r["name"] for r in data["roles"]]
-        assert "admin" in names
-        assert "member" in names
-
-    def test_create_role(self):
-        status, data = _request(self.port, "POST", "/roles", {
-            "name": "researcher",
-            "scope": ["get_public_key", "decrypt_scores"],
-            "top_k": 3,
-            "rate_limit": "10/60s",
-        })
-        assert status == 201
-        assert data["name"] == "researcher"
-
-    def test_update_role(self):
-        status, data = _request(self.port, "PUT", "/roles/member", {
-            "top_k": 8,
-        })
-        assert status == 200
-        assert data["top_k"] == 8
-
-    def test_delete_custom_role(self):
-        _request(self.port, "POST", "/roles", {
-            "name": "temp",
-            "scope": ["get_public_key"],
-            "top_k": 1,
-            "rate_limit": "5/60s",
-        })
-        status, data = _request(self.port, "DELETE", "/roles/temp")
-        assert status == 200
-
-    def test_delete_default_role_rejected(self):
-        status, data = _request(self.port, "DELETE", "/roles/admin")
-        assert status == 400
-        assert "Cannot delete default" in data["error"]
-
-    def test_unknown_resource(self):
-        status, _ = _request(self.port, "GET", "/unknown")
-        assert status == 404
-
-    # ── Health endpoint ──────────────────────────────────────────────
-
-    def test_health_ok_without_servicer(self):
-        status, data = _request(self.port, "GET", "/health")
-        assert status == 200
-        assert data["status"] == "ok"
-
-    def test_health_ok_with_serving_servicer(self):
-        from grpc_health.v1 import health_pb2
-        from grpc_health.v1.health import HealthServicer
-
-        servicer = HealthServicer()
-        servicer.set("", health_pb2.HealthCheckResponse.SERVING)
-
-        store = TokenStore()
-        store._roles = dict(DEFAULT_ROLES)
-        server = start_admin_server(store, "127.0.0.1", 0, health_servicer=servicer)
-        port = server.server_address[1]
-        time.sleep(0.1)
-        try:
-            status, data = _request(port, "GET", "/health")
-            assert status == 200
-            assert data["status"] == "ok"
-        finally:
-            server.shutdown()
-
-    def test_health_unhealthy_with_not_serving(self):
-        from grpc_health.v1 import health_pb2
-        from grpc_health.v1.health import HealthServicer
-
-        servicer = HealthServicer()
-        servicer.set("", health_pb2.HealthCheckResponse.NOT_SERVING)
-
-        store = TokenStore()
-        store._roles = dict(DEFAULT_ROLES)
-        server = start_admin_server(store, "127.0.0.1", 0, health_servicer=servicer)
-        port = server.server_address[1]
-        time.sleep(0.1)
-        try:
-            status, data = _request(port, "GET", "/health")
-            assert status == 503
-            assert data["status"] == "unhealthy"
-        finally:
-            server.shutdown()
diff --git a/tests/unit/test_audit.py b/tests/unit/test_audit.py
deleted file mode 100644
index 8409166..0000000
--- a/tests/unit/test_audit.py
+++ /dev/null
@@ -1,250 +0,0 @@
-"""
-Unit tests for structured audit logging (issue #19).
-"""
-
-import json
-import os
-import sys
-import tempfile
-from unittest.mock import MagicMock
-
-import pytest
-
-# Add vault to path
-sys.path.insert(0, os.path.join(os.path.dirname(__file__), "../../vault"))
-
-from audit import (
-    AuditLogger,
-    _parse_audit_config,
-    extract_source_ip,
-)
-
-
-# ---------------------------------------------------------------------------
-# Config parsing
-# ---------------------------------------------------------------------------
-
-
-class TestParseAuditConfig:
-    def test_empty_string(self):
-        cfg = _parse_audit_config("")
-        assert cfg["file"] is None
-        assert cfg["stdout"] is False
-
-    def test_file_default_path(self):
-        cfg = _parse_audit_config("file")
-        assert cfg["file"] == "/var/log/rune-vault/audit.log"
-        assert cfg["stdout"] is False
-
-    def test_file_custom_path(self):
-        cfg = _parse_audit_config("file:/tmp/my-audit.log")
-        assert cfg["file"] == "/tmp/my-audit.log"
-
-    def test_stdout(self):
-        cfg = _parse_audit_config("stdout")
-        assert cfg["file"] is None
-        assert cfg["stdout"] is True
-
-    def test_file_plus_stdout(self):
-        cfg = _parse_audit_config("file+stdout")
-        assert cfg["file"] == "/var/log/rune-vault/audit.log"
-        assert cfg["stdout"] is True
-
-    def test_stdout_plus_file(self):
-        cfg = _parse_audit_config("stdout+file")
-        assert cfg["file"] == "/var/log/rune-vault/audit.log"
-        assert cfg["stdout"] is True
-
-    def test_custom_path_plus_stdout(self):
-        cfg = _parse_audit_config("file:/tmp/my-audit.log+stdout")
-        assert cfg["file"] == "/tmp/my-audit.log"
-        assert cfg["stdout"] is True
-
-    def test_custom_path_preserves_case(self):
-        cfg = _parse_audit_config("file:/var/log/Rune-Vault/Audit.log")
-        assert cfg["file"] == "/var/log/Rune-Vault/Audit.log"
-
-    def test_file_keyword_case_insensitive(self):
-        cfg = _parse_audit_config("FILE+STDOUT")
-        assert cfg["file"] == "/var/log/rune-vault/audit.log"
-        assert cfg["stdout"] is True
-
-
-# ---------------------------------------------------------------------------
-# Source IP extraction
-# ---------------------------------------------------------------------------
-
-
-class TestExtractSourceIp:
-    def _make_context(self, peer_value):
-        ctx = MagicMock()
-        ctx.peer.return_value = peer_value
-        return ctx
-
-    def test_ipv4(self):
-        assert extract_source_ip(self._make_context("ipv4:10.0.0.1:12345")) == "10.0.0.1"
-
-    def test_ipv4_no_port(self):
-        # Defensive: if port is missing
-        assert extract_source_ip(self._make_context("ipv4:10.0.0.1")) == "10.0.0.1"
-
-    def test_ipv6_bracketed(self):
-        assert extract_source_ip(self._make_context("ipv6:[::1]:12345")) == "[::1]"
-
-    def test_ipv6_no_brackets(self):
-        result = extract_source_ip(self._make_context("ipv6:::1:12345"))
-        assert result  # should not crash
-
-    def test_none_peer(self):
-        assert extract_source_ip(self._make_context(None)) == "unknown"
-
-    def test_exception(self):
-        ctx = MagicMock()
-        ctx.peer.side_effect = RuntimeError("broken")
-        assert extract_source_ip(ctx) == "unknown"
-
-    def test_unix_socket(self):
-        result = extract_source_ip(self._make_context("unix:/var/run/vault.sock"))
-        assert result == "unix:/var/run/vault.sock"
-
-
-# ---------------------------------------------------------------------------
-# AuditLogger
-# ---------------------------------------------------------------------------
-
-
-class TestAuditLogger:
-    def test_disabled_when_no_handlers(self):
-        logger = AuditLogger({"file": None, "stdout": False})
-        assert logger.enabled is False
-
-    def test_file_mode_writes_json(self):
-        with tempfile.NamedTemporaryFile(mode="r", suffix=".log", delete=False) as f:
-            path = f.name
-        try:
-            logger = AuditLogger({"file": path, "stdout": False})
-            assert logger.enabled is True
-            entry = logger.log(
-                timestamp="2026-03-30T12:00:00+00:00",
-                user_id="alice",
-                method="decrypt_scores",
-                top_k=10,
-                result_count=5,
-                status="success",
-                source_ip="10.0.0.1",
-                latency_ms=42.567,
-            )
-            # Force flush
-            for h in logger._logger.handlers:
-                h.flush()
-            with open(path) as fh:
-                line = fh.readline().strip()
-            parsed = json.loads(line)
-            assert parsed["user_id"] == "alice"
-            assert parsed["method"] == "decrypt_scores"
-            assert parsed["top_k"] == 10
-            assert parsed["result_count"] == 5
-            assert parsed["status"] == "success"
-            assert parsed["source_ip"] == "10.0.0.1"
-            assert parsed["latency_ms"] == 42.57
-            assert parsed["timestamp"] == "2026-03-30T12:00:00+00:00"
-            assert "error" not in parsed
-            # Verify return value matches
-            assert entry["user_id"] == "alice"
-        finally:
-            os.unlink(path)
-
-    def test_error_field_included(self):
-        with tempfile.NamedTemporaryFile(mode="r", suffix=".log", delete=False) as f:
-            path = f.name
-        try:
-            logger = AuditLogger({"file": path, "stdout": False})
-            logger.log(
-                timestamp="2026-03-30T12:00:00+00:00",
-                user_id="unknown",
-                method="decrypt_scores",
-                top_k=None,
-                result_count=0,
-                status="error",
-                source_ip="10.0.0.99",
-                latency_ms=1.23,
-                error="Invalid authentication token",
-            )
-            for h in logger._logger.handlers:
-                h.flush()
-            with open(path) as fh:
-                parsed = json.loads(fh.readline().strip())
-            assert parsed["status"] == "error"
-            assert parsed["error"] == "Invalid authentication token"
-            assert parsed["top_k"] is None
-        finally:
-            os.unlink(path)
-
-    def test_stdout_mode(self, capsys):
-        logger = AuditLogger({"file": None, "stdout": True})
-        assert logger.enabled is True
-        logger.log(
-            timestamp="2026-03-30T12:00:00+00:00",
-            user_id="bob",
-            method="get_public_key",
-            top_k=None,
-            result_count=1,
-            status="success",
-            source_ip="10.0.0.2",
-            latency_ms=5.0,
-        )
-        captured = capsys.readouterr()
-        parsed = json.loads(captured.out.strip())
-        assert parsed["user_id"] == "bob"
-
-    def test_empty_error_string_included(self):
-        with tempfile.NamedTemporaryFile(mode="r", suffix=".log", delete=False) as f:
-            path = f.name
-        try:
-            logger = AuditLogger({"file": path, "stdout": False})
-            logger.log(
-                timestamp="2026-03-30T12:00:00+00:00",
-                user_id="test",
-                method="decrypt_scores",
-                top_k=None,
-                result_count=0,
-                status="error",
-                source_ip="10.0.0.1",
-                latency_ms=1.0,
-                error="",
-            )
-            for h in logger._logger.handlers:
-                h.flush()
-            with open(path) as fh:
-                parsed = json.loads(fh.readline().strip())
-            assert "error" in parsed
-            assert parsed["error"] == ""
-        finally:
-            os.unlink(path)
-
-    def test_entry_schema_required_fields(self):
-        with tempfile.NamedTemporaryFile(mode="r", suffix=".log", delete=False) as f:
-            path = f.name
-        try:
-            logger = AuditLogger({"file": path, "stdout": False})
-            logger.log(
-                timestamp="2026-03-30T12:00:00+00:00",
-                user_id="test",
-                method="decrypt_metadata",
-                top_k=None,
-                result_count=3,
-                status="success",
-                source_ip="127.0.0.1",
-                latency_ms=10.0,
-            )
-            for h in logger._logger.handlers:
-                h.flush()
-            with open(path) as fh:
-                parsed = json.loads(fh.readline().strip())
-            required = {"timestamp", "user_id", "method", "top_k", "result_count",
-                        "status", "source_ip", "latency_ms"}
-            assert required.issubset(parsed.keys())
-        finally:
-            os.unlink(path)
-
-
diff --git a/tests/unit/test_auth.py b/tests/unit/test_auth.py
deleted file mode 100644
index b8507bf..0000000
--- a/tests/unit/test_auth.py
+++ /dev/null
@@ -1,147 +0,0 @@
-"""
-Unit tests for authentication and token validation.
-Updated for per-user token auth (issue #18).
-"""
-import pytest
-import sys
-import os
-import time
-
-# Add vault to path
-sys.path.insert(0, os.path.join(os.path.dirname(__file__), '../../vault'))
-
-from token_store import (
-    TokenStore, RateLimiter, Role,
-    TokenNotFoundError, TokenExpiredError, RateLimitError, ScopeError,
-)
-from vault_core import validate_token, token_store
-
-# Demo token used when no config files or env var set
-DEMO_TOKEN = "evt_0000000000000000000000000000demo"
-
-
-class TestTokenValidation:
-    """Test token validation with per-user token store."""
-
-    def setup_method(self):
-        """Reset token store to demo mode for each test."""
-        token_store._tokens.clear()
-        token_store._tokens_by_user.clear()
-        token_store._roles.clear()
-        token_store._rate_limiters.clear()
-        token_store.load_defaults_with_demo_token()
-
-    def test_valid_demo_token(self):
-        """Demo token should return (username, role) tuple."""
-        username, role = validate_token(DEMO_TOKEN)
-        assert username == "demo"
-        assert role.name == "admin"
-
-    def test_invalid_token_raises_error(self):
-        """Invalid token should raise TokenNotFoundError."""
-        with pytest.raises(TokenNotFoundError):
-            validate_token("invalid-token-123")
-
-    def test_empty_token_raises_error(self):
-        """Empty token should raise TokenNotFoundError."""
-        with pytest.raises(TokenNotFoundError):
-            validate_token("")
-
-    def test_token_case_sensitive(self):
-        """Token validation should be case-sensitive."""
-        with pytest.raises(TokenNotFoundError):
-            validate_token(DEMO_TOKEN.upper())
-
-    def test_token_no_whitespace_tolerance(self):
-        """Tokens with whitespace should fail."""
-        with pytest.raises(TokenNotFoundError):
-            validate_token(f" {DEMO_TOKEN} ")
-
-    def test_old_tokens_not_valid(self):
-        """Old hardcoded tokens should not work."""
-        with pytest.raises(TokenNotFoundError):
-            validate_token("envector-team-alpha")
-
-    def test_validate_returns_tuple(self):
-        """validate_token should return (username, Role) tuple."""
-        result = validate_token(DEMO_TOKEN)
-        assert isinstance(result, tuple)
-        assert len(result) == 2
-        username, role = result
-        assert isinstance(username, str)
-        assert isinstance(role, Role)
-
-
-class TestRateLimiter:
-    """Test rate limiting functionality."""
-
-    def test_allows_requests_under_limit(self):
-        """Requests under limit should be allowed."""
-        limiter = RateLimiter(max_requests=5, window_seconds=60)
-        for _ in range(5):
-            assert limiter.is_allowed("test-client") is True
-
-    def test_blocks_requests_over_limit(self):
-        """Requests over limit should be blocked."""
-        limiter = RateLimiter(max_requests=3, window_seconds=60)
-        for _ in range(3):
-            limiter.is_allowed("test-client")
-        assert limiter.is_allowed("test-client") is False
-
-    def test_different_clients_have_separate_limits(self):
-        """Different clients should have independent rate limits."""
-        limiter = RateLimiter(max_requests=2, window_seconds=60)
-        limiter.is_allowed("client-a")
-        limiter.is_allowed("client-a")
-        assert limiter.is_allowed("client-a") is False
-        assert limiter.is_allowed("client-b") is True
-
-    def test_window_expiration(self):
-        """Old requests should expire after window."""
-        limiter = RateLimiter(max_requests=2, window_seconds=1)
-        limiter.is_allowed("test-client")
-        limiter.is_allowed("test-client")
-        assert limiter.is_allowed("test-client") is False
-        time.sleep(1.1)
-        assert limiter.is_allowed("test-client") is True
-
-    def test_retry_after_returns_correct_value(self):
-        """get_retry_after should return seconds until next allowed request."""
-        limiter = RateLimiter(max_requests=1, window_seconds=60)
-        limiter.is_allowed("test-client")
-        retry_after = limiter.get_retry_after("test-client")
-        assert 55 <= retry_after <= 60
-
-    def test_remove_client(self):
-        """remove() should clear a client's tracking data."""
-        limiter = RateLimiter(max_requests=1, window_seconds=60)
-        limiter.is_allowed("test-client")
-        assert limiter.is_allowed("test-client") is False
-        limiter.remove("test-client")
-        assert limiter.is_allowed("test-client") is True
-
-
-class TestScopeEnforcement:
-    """Test scope enforcement for roles."""
-
-    def setup_method(self):
-        token_store._tokens.clear()
-        token_store._tokens_by_user.clear()
-        token_store._roles.clear()
-        token_store._rate_limiters.clear()
-        token_store.load_defaults_with_demo_token()
-
-    def test_admin_scope_allows_all_methods(self):
-        """Admin role should allow all standard methods."""
-        _, role = validate_token(DEMO_TOKEN)
-        # Should not raise
-        token_store.check_scope(role, "get_public_key")
-        token_store.check_scope(role, "decrypt_scores")
-        token_store.check_scope(role, "decrypt_metadata")
-        token_store.check_scope(role, "manage_tokens")
-
-    def test_scope_rejects_unauthorized_method(self):
-        """Methods not in scope should raise ScopeError."""
-        role = Role("limited", ["get_public_key"], 5, "30/60s")
-        with pytest.raises(ScopeError, match="decrypt_scores"):
-            token_store.check_scope(role, "decrypt_scores")
diff --git a/tests/unit/test_decrypt_scores.py b/tests/unit/test_decrypt_scores.py
deleted file mode 100644
index 4461e21..0000000
--- a/tests/unit/test_decrypt_scores.py
+++ /dev/null
@@ -1,226 +0,0 @@
-"""
-Unit tests for decrypt_scores (including Top-K).
-
-Uses mock-based approach: since we cannot create real CiphertextScore blobs
-without running FHE scoring on an actual index from enVector Cloud, we mock
-cipher.decrypt_score() and CiphertextScore.ParseFromString() to test the Top-K
-and response format logic.
-"""
-import pytest
-import sys
-import os
-import json
-import base64
-import numpy as np
-from unittest.mock import MagicMock, patch
-
-# Add vault to path
-sys.path.insert(0, os.path.join(os.path.dirname(__file__), '../../vault'))
-
-# Import the implementation function (not the MCP-decorated version)
-from vault_core import _decrypt_scores_impl as decrypt_scores
-from token_store import token_store
-
-
-def _make_fake_blob() -> str:
-    """Create a fake base64-encoded blob (content doesn't matter since decrypt_score is mocked)."""
-    return base64.b64encode(b"fake_ciphertext_score_proto").decode("utf-8")
-
-
-def _mock_decrypt_score_flat(scores):
-    """Build a mock decrypt_score return value for FLAT index (single shard)."""
-    return {"score": [scores], "shard_idx": [0]}
-
-
-def _mock_decrypt_score_ivf(score_2d, shard_indices):
-    """Build a mock decrypt_score return value for IVF_FLAT index (multiple shards)."""
-    return {"score": score_2d, "shard_idx": shard_indices}
-
-
-class TestDecryptScores:
-
-    @pytest.fixture(autouse=True)
-    def reset_rate_limiter(self):
-        """Reset rate limiters before each test."""
-        token_store._rate_limiters.clear()
-
-    def _patch_cipher_and_proto(self, monkeypatch, scores_return):
-        """Helper to mock cipher, CiphertextScore, and CipherBlock."""
-        mock_cipher = MagicMock()
-        mock_cipher.decrypt_score.return_value = scores_return
-        monkeypatch.setattr('vault_core.cipher', mock_cipher)
-        monkeypatch.setattr('vault_core.sec_key_path', '/fake/SecKey.json')
-        monkeypatch.setattr('vault_core.CiphertextScore', MagicMock)
-        monkeypatch.setattr('vault_core.CipherBlock', MagicMock)
-
-    def test_decrypt_valid_scores_flat(self, monkeypatch):
-        """Valid encrypted scores (FLAT) should decrypt successfully."""
-        scores = np.random.rand(100).tolist()
-        blob = _make_fake_blob()
-
-        self._patch_cipher_and_proto(monkeypatch, _mock_decrypt_score_flat(scores))
-
-        result = decrypt_scores("evt_0000000000000000000000000000demo", blob, top_k=5)
-        data = json.loads(result)
-
-        assert isinstance(data, list)
-        assert len(data) == 5
-        for item in data:
-            assert "shard_idx" in item
-            assert "row_idx" in item
-            assert "score" in item
-
-    def test_decrypt_valid_scores_ivf(self, monkeypatch):
-        """Valid encrypted scores (IVF_FLAT) should decrypt successfully with shard mapping."""
-        shard0 = [0.1, 0.9, 0.3]
-        shard1 = [0.8, 0.2, 0.7]
-        blob = _make_fake_blob()
-
-        self._patch_cipher_and_proto(monkeypatch, _mock_decrypt_score_ivf(
-            [shard0, shard1], [5, 12]
-        ))
-
-        result = decrypt_scores("evt_0000000000000000000000000000demo", blob, top_k=3)
-        data = json.loads(result)
-
-        assert isinstance(data, list)
-        assert len(data) == 3
-        # Top 3: shard 5 row 1 (0.9), shard 12 row 0 (0.8), shard 12 row 2 (0.7)
-        assert data[0] == {"shard_idx": 5, "row_idx": 1, "score": 0.9}
-        assert data[1] == {"shard_idx": 12, "row_idx": 0, "score": 0.8}
-        assert data[2] == {"shard_idx": 12, "row_idx": 2, "score": 0.7}
-
-    def test_top_k_returns_correct_count(self, monkeypatch):
-        """Top-K should return exactly K results."""
-        scores = np.random.rand(50).tolist()
-        blob = _make_fake_blob()
-
-        self._patch_cipher_and_proto(monkeypatch, _mock_decrypt_score_flat(scores))
-
-        for k in [1, 2, 3, 5]:
-            result = decrypt_scores("evt_0000000000000000000000000000demo", blob, top_k=k)
-            data = json.loads(result)
-            assert isinstance(data, list)
-            assert len(data) == k, f"Expected {k} results, got {len(data)}"
-
-    def test_top_k_returns_highest_scores(self, monkeypatch):
-        """Top-K should return the highest scoring items."""
-        scores = [0.1, 0.9, 0.3, 0.8, 0.5]
-        blob = _make_fake_blob()
-
-        self._patch_cipher_and_proto(monkeypatch, _mock_decrypt_score_flat(scores))
-
-        result = decrypt_scores("evt_0000000000000000000000000000demo", blob, top_k=2)
-        data = json.loads(result)
-
-        assert isinstance(data, list)
-        assert len(data) == 2
-        returned_scores = [item["score"] for item in data]
-        assert returned_scores[0] == pytest.approx(0.9)
-        assert returned_scores[1] == pytest.approx(0.8)
-
-    def test_top_k_limit_enforced(self):
-        """Top-K exceeding role limit should be rejected."""
-        from token_store import TopKExceededError, token_store as ts
-
-        # Issue a member token (top_k=10) to test limit enforcement
-        tok = ts.add_token("topk-test-user", "member")
-        blob = _make_fake_blob()
-
-        with pytest.raises(TopKExceededError):
-            decrypt_scores(tok.token, blob, top_k=15)
-
-        ts.revoke_token("topk-test-user")
-
-    def test_invalid_token_rejected(self):
-        """Invalid token should raise an authentication error."""
-        from token_store import TokenNotFoundError
-        blob = _make_fake_blob()
-
-        with pytest.raises(TokenNotFoundError):
-            decrypt_scores("invalid-token", blob, top_k=5)
-
-    def test_malformed_blob_returns_error(self):
-        """Malformed encrypted blob should return error."""
-
-        result = decrypt_scores("evt_0000000000000000000000000000demo", "not-valid-base64!!!", top_k=5)
-        data = json.loads(result)
-
-        assert "error" in data
-
-    def test_empty_blob_returns_empty_or_error(self):
-        """Empty blob should return error or empty result list."""
-        result = decrypt_scores("evt_0000000000000000000000000000demo", "", top_k=5)
-        data = json.loads(result)
-
-        # Empty base64 decodes to b"", which produces an empty protobuf
-        # with no scores — either an error dict or an empty list is acceptable
-        assert isinstance(data, (dict, list))
-
-    def test_result_format_correct(self, monkeypatch):
-        """Result should have correct format: [{shard_idx, row_idx, score}, ...]."""
-        scores = np.random.rand(20).tolist()
-        blob = _make_fake_blob()
-
-        self._patch_cipher_and_proto(monkeypatch, _mock_decrypt_score_flat(scores))
-
-        result = decrypt_scores("evt_0000000000000000000000000000demo", blob, top_k=5)
-        data = json.loads(result)
-
-        assert isinstance(data, list)
-        for item in data:
-            assert "shard_idx" in item
-            assert "row_idx" in item
-            assert "score" in item
-            assert isinstance(item["shard_idx"], int)
-            assert isinstance(item["row_idx"], int)
-            assert isinstance(item["score"], (int, float))
-
-    def test_scores_sorted_descending(self, monkeypatch):
-        """Returned scores should be sorted in descending order."""
-        scores = np.random.rand(30).tolist()
-        blob = _make_fake_blob()
-
-        self._patch_cipher_and_proto(monkeypatch, _mock_decrypt_score_flat(scores))
-
-        result = decrypt_scores("evt_0000000000000000000000000000demo", blob, top_k=5)
-        data = json.loads(result)
-
-        assert isinstance(data, list) and len(data) > 1
-        returned_scores = [item["score"] for item in data]
-        for i in range(len(returned_scores) - 1):
-            assert returned_scores[i] >= returned_scores[i + 1], "Scores not sorted descending"
-
-    def test_default_top_k_is_5(self, monkeypatch):
-        """Default top_k should be 5."""
-        scores = np.random.rand(50).tolist()
-        blob = _make_fake_blob()
-
-        self._patch_cipher_and_proto(monkeypatch, _mock_decrypt_score_flat(scores))
-
-        result = decrypt_scores("evt_0000000000000000000000000000demo", blob)
-        data = json.loads(result)
-
-        assert isinstance(data, list)
-        assert len(data) == 5, "Default top_k should be 5"
-
-    def test_ivf_topk_cross_shard(self, monkeypatch):
-        """Top-K across multiple IVF shards should pick globally highest scores."""
-        shard0 = [0.1, 0.5, 0.3]
-        shard1 = [0.9, 0.2, 0.8]
-        shard2 = [0.4, 0.6, 0.7]
-        blob = _make_fake_blob()
-
-        self._patch_cipher_and_proto(monkeypatch, _mock_decrypt_score_ivf(
-            [shard0, shard1, shard2], [10, 20, 30]
-        ))
-
-        result = decrypt_scores("evt_0000000000000000000000000000demo", blob, top_k=4)
-        data = json.loads(result)
-
-        assert len(data) == 4
-        # Expected top-4: shard20 row0 (0.9), shard20 row2 (0.8), shard30 row2 (0.7), shard30 row1 (0.6)
-        assert data[0] == {"shard_idx": 20, "row_idx": 0, "score": 0.9}
-        assert data[1] == {"shard_idx": 20, "row_idx": 2, "score": 0.8}
-        assert data[2] == {"shard_idx": 30, "row_idx": 2, "score": 0.7}
-        assert data[3] == {"shard_idx": 30, "row_idx": 1, "score": 0.6}
diff --git a/tests/unit/test_metadata_dek.py b/tests/unit/test_metadata_dek.py
deleted file mode 100644
index 47039af..0000000
--- a/tests/unit/test_metadata_dek.py
+++ /dev/null
@@ -1,164 +0,0 @@
-"""
-Unit tests for per-agent metadata DEK derivation and decrypt_metadata.
-
-Uses mock-based approach: aes_decrypt_metadata is mocked to test the
-envelope parsing and per-agent HKDF key derivation without requiring
-real FHE keys.
-"""
-import pytest
-import sys
-import os
-import json
-from unittest.mock import MagicMock
-
-# Add vault to path
-sys.path.insert(0, os.path.join(os.path.dirname(__file__), '../../vault'))
-
-from vault_core import (
-    derive_agent_key,
-    _decrypt_metadata_impl as decrypt_metadata,
-)
-import vault_core
-from token_store import token_store
-
-VALID_TOKEN = "evt_0000000000000000000000000000demo"
-FAKE_TEAM_SECRET = "evt_fake-team-secret-for-testing-purposes-only"
-
-
-# =============================================================================
-# derive_agent_key tests
-# =============================================================================
-class TestDeriveAgentKey:
-
-    def test_deterministic(self):
-        """Same inputs must produce the same DEK."""
-        dek1 = derive_agent_key("my-team-secret", "agent-abc")
-        dek2 = derive_agent_key("my-team-secret", "agent-abc")
-        assert dek1 == dek2
-
-    def test_different_agent_id_different_dek(self):
-        """Different agent_id must produce different DEKs."""
-        dek_a = derive_agent_key("my-team-secret", "agent-aaa")
-        dek_b = derive_agent_key("my-team-secret", "agent-bbb")
-        assert dek_a != dek_b
-
-    def test_output_is_32_bytes(self):
-        """DEK must be exactly 32 bytes (AES-256)."""
-        dek = derive_agent_key("some-secret", "any-agent")
-        assert isinstance(dek, bytes)
-        assert len(dek) == 32
-
-    def test_different_team_secret_different_dek(self):
-        """Different team secrets must produce different DEKs for the same agent."""
-        dek1 = derive_agent_key("secret-1", "agent-x")
-        dek2 = derive_agent_key("secret-2", "agent-x")
-        assert dek1 != dek2
-
-
-# =============================================================================
-# _decrypt_metadata_impl tests
-# =============================================================================
-class TestDecryptMetadataImpl:
-
-    @pytest.fixture(autouse=True)
-    def reset_state(self):
-        """Reset rate limiters before each test."""
-        token_store._rate_limiters.clear()
-
-    def _make_envelope(self, agent_id: str, ciphertext_b64: str) -> str:
-        """Build a JSON envelope string."""
-        return json.dumps({"a": agent_id, "c": ciphertext_b64})
-
-    def test_per_agent_envelope_decryption(self, monkeypatch):
-        """Per-agent JSON envelope should be parsed and decrypted with derived DEK."""
-        monkeypatch.setattr('vault_core.VAULT_TEAM_SECRET', FAKE_TEAM_SECRET)
-
-        expected_dek = derive_agent_key(FAKE_TEAM_SECRET, "agent123")
-        mock_decrypt = MagicMock(return_value=b'{"text": "hello"}')
-        monkeypatch.setattr('vault_core.aes_decrypt_metadata', mock_decrypt)
-
-        envelope = self._make_envelope("agent123", "Y2lwaGVydGV4dA==")
-        result = decrypt_metadata(VALID_TOKEN, [envelope])
-        data = json.loads(result)
-
-        assert isinstance(data, list)
-        assert len(data) == 1
-        assert data[0] == '{"text": "hello"}'
-
-        # Verify aes_decrypt_metadata was called with the ciphertext and derived DEK
-        mock_decrypt.assert_called_once_with("Y2lwaGVydGV4dA==", expected_dek)
-
-    def test_missing_team_secret_returns_error(self, monkeypatch):
-        """Missing VAULT_TEAM_SECRET should return error."""
-        monkeypatch.setattr('vault_core.VAULT_TEAM_SECRET', '')
-
-        result = decrypt_metadata(VALID_TOKEN, ["anything"])
-        data = json.loads(result)
-
-        assert "error" in data
-        assert "VAULT_TEAM_SECRET not configured" in data["error"]
-
-    def test_invalid_token_rejected(self):
-        """Invalid token should raise an authentication error."""
-        from token_store import TokenNotFoundError
-        with pytest.raises(TokenNotFoundError):
-            decrypt_metadata("bad-token", ["anything"])
-
-    def test_invalid_envelope_returns_error(self, monkeypatch):
-        """Non-JSON envelope should return a decryption error."""
-        monkeypatch.setattr('vault_core.VAULT_TEAM_SECRET', FAKE_TEAM_SECRET)
-
-        result = decrypt_metadata(VALID_TOKEN, ["not-valid-json"])
-        data = json.loads(result)
-
-        assert "error" in data
-
-    def test_missing_key_in_envelope_returns_error(self, monkeypatch):
-        """JSON without 'a' or 'c' key should return a decryption error."""
-        monkeypatch.setattr('vault_core.VAULT_TEAM_SECRET', FAKE_TEAM_SECRET)
-
-        bad_envelope = json.dumps({"x": "y"})
-        result = decrypt_metadata(VALID_TOKEN, [bad_envelope])
-        data = json.loads(result)
-
-        assert "error" in data
-
-    def test_decryption_error_returns_error(self, monkeypatch):
-        """If aes_decrypt_metadata raises, should return error JSON."""
-        monkeypatch.setattr('vault_core.VAULT_TEAM_SECRET', FAKE_TEAM_SECRET)
-
-        mock_decrypt = MagicMock(side_effect=Exception("decrypt boom"))
-        monkeypatch.setattr('vault_core.aes_decrypt_metadata', mock_decrypt)
-
-        envelope = self._make_envelope("agent1", "ct_data")
-        result = decrypt_metadata(VALID_TOKEN, [envelope])
-        data = json.loads(result)
-
-        assert "error" in data
-        assert "decrypt boom" in data["error"]
-
-    def test_multiple_envelopes(self, monkeypatch):
-        """Multiple envelopes with different agent_ids should each derive correct DEK."""
-        monkeypatch.setattr('vault_core.VAULT_TEAM_SECRET', FAKE_TEAM_SECRET)
-
-        dek_a = derive_agent_key(FAKE_TEAM_SECRET, "agentA")
-        dek_b = derive_agent_key(FAKE_TEAM_SECRET, "agentB")
-
-        def side_effect(ct, key):
-            if key == dek_a:
-                return b'result-a'
-            if key == dek_b:
-                return b'result-b'
-            return b'unknown'
-
-        mock_decrypt = MagicMock(side_effect=side_effect)
-        monkeypatch.setattr('vault_core.aes_decrypt_metadata', mock_decrypt)
-
-        env_a = self._make_envelope("agentA", "ct_a")
-        env_b = self._make_envelope("agentB", "ct_b")
-        result = decrypt_metadata(VALID_TOKEN, [env_a, env_b])
-        data = json.loads(result)
-
-        assert len(data) == 2
-        assert data[0] == "result-a"
-        assert data[1] == "result-b"
diff --git a/tests/unit/test_protovalidate.py b/tests/unit/test_protovalidate.py
deleted file mode 100644
index 48d2e4d..0000000
--- a/tests/unit/test_protovalidate.py
+++ /dev/null
@@ -1,141 +0,0 @@
-"""
-Integration tests for protovalidate with real proto message descriptors.
-
-Verifies that .proto annotation constraints are correctly enforced
-at the schema level via protovalidate.
-"""
-import pytest
-import sys
-import os
-
-sys.path.insert(0, os.path.join(os.path.dirname(__file__), '../../vault'))
-sys.path.insert(0, os.path.join(os.path.dirname(__file__), '../../vault/proto'))
-
-protovalidate = pytest.importorskip("protovalidate")
-pb2 = pytest.importorskip("vault_service_pb2")
-
-# Valid token: evt_ (4) + 32 hex = 36 chars
-VALID_TOKEN = "evt_a1b2c3d4e5f6a1b2c3d4e5f6a1b2c3d4"
-
-
-@pytest.fixture
-def validator():
-    return protovalidate.Validator()
-
-
-# ---------------------------------------------------------------------------
-# GetPublicKey
-# ---------------------------------------------------------------------------
-
-class TestGetPublicKeyProto:
-    def test_valid(self, validator):
-        validator.validate(pb2.GetPublicKeyRequest(token=VALID_TOKEN))
-
-    def test_empty_token_rejected(self, validator):
-        with pytest.raises(protovalidate.ValidationError):
-            validator.validate(pb2.GetPublicKeyRequest(token=""))
-
-    def test_short_token_rejected(self, validator):
-        with pytest.raises(protovalidate.ValidationError):
-            validator.validate(pb2.GetPublicKeyRequest(token="evt_short"))
-
-    def test_token_exceeds_max_length(self, validator):
-        with pytest.raises(protovalidate.ValidationError):
-            validator.validate(pb2.GetPublicKeyRequest(token="a" * 37))
-
-
-# ---------------------------------------------------------------------------
-# DecryptScores
-# ---------------------------------------------------------------------------
-
-class TestDecryptScoresProto:
-    def test_valid(self, validator):
-        req = pb2.DecryptScoresRequest(
-            token=VALID_TOKEN, encrypted_blob_b64="AQID", top_k=5
-        )
-        validator.validate(req)
-
-    def test_top_k_zero_rejected(self, validator):
-        """Proto3 int32 default is 0 — must be rejected."""
-        req = pb2.DecryptScoresRequest(
-            token=VALID_TOKEN, encrypted_blob_b64="AQID", top_k=0
-        )
-        with pytest.raises(protovalidate.ValidationError):
-            validator.validate(req)
-
-    def test_top_k_negative_rejected(self, validator):
-        req = pb2.DecryptScoresRequest(
-            token=VALID_TOKEN, encrypted_blob_b64="AQID", top_k=-1
-        )
-        with pytest.raises(protovalidate.ValidationError):
-            validator.validate(req)
-
-    def test_top_k_exceeds_global_max(self, validator):
-        req = pb2.DecryptScoresRequest(
-            token=VALID_TOKEN, encrypted_blob_b64="AQID", top_k=301
-        )
-        with pytest.raises(protovalidate.ValidationError):
-            validator.validate(req)
-
-    def test_top_k_at_boundary_one(self, validator):
-        req = pb2.DecryptScoresRequest(
-            token=VALID_TOKEN, encrypted_blob_b64="a", top_k=1
-        )
-        validator.validate(req)
-
-    def test_top_k_at_boundary_max(self, validator):
-        req = pb2.DecryptScoresRequest(
-            token=VALID_TOKEN, encrypted_blob_b64="a", top_k=300
-        )
-        validator.validate(req)
-
-    def test_empty_blob_rejected(self, validator):
-        req = pb2.DecryptScoresRequest(
-            token=VALID_TOKEN, encrypted_blob_b64="", top_k=5
-        )
-        with pytest.raises(protovalidate.ValidationError):
-            validator.validate(req)
-
-    def test_empty_token_rejected(self, validator):
-        req = pb2.DecryptScoresRequest(
-            token="", encrypted_blob_b64="a", top_k=5
-        )
-        with pytest.raises(protovalidate.ValidationError):
-            validator.validate(req)
-
-
-# ---------------------------------------------------------------------------
-# DecryptMetadata
-# ---------------------------------------------------------------------------
-
-class TestDecryptMetadataProto:
-    def test_valid(self, validator):
-        req = pb2.DecryptMetadataRequest(
-            token=VALID_TOKEN, encrypted_metadata_list=["blob1", "blob2"]
-        )
-        validator.validate(req)
-
-    def test_empty_list_rejected(self, validator):
-        req = pb2.DecryptMetadataRequest(token=VALID_TOKEN)
-        with pytest.raises(protovalidate.ValidationError):
-            validator.validate(req)
-
-    def test_empty_item_rejected(self, validator):
-        req = pb2.DecryptMetadataRequest(
-            token=VALID_TOKEN, encrypted_metadata_list=["valid", ""]
-        )
-        with pytest.raises(protovalidate.ValidationError):
-            validator.validate(req)
-
-    def test_too_many_items_rejected(self, validator):
-        req = pb2.DecryptMetadataRequest(
-            token=VALID_TOKEN, encrypted_metadata_list=["x"] * 1001
-        )
-        with pytest.raises(protovalidate.ValidationError):
-            validator.validate(req)
-
-    def test_max_items_passes(self, validator):
-        req = pb2.DecryptMetadataRequest(
-            token=VALID_TOKEN, encrypted_metadata_list=["x"] * 1000
-        )
-        validator.validate(req)
diff --git a/tests/unit/test_public_key.py b/tests/unit/test_public_key.py
deleted file mode 100644
index 2b309b8..0000000
--- a/tests/unit/test_public_key.py
+++ /dev/null
@@ -1,96 +0,0 @@
-"""
-Unit tests for get_public_key.
-"""
-import pytest
-import sys
-import os
-import json
-import tempfile
-import shutil
-
-# Add vault to path
-sys.path.insert(0, os.path.join(os.path.dirname(__file__), '../../vault'))
-
-# Import the implementation function
-from vault_core import _get_public_key_impl as get_public_key
-import vault_core
-from token_store import token_store
-from pyenvector.crypto import KeyGenerator
-
-FAKE_TEAM_SECRET = "evt_fake-team-secret-for-testing-purposes-only"
-
-
-class TestGetPublicKey:
-
-    @pytest.fixture(autouse=True)
-    def reset_rate_limiter(self):
-        """Reset rate limiters before each test."""
-        token_store._rate_limiters.clear()
-
-    @pytest.fixture(scope="class")
-    def test_keys(self):
-        """Generate test keys."""
-        temp_dir = tempfile.mkdtemp(prefix="test_pubkey_")
-        keygen = KeyGenerator(key_path=temp_dir, key_id="test-pubkey", dim_list=[1024], metadata_encryption=False)
-        keygen.generate_keys()
-
-        yield temp_dir
-        shutil.rmtree(temp_dir, ignore_errors=True)
-
-    @pytest.fixture(autouse=True)
-    def patch_vault_paths(self, test_keys, monkeypatch):
-        """Patch vault paths to point to test-generated keys."""
-        monkeypatch.setattr('vault_core.KEY_SUBDIR', test_keys)
-        monkeypatch.setattr('vault_core.VAULT_TEAM_SECRET', FAKE_TEAM_SECRET)
-
-    def test_valid_token_returns_bundle(self, test_keys):
-        """Valid token should return public key bundle."""
-        result = get_public_key("evt_0000000000000000000000000000demo")
-
-        # Should be valid JSON
-        bundle = json.loads(result)
-
-        # Should contain public keys
-        assert "EncKey.json" in bundle
-        assert "EvalKey.json" in bundle
-
-        # Should NOT contain secret keys
-        assert "SecKey.json" not in bundle
-        assert "MetadataKey.json" not in bundle
-
-    def test_invalid_token_raises_error(self, test_keys):
-        """Invalid token should raise an authentication error."""
-        from token_store import TokenNotFoundError
-        with pytest.raises(TokenNotFoundError):
-            get_public_key("invalid-token")
-
-    def test_bundle_contains_agent_id_and_dek(self, test_keys):
-        """Bundle should contain per-user agent_id and agent_dek."""
-        result = get_public_key("evt_0000000000000000000000000000demo")
-        bundle = json.loads(result)
-
-        assert "agent_id" in bundle
-        assert "agent_dek" in bundle
-        assert len(bundle["agent_id"]) == 32  # SHA256 hex[:32]
-
-    def test_bundle_contains_envector_credentials(self, test_keys, monkeypatch):
-        """Bundle should contain enVector endpoint and API key when configured."""
-        monkeypatch.setattr('vault_core.ENVECTOR_ENDPOINT', 'cluster-test.envector.io')
-        monkeypatch.setattr('vault_core.ENVECTOR_API_KEY', 'test-api-key-abc123')
-
-        result = get_public_key("evt_0000000000000000000000000000demo")
-        bundle = json.loads(result)
-
-        assert bundle["envector_endpoint"] == "cluster-test.envector.io"
-        assert bundle["envector_api_key"] == "test-api-key-abc123"
-
-    def test_bundle_envector_empty_when_not_configured(self, test_keys, monkeypatch):
-        """Bundle should have null enVector fields when not configured on Vault."""
-        monkeypatch.setattr('vault_core.ENVECTOR_ENDPOINT', None)
-        monkeypatch.setattr('vault_core.ENVECTOR_API_KEY', None)
-
-        result = get_public_key("evt_0000000000000000000000000000demo")
-        bundle = json.loads(result)
-
-        assert bundle.get("envector_endpoint") is None
-        assert bundle.get("envector_api_key") is None
diff --git a/tests/unit/test_request_validator.py b/tests/unit/test_request_validator.py
deleted file mode 100644
index eba1140..0000000
--- a/tests/unit/test_request_validator.py
+++ /dev/null
@@ -1,101 +0,0 @@
-"""
-Unit tests for gRPC request input validation rules.
-
-Tests both protovalidate (proto-level) and runtime checks.
-Proto-level tests use fake request objects to exercise the same
-validation functions without requiring the real pb2 module.
-"""
-import pytest
-import sys
-import os
-from types import ModuleType
-
-# Mock protovalidate before importing request_validator
-_pv = ModuleType("protovalidate")
-_pv.Validator = type("Validator", (), {"validate": lambda self, req: None})
-class _ValidationError(Exception):
-    def __init__(self, violations=None):
-        self.violations = violations or []
-        super().__init__("validation error")
-_pv.ValidationError = _ValidationError
-sys.modules.setdefault("protovalidate", _pv)
-
-sys.path.insert(0, os.path.join(os.path.dirname(__file__), '../../vault'))
-
-from request_validator import (
-    RuntimeValidationError,
-    check_token_safety,
-    validate_index_name,
-    MAX_INDEX_NAME_LENGTH,
-)
-
-
-# ---------------------------------------------------------------------------
-# Token safety (runtime layer — control chars & whitespace)
-# ---------------------------------------------------------------------------
-
-class TestTokenSafety:
-    def test_valid_token(self):
-        check_token_safety("abc123-valid")
-
-    def test_null_byte_rejected(self):
-        with pytest.raises(RuntimeValidationError, match="control characters"):
-            check_token_safety("token\x00evil")
-
-    def test_control_char_rejected(self):
-        with pytest.raises(RuntimeValidationError, match="control characters"):
-            check_token_safety("token\x01")
-
-    def test_tab_rejected(self):
-        with pytest.raises(RuntimeValidationError, match="control characters"):
-            check_token_safety("token\t")
-
-    def test_newline_rejected(self):
-        with pytest.raises(RuntimeValidationError, match="control characters"):
-            check_token_safety("token\n")
-
-    def test_del_char_rejected(self):
-        with pytest.raises(RuntimeValidationError, match="control characters"):
-            check_token_safety("token\x7f")
-
-    def test_leading_whitespace_rejected(self):
-        with pytest.raises(RuntimeValidationError, match="whitespace"):
-            check_token_safety(" token")
-
-    def test_trailing_whitespace_rejected(self):
-        with pytest.raises(RuntimeValidationError, match="whitespace"):
-            check_token_safety("token ")
-
-
-# ---------------------------------------------------------------------------
-# Index name validation (runtime layer — path traversal prevention)
-# ---------------------------------------------------------------------------
-
-class TestIndexName:
-    def test_valid_names(self):
-        for name in ["my_index", "index-1", "ABC123", "a"]:
-            validate_index_name(name)
-
-    def test_empty_rejected(self):
-        with pytest.raises(RuntimeValidationError, match="empty"):
-            validate_index_name("")
-
-    def test_too_long_rejected(self):
-        with pytest.raises(RuntimeValidationError, match="exceeds"):
-            validate_index_name("a" * (MAX_INDEX_NAME_LENGTH + 1))
-
-    def test_path_traversal_rejected(self):
-        with pytest.raises(RuntimeValidationError, match="alphanumeric"):
-            validate_index_name("../../etc/passwd")
-
-    def test_slash_rejected(self):
-        with pytest.raises(RuntimeValidationError, match="alphanumeric"):
-            validate_index_name("foo/bar")
-
-    def test_space_rejected(self):
-        with pytest.raises(RuntimeValidationError, match="alphanumeric"):
-            validate_index_name("foo bar")
-
-    def test_special_chars_rejected(self):
-        with pytest.raises(RuntimeValidationError, match="alphanumeric"):
-            validate_index_name("index;DROP TABLE")
diff --git a/tests/unit/test_token_store.py b/tests/unit/test_token_store.py
deleted file mode 100644
index 89c698c..0000000
--- a/tests/unit/test_token_store.py
+++ /dev/null
@@ -1,316 +0,0 @@
-"""
-Unit tests for TokenStore: per-user token management, role CRUD, persistence.
-"""
-import copy
-import datetime
-import os
-import sys
-import tempfile
-
-import pytest
-
-sys.path.insert(0, os.path.join(os.path.dirname(__file__), '../../vault'))
-
-from token_store import (
-    TokenStore, Role, Token, RateLimiter,
-    TokenNotFoundError, TokenExpiredError, RateLimitError,
-    TopKExceededError, ScopeError,
-)
-
-
-class TestTokenStore:
-    """Test token lifecycle: add, validate, revoke, expiry, rate limit."""
-
-    def setup_method(self):
-        self.store = TokenStore()
-        self.store._roles = {
-            "admin": Role("admin", ["get_public_key", "decrypt_scores", "decrypt_metadata", "manage_tokens"], 50, "150/60s"),
-            "member": Role("member", ["get_public_key", "decrypt_scores", "decrypt_metadata"], 10, "30/60s"),
-        }
-
-    def test_add_and_validate_token(self):
-        tok = self.store.add_token("alice", "member", expires_days=90)
-        assert tok.user == "alice"
-        assert tok.token.startswith("evt_")
-        assert tok.role == "member"
-
-        username, role = self.store.validate(tok.token)
-        assert username == "alice"
-        assert role.name == "member"
-
-    def test_invalid_token_raises(self):
-        with pytest.raises(TokenNotFoundError):
-            self.store.validate("nonexistent_token")
-
-    def test_expired_token_raises(self):
-        tok = self.store.add_token("bob", "member", expires_days=1)
-        # Manually expire the token
-        tok.expires = (datetime.date.today() - datetime.timedelta(days=1)).isoformat()
-        with pytest.raises(TokenExpiredError, match="bob"):
-            self.store.validate(tok.token)
-
-    def test_revoke_token(self):
-        tok = self.store.add_token("charlie", "member")
-        assert self.store.revoke_token("charlie") is True
-        with pytest.raises(TokenNotFoundError):
-            self.store.validate(tok.token)
-
-    def test_revoke_nonexistent_returns_false(self):
-        assert self.store.revoke_token("nobody") is False
-
-    def test_duplicate_user_rejected(self):
-        self.store.add_token("alice", "member")
-        with pytest.raises(ValueError, match="already exists"):
-            self.store.add_token("alice", "member")
-
-    def test_invalid_role_rejected(self):
-        with pytest.raises(ValueError, match="does not exist"):
-            self.store.add_token("alice", "nonexistent_role")
-
-    def test_list_tokens_hides_values(self):
-        self.store.add_token("alice", "member", expires_days=30)
-        result = self.store.list_tokens()
-        assert len(result) == 1
-        assert result[0]["user"] == "alice"
-        # Token value should not be in list output
-        assert "token" not in result[0]
-
-    def test_rate_limiting_per_user(self):
-        """Rate limiting should use per-role limits keyed by username."""
-        # Member role: 30/60s — use a custom role with low limit for test
-        self.store.add_role("limited", ["get_public_key"], 5, "2/60s")
-        tok = self.store.add_token("ratelimited_user", "limited")
-
-        self.store.validate(tok.token)
-        self.store.validate(tok.token)
-        with pytest.raises(RateLimitError):
-            self.store.validate(tok.token)
-
-    def test_top_k_from_role(self):
-        tok = self.store.add_token("alice", "member")
-        _, role = self.store.validate(tok.token)
-        assert role.top_k == 10  # member default
-
-    def test_never_expires_token(self):
-        tok = self.store.add_token("permanent_user", "admin")
-        assert tok.expires is None
-        assert tok.is_expired is False
-        # Should validate fine
-        username, _ = self.store.validate(tok.token)
-        assert username == "permanent_user"
-
-    def test_legacy_env_loading(self):
-        store = TokenStore()
-        store.load_legacy_env("token_a,token_b")
-        # Should have 2 tokens with admin role
-        u1, r1 = store.validate("token_a")
-        assert u1 == "legacy_0"
-        assert r1.name == "admin"
-        u2, _ = store.validate("token_b")
-        assert u2 == "legacy_1"
-
-    def test_persist_and_reload(self):
-        """Tokens and roles should survive persist → reload cycle."""
-        with tempfile.TemporaryDirectory() as tmpdir:
-            roles_path = os.path.join(tmpdir, "roles.yml")
-            tokens_path = os.path.join(tmpdir, "tokens.yml")
-
-            # Store 1: add data and persist
-            store1 = TokenStore()
-            store1.load_from_files(roles_path, tokens_path)
-            store1.add_role("researcher", ["get_public_key", "decrypt_scores"], 3, "10/60s")
-            tok = store1.add_token("alice", "member", expires_days=90)
-
-            # Wait for async persist
-            store1._persist_executor.shutdown(wait=True)
-
-            # Store 2: reload from files
-            store2 = TokenStore()
-            store2.load_from_files(roles_path, tokens_path)
-
-            # Validate alice's token works
-            username, role = store2.validate(tok.token)
-            assert username == "alice"
-            assert role.name == "member"
-
-            # Validate custom role exists
-            roles = store2.list_roles()
-            role_names = [r["name"] for r in roles]
-            assert "researcher" in role_names
-
-
-class TestTokenRotation:
-    """Test token rotation: single user and batch."""
-
-    def setup_method(self):
-        self.store = TokenStore()
-        self.store._roles = {
-            "admin": Role("admin", ["get_public_key", "decrypt_scores", "decrypt_metadata", "manage_tokens"], 50, "150/60s"),
-            "member": Role("member", ["get_public_key", "decrypt_scores", "decrypt_metadata"], 10, "30/60s"),
-        }
-
-    def test_rotate_token(self):
-        old_tok = self.store.add_token("alice", "member")
-        new_tok = self.store.rotate_token("alice")
-        assert new_tok.user == "alice"
-        assert new_tok.role == "member"
-        assert new_tok.token.startswith("evt_")
-        assert new_tok.token != old_tok.token
-
-    def test_rotate_preserves_expiry(self):
-        old_tok = self.store.add_token("alice", "member", expires_days=90)
-        new_tok = self.store.rotate_token("alice")
-        assert new_tok.expires is not None
-        # New expiry should be ~90 days from today
-        new_expires = datetime.date.fromisoformat(new_tok.expires)
-        expected = datetime.date.today() + datetime.timedelta(days=90)
-        assert new_expires == expected
-
-    def test_rotate_invalidates_old_token(self):
-        old_tok = self.store.add_token("alice", "member")
-        self.store.rotate_token("alice")
-        with pytest.raises(TokenNotFoundError):
-            self.store.validate(old_tok.token)
-
-    def test_rotate_new_token_validates(self):
-        self.store.add_token("alice", "member")
-        new_tok = self.store.rotate_token("alice")
-        username, role = self.store.validate(new_tok.token)
-        assert username == "alice"
-        assert role.name == "member"
-
-    def test_rotate_nonexistent_user_raises(self):
-        with pytest.raises(ValueError, match="No token found"):
-            self.store.rotate_token("nobody")
-
-    def test_rotate_all(self):
-        tok_a = self.store.add_token("alice", "member")
-        tok_b = self.store.add_token("bob", "admin")
-        results = self.store.rotate_all_tokens()
-        assert len(results) == 2
-        users = {t.user for t in results}
-        assert users == {"alice", "bob"}
-        # Old tokens should be invalid
-        with pytest.raises(TokenNotFoundError):
-            self.store.validate(tok_a.token)
-        with pytest.raises(TokenNotFoundError):
-            self.store.validate(tok_b.token)
-
-    def test_rotate_persists(self):
-        """Rotated token should survive persist → reload cycle."""
-        with tempfile.TemporaryDirectory() as tmpdir:
-            roles_path = os.path.join(tmpdir, "roles.yml")
-            tokens_path = os.path.join(tmpdir, "tokens.yml")
-
-            store1 = TokenStore()
-            store1.load_from_files(roles_path, tokens_path)
-            store1.add_token("alice", "member", expires_days=30)
-            new_tok = store1.rotate_token("alice")
-            store1._persist_executor.shutdown(wait=True)
-
-            store2 = TokenStore()
-            store2.load_from_files(roles_path, tokens_path)
-            username, role = store2.validate(new_tok.token)
-            assert username == "alice"
-            assert role.name == "member"
-
-
-class TestRoleCRUD:
-    """Test role create, update, delete, list operations."""
-
-    def setup_method(self):
-        self.store = TokenStore()
-        self.store._roles = {
-            "admin": Role("admin", ["get_public_key", "decrypt_scores", "decrypt_metadata", "manage_tokens"], 50, "150/60s"),
-            "member": Role("member", ["get_public_key", "decrypt_scores", "decrypt_metadata"], 10, "30/60s"),
-        }
-
-    def test_create_role(self):
-        role = self.store.add_role(
-            "researcher", ["get_public_key", "decrypt_scores"], 3, "10/60s"
-        )
-        assert role.name == "researcher"
-        assert role.top_k == 3
-        assert "get_public_key" in role.scope
-
-    def test_create_duplicate_role_rejected(self):
-        with pytest.raises(ValueError, match="already exists"):
-            self.store.add_role("admin", ["get_public_key"], 5, "30/60s")
-
-    def test_update_role(self):
-        role = self.store.update_role("member", top_k=8)
-        assert role.top_k == 8
-        assert role.name == "member"
-
-    def test_update_nonexistent_role_rejected(self):
-        with pytest.raises(ValueError, match="does not exist"):
-            self.store.update_role("nonexistent", top_k=5)
-
-    def test_delete_custom_role(self):
-        self.store.add_role("temp", ["get_public_key"], 1, "5/60s")
-        self.store.delete_role("temp")
-        roles = self.store.list_roles()
-        assert "temp" not in [r["name"] for r in roles]
-
-    def test_delete_default_role_rejected(self):
-        with pytest.raises(ValueError, match="Cannot delete default"):
-            self.store.delete_role("admin")
-        with pytest.raises(ValueError, match="Cannot delete default"):
-            self.store.delete_role("member")
-
-    def test_delete_role_with_active_tokens_rejected(self):
-        self.store.add_role("temp", ["get_public_key"], 1, "5/60s")
-        self.store.add_token("user1", "temp")
-        with pytest.raises(ValueError, match="token for user"):
-            self.store.delete_role("temp")
-
-    def test_list_roles(self):
-        roles = self.store.list_roles()
-        assert len(roles) >= 2
-        names = [r["name"] for r in roles]
-        assert "admin" in names
-        assert "member" in names
-
-    def test_update_role_clears_rate_limiters(self):
-        """Changing a role's rate_limit should reset affected rate limiters."""
-        tok = self.store.add_token("alice", "member")
-        # Validate to create rate limiter
-        self.store.validate(tok.token)
-        assert "alice" in self.store._rate_limiters
-
-        # Update role
-        self.store.update_role("member", rate_limit="100/60s")
-        assert "alice" not in self.store._rate_limiters
-
-    def test_role_rate_limit_parsed(self):
-        role = Role("test", [], 5, "30/60s")
-        max_req, window = role.rate_limit_parsed
-        assert max_req == 30
-        assert window == 60
-
-
-class TestScopeCheck:
-    """Test scope enforcement."""
-
-    def test_scope_allows_valid_method(self):
-        store = TokenStore()
-        role = Role("member", ["get_public_key", "decrypt_scores"], 5, "30/60s")
-        store.check_scope(role, "get_public_key")  # Should not raise
-
-    def test_scope_rejects_invalid_method(self):
-        store = TokenStore()
-        role = Role("limited", ["get_public_key"], 5, "30/60s")
-        with pytest.raises(ScopeError, match="decrypt_scores"):
-            store.check_scope(role, "decrypt_scores")
-
-
-class TestTopKExceeded:
-    """Test TopKExceededError."""
-
-    def test_top_k_exceeded_message(self):
-        err = TopKExceededError(15, 10, "admin")
-        assert "15" in str(err)
-        assert "10" in str(err)
-        assert "admin" in str(err)
-        assert err.requested == 15
-        assert err.max_top_k == 10
diff --git a/tests/unit/test_validation_interceptor.py b/tests/unit/test_validation_interceptor.py
deleted file mode 100644
index ce33a9f..0000000
--- a/tests/unit/test_validation_interceptor.py
+++ /dev/null
@@ -1,196 +0,0 @@
-"""
-Unit tests for the gRPC ValidationInterceptor.
-
-Tests the interceptor wiring using mock objects — no real gRPC server needed.
-grpc and protovalidate are mocked to avoid heavy runtime dependencies.
-"""
-import pytest
-import sys
-import os
-from unittest.mock import MagicMock, patch, PropertyMock
-from types import ModuleType
-
-# ---------------------------------------------------------------------------
-# Mock heavy dependencies before importing vault modules
-# ---------------------------------------------------------------------------
-
-_grpc_mock = ModuleType("grpc")
-_grpc_mock.ServerInterceptor = type("ServerInterceptor", (), {})
-_grpc_mock.StatusCode = type("StatusCode", (), {
-    "INVALID_ARGUMENT": "INVALID_ARGUMENT",
-})()
-_grpc_mock.unary_unary_rpc_method_handler = lambda handler, **kw: MagicMock(
-    unary_unary=handler
-)
-sys.modules.setdefault("grpc", _grpc_mock)
-
-# Force-mock protovalidate regardless of prior imports — prevents test
-# isolation failures when the full suite loads the real module first.
-_protovalidate_mock = ModuleType("protovalidate")
-
-
-class _ValidationError(Exception):
-    def __init__(self, msg="validation error", violations=None):
-        self.violations = violations or []
-        super().__init__(msg)
-
-
-_protovalidate_mock.ValidationError = _ValidationError
-_protovalidate_mock.Validator = MagicMock
-sys.modules["protovalidate"] = _protovalidate_mock
-
-sys.path.insert(0, os.path.join(os.path.dirname(__file__), '../../vault'))
-
-from request_validator import RuntimeValidationError
-from validation_interceptor import ValidationInterceptor
-
-# Get the actual ValidationError the interceptor will catch
-_ProtoValidationError = sys.modules["protovalidate"].ValidationError
-
-
-# ---------------------------------------------------------------------------
-# Helpers
-# ---------------------------------------------------------------------------
-
-def _make_handler_call_details(method: str):
-    details = MagicMock()
-    details.method = method
-    return details
-
-
-def _make_next_handler(return_value="ok"):
-    handler = MagicMock()
-    handler.unary_unary = MagicMock(return_value=return_value)
-    handler.request_deserializer = None
-    handler.response_serializer = None
-    return handler
-
-
-def _make_context():
-    ctx = MagicMock()
-    ctx.abort = MagicMock(side_effect=Exception("aborted"))
-    return ctx
-
-
-# ---------------------------------------------------------------------------
-# Tests
-# ---------------------------------------------------------------------------
-
-class TestValidationInterceptor:
-    def setup_method(self):
-        self.interceptor = ValidationInterceptor()
-
-    def test_non_vault_method_passes_through(self):
-        """Health check and other non-vault methods bypass validation."""
-        details = _make_handler_call_details("/grpc.health.v1.Health/Check")
-        next_handler = _make_next_handler()
-        continuation = MagicMock(return_value=next_handler)
-
-        result = self.interceptor.intercept_service(continuation, details)
-        assert result is next_handler
-
-    def test_none_handler_returns_none(self):
-        details = _make_handler_call_details("/rune.vault.v1.VaultService/GetPublicKey")
-        continuation = MagicMock(return_value=None)
-
-        result = self.interceptor.intercept_service(continuation, details)
-        assert result is None
-
-    def test_valid_request_reaches_handler(self):
-        """A valid request passes both validation layers."""
-        details = _make_handler_call_details("/rune.vault.v1.VaultService/GetPublicKey")
-        next_handler = _make_next_handler(return_value="response")
-        continuation = MagicMock(return_value=next_handler)
-
-        wrapped = self.interceptor.intercept_service(continuation, details)
-
-        request = MagicMock()
-        request.token = "valid-token-123"
-        context = _make_context()
-
-        with patch("validation_interceptor.validate_proto"):
-            result = wrapped.unary_unary(request, context)
-
-        assert result == "response"
-        context.abort.assert_not_called()
-
-    def test_proto_validation_error_aborts(self):
-        """protovalidate.ValidationError triggers INVALID_ARGUMENT abort."""
-        details = _make_handler_call_details("/rune.vault.v1.VaultService/DecryptScores")
-        next_handler = _make_next_handler()
-        continuation = MagicMock(return_value=next_handler)
-
-        wrapped = self.interceptor.intercept_service(continuation, details)
-
-        request = MagicMock()
-        request.token = "valid-token"
-        context = _make_context()
-
-        violation = MagicMock()
-        violation.proto.field = "top_k"
-        violation.proto.message = "value must be >= 1"
-        exc = _ProtoValidationError(violations=[violation])
-
-        with patch("validation_interceptor.validate_proto", side_effect=exc):
-            with pytest.raises(Exception, match="aborted"):
-                wrapped.unary_unary(request, context)
-
-        context.abort.assert_called_once()
-        status_code = context.abort.call_args[0][0]
-        assert "INVALID_ARGUMENT" in str(status_code)
-        assert "top_k" in context.abort.call_args[0][1]
-
-    def test_runtime_validation_error_aborts(self):
-        """RuntimeValidationError (control chars) triggers INVALID_ARGUMENT abort."""
-        details = _make_handler_call_details("/rune.vault.v1.VaultService/GetPublicKey")
-        next_handler = _make_next_handler()
-        continuation = MagicMock(return_value=next_handler)
-
-        wrapped = self.interceptor.intercept_service(continuation, details)
-
-        request = MagicMock()
-        request.token = "tok\x00en"
-        context = _make_context()
-
-        with patch("validation_interceptor.validate_proto"):
-            with pytest.raises(Exception, match="aborted"):
-                wrapped.unary_unary(request, context)
-
-        context.abort.assert_called_once()
-        status_code = context.abort.call_args[0][0]
-        assert "INVALID_ARGUMENT" in str(status_code)
-        assert "control characters" in context.abort.call_args[0][1]
-
-    def test_handler_without_unary_unary_passes_through(self):
-        details = _make_handler_call_details("/rune.vault.v1.VaultService/GetPublicKey")
-        next_handler = MagicMock()
-        next_handler.unary_unary = None
-        continuation = MagicMock(return_value=next_handler)
-
-        result = self.interceptor.intercept_service(continuation, details)
-        assert result is next_handler
-
-    def test_error_detail_is_human_readable(self):
-        """Validation errors include field path and message."""
-        details = _make_handler_call_details("/rune.vault.v1.VaultService/DecryptScores")
-        next_handler = _make_next_handler()
-        continuation = MagicMock(return_value=next_handler)
-
-        wrapped = self.interceptor.intercept_service(continuation, details)
-
-        request = MagicMock()
-        request.token = "valid-token"
-        context = _make_context()
-
-        violation = MagicMock()
-        violation.proto.field = "encrypted_blob_b64"
-        violation.proto.message = "value length must be at least 1"
-        exc = _ProtoValidationError(violations=[violation])
-
-        with patch("validation_interceptor.validate_proto", side_effect=exc):
-            with pytest.raises(Exception, match="aborted"):
-                wrapped.unary_unary(request, context)
-
-        detail_msg = context.abort.call_args[0][1]
-        assert "encrypted_blob_b64" in detail_msg
-        assert "at least 1" in detail_msg
diff --git a/vault/.env.example b/vault/.env.example
deleted file mode 100644
index 42ba518..0000000
--- a/vault/.env.example
+++ /dev/null
@@ -1,62 +0,0 @@
-# Rune-Vault Configuration
-# Copy this file to .env and fill in the values:
-#   cp .env.example .env
-#
-# .env is excluded from git — safe to put real credentials there.
-
-# ── Authentication ──────────────────────────────────────────────
-# Team secret for metadata DEK derivation (shared across all team members).
-# New installs: auto-generated by install.sh.
-# Migrating from VAULT_TOKENS: copy your existing shared token value here.
-#   e.g. VAULT_TEAM_SECRET=evt_abc123...  (the same value you had in VAULT_TOKENS)
-# Per-user tokens are managed separately via `runevault token issue/revoke/list`.
-VAULT_TEAM_SECRET=
-
-# ── TLS ─────────────────────────────────────────────────────────
-# TLS is required by default. The Docker entrypoint auto-generates
-# self-signed certificates if these are not set.
-#
-# For Let's Encrypt or domain certs, set the paths explicitly:
-#   VAULT_TLS_CERT=/path/to/fullchain.pem
-#   VAULT_TLS_KEY=/path/to/privkey.pem
-#
-# To disable TLS (NOT recommended for production):
-#   VAULT_TLS_DISABLE=true
-VAULT_TLS_CERT=
-VAULT_TLS_KEY=
-VAULT_TLS_DISABLE=
-
-# ── Audit Logging ──────────────────────────────────────────────
-# Structured audit log for all Vault gRPC operations.
-# One JSON line per request with: timestamp, user_id, method, top_k,
-# result_count, status, source_ip, latency_ms.
-#
-# Options:
-#   (empty)        Disabled
-#   file           /var/log/rune-vault/audit.log (daily rotation, 30-day retention)
-#   file:/path     Custom file path
-#   stdout         JSON lines to stdout (for CloudWatch, Stackdriver, etc.)
-#   file+stdout    Both file and stdout
-VAULT_AUDIT_LOG=file
-
-# ── ngrok Tunneling (optional) ──────────────────────────────────
-# Required only if you need to expose the gRPC endpoint over the internet.
-# Get your authtoken at: https://dashboard.ngrok.com/get-started/your-authtoken
-NGROK_AUTHTOKEN=
-
-# ── enVector Cloud ──────────────────────────────────────────────
-# Required for auto-creating the team search index (ensure_index).
-# Without these, FHE key generation (ensure_keys) still works locally,
-# but the team index will NOT be created on enVector Cloud.
-#
-# enVector cluster endpoint (e.g. runestone-XXXX.clusters.envector.io)
-ENVECTOR_ENDPOINT=
-# enVector API key (issued from envector.io dashboard)
-ENVECTOR_API_KEY=
-
-# ── Index Settings ──────────────────────────────────────────────
-# Name of the team index on enVector Cloud.
-# Must be alphanumeric, lowercase, no spaces, and less than 20 characters.
-VAULT_INDEX_NAME=runecontext
-# Embedding dimension (must match your embedding model)
-EMBEDDING_DIM=1024
diff --git a/vault/Dockerfile b/vault/Dockerfile
deleted file mode 100644
index f902b7a..0000000
--- a/vault/Dockerfile
+++ /dev/null
@@ -1,55 +0,0 @@
-# ── Stage 1: Generate proto stubs ────────────────────────────────────
-FROM python:3.12-slim AS proto-builder
-
-RUN apt-get update && apt-get install -y --no-install-recommends curl \
-    && rm -rf /var/lib/apt/lists/*
-
-# Install buf CLI
-RUN curl -sSL "https://github.com/bufbuild/buf/releases/latest/download/buf-Linux-$(uname -m)" \
-        -o /usr/local/bin/buf \
-    && chmod +x /usr/local/bin/buf
-
-RUN pip install --no-cache-dir "grpcio-tools>=1.60.2,<=1.71.2" "protobuf>=5.29.0,<6"
-
-WORKDIR /build
-COPY buf.yaml buf.lock ./
-COPY proto/vault_service.proto proto/__init__.py proto/
-COPY scripts/proto-gen.sh scripts/
-RUN bash scripts/proto-gen.sh
-
-# ── Stage 2: Runtime ─────────────────────────────────────────────────
-FROM python:3.12-slim
-
-RUN apt-get update && apt-get install -y --no-install-recommends \
-        gcc \
-        python3-dev \
-        openssl \
-        curl \
-        gosu \
-    && rm -rf /var/lib/apt/lists/*
-
-RUN useradd -m -u 1000 vault
-
-WORKDIR /app
-
-COPY requirements.txt .
-RUN pip install --no-cache-dir -r requirements.txt
-
-COPY vault_core.py vault_grpc_server.py token_store.py admin_server.py vault_admin_cli.py request_validator.py validation_interceptor.py audit.py ./
-COPY --from=proto-builder /build/proto/ proto/
-COPY --from=proto-builder /build/buf/ buf/
-COPY docker-entrypoint.sh .
-RUN chmod +x docker-entrypoint.sh vault_admin_cli.py
-
-RUN mkdir -p /app/vault_keys /app/certs /app/config /secure/backups /var/log/rune-vault \
-    && chown -R vault:vault /app /secure /var/log/rune-vault
-
-ENV PYTHONPATH=/app/proto:/app
-
-EXPOSE 50051
-
-HEALTHCHECK --interval=30s --timeout=10s --retries=3 \
-    CMD curl -sf http://localhost:8081/health || exit 1
-
-ENTRYPOINT ["./docker-entrypoint.sh"]
-CMD ["--host", "0.0.0.0", "--grpc-port", "50051"]
diff --git a/vault/admin_server.py b/vault/admin_server.py
deleted file mode 100644
index 9b08bde..0000000
--- a/vault/admin_server.py
+++ /dev/null
@@ -1,232 +0,0 @@
-"""
-Admin HTTP server for token and role management.
-
-Listens on 127.0.0.1:8081 (container-internal only, not exposed via Docker).
-No authentication required — access is protected by:
-  SSH → docker group → docker exec → container isolation.
-"""
-
-import json
-import logging
-import re
-import threading
-from http.server import BaseHTTPRequestHandler, HTTPServer
-
-logger = logging.getLogger("vault.admin")
-
-DEFAULT_ADMIN_HOST = "127.0.0.1"
-DEFAULT_ADMIN_PORT = 8081
-
-
-# =============================================================================
-# Route table: (method, pattern) → handler name
-# Patterns use {name} for path parameters, compiled to regex at import time.
-# =============================================================================
-
-_ROUTE_DEFS = [
-    ("GET", "/health", "_handle_health"),
-    ("GET", "/tokens", "_handle_list_tokens"),
-    ("GET", "/roles", "_handle_list_roles"),
-    ("POST", "/tokens", "_handle_issue_token"),
-    ("POST", "/tokens/{user}/rotate", "_handle_rotate_token"),
-    ("POST", "/tokens/_rotate_all", "_handle_rotate_all"),
-    ("POST", "/roles", "_handle_create_role"),
-    ("PUT", "/roles/{name}", "_handle_update_role"),
-    ("DELETE", "/tokens/{user}", "_handle_revoke_token"),
-    ("DELETE", "/roles/{name}", "_handle_delete_role"),
-]
-
-_ROUTES: list[tuple[str, re.Pattern, list[str], str]] = []
-for _method, _pattern, _handler in _ROUTE_DEFS:
-    _param_names = re.findall(r"\{(\w+)\}", _pattern)
-    _regex = re.compile("^" + re.sub(r"\{(\w+)\}", r"(?P<\1>[^/]+)", _pattern) + "$")
-    _ROUTES.append((_method, _regex, _param_names, _handler))
-
-
-class AdminHandler(BaseHTTPRequestHandler):
-    """Request handler for token and role admin API."""
-
-    # Set by start_admin_server() before requests are handled
-    token_store = None
-    health_servicer = None
-
-    def log_message(self, format, *args):
-        logger.info(format, *args)
-
-    def _read_json(self) -> dict:
-        length = int(self.headers.get("Content-Length", 0))
-        if length == 0:
-            return {}
-        body = self.rfile.read(length)
-        return json.loads(body)
-
-    def _send_json(self, data: dict, status: int = 200):
-        body = json.dumps(data).encode()
-        self.send_response(status)
-        self.send_header("Content-Type", "application/json")
-        self.send_header("Content-Length", str(len(body)))
-        self.end_headers()
-        self.wfile.write(body)
-
-    def _send_error(self, status: int, message: str):
-        self._send_json({"error": message}, status)
-
-    # ── Routing ──────────────────────────────────────────────────────────
-
-    def _dispatch(self, method: str):
-        path = self.path.rstrip("/") or "/"
-        for route_method, regex, _, handler_name in _ROUTES:
-            if route_method != method:
-                continue
-            m = regex.match(path)
-            if m:
-                handler = getattr(self, handler_name)
-                try:
-                    kwargs = m.groupdict()
-                    if method in ("POST", "PUT"):
-                        kwargs["body"] = self._read_json()
-                    handler(**kwargs)
-                except (ValueError, KeyError) as e:
-                    self._send_error(400, str(e))
-                except Exception as e:
-                    self._send_error(500, str(e))
-                return
-        self._send_error(404, f"No route for {method} {self.path}")
-
-    def do_GET(self):
-        self._dispatch("GET")
-
-    def do_POST(self):
-        self._dispatch("POST")
-
-    def do_PUT(self):
-        self._dispatch("PUT")
-
-    def do_DELETE(self):
-        self._dispatch("DELETE")
-
-    # ── Health ────────────────────────────────────────────────────────────
-
-    def _handle_health(self):
-        from grpc_health.v1 import health_pb2
-
-        if self.health_servicer is not None:
-            resp = self.health_servicer.Check(health_pb2.HealthCheckRequest(service=""), None)
-            if resp.status != health_pb2.HealthCheckResponse.SERVING:
-                self._send_json({"status": "unhealthy"}, 503)
-                return
-        self._send_json({"status": "ok"})
-
-    # ── Token handlers ───────────────────────────────────────────────────
-
-    def _handle_list_tokens(self):
-        self._send_json({"tokens": self.token_store.list_tokens()})
-
-    def _handle_issue_token(self, body: dict):
-        user = body.get("user")
-        role = body.get("role")
-        if not user or not role:
-            self._send_error(400, "Missing required fields: user, role")
-            return
-        expires_days = body.get("expires_days")
-        tok = self.token_store.add_token(user, role, expires_days)
-        self._send_json(
-            {
-                "user": tok.user,
-                "token": tok.token,
-                "role": tok.role,
-                "issued_at": tok.issued_at,
-                "expires": tok.expires or "never",
-            },
-            201,
-        )
-
-    def _handle_revoke_token(self, user: str):
-        revoked = self.token_store.revoke_token(user)
-        if revoked:
-            self._send_json({"message": f"Revoked token for '{user}'"})
-        else:
-            self._send_error(404, f"No token found for user '{user}'")
-
-    def _handle_rotate_token(self, user: str, body: dict):
-        tok = self.token_store.rotate_token(user)
-        self._send_json(
-            {
-                "user": tok.user,
-                "token": tok.token,
-                "role": tok.role,
-                "issued_at": tok.issued_at,
-                "expires": tok.expires or "never",
-            }
-        )
-
-    def _handle_rotate_all(self, body: dict):
-        tokens = self.token_store.rotate_all_tokens()
-        self._send_json(
-            {
-                "rotated": len(tokens),
-                "tokens": [{"user": t.user, "token": t.token, "role": t.role} for t in tokens],
-            }
-        )
-
-    # ── Role handlers ────────────────────────────────────────────────────
-
-    def _handle_list_roles(self):
-        self._send_json({"roles": self.token_store.list_roles()})
-
-    def _handle_create_role(self, body: dict):
-        name = body.get("name")
-        scope = body.get("scope")
-        top_k = body.get("top_k")
-        rate_limit = body.get("rate_limit")
-        if not all([name, scope, top_k is not None, rate_limit]):
-            self._send_error(400, "Missing required fields: name, scope, top_k, rate_limit")
-            return
-        role = self.token_store.add_role(name, scope, top_k, rate_limit)
-        self._send_json(
-            {
-                "name": role.name,
-                "scope": role.scope,
-                "top_k": role.top_k,
-                "rate_limit": role.rate_limit,
-            },
-            201,
-        )
-
-    def _handle_update_role(self, name: str, body: dict):
-        kwargs = {}
-        if "scope" in body:
-            kwargs["scope"] = body["scope"]
-        if "top_k" in body:
-            kwargs["top_k"] = body["top_k"]
-        if "rate_limit" in body:
-            kwargs["rate_limit"] = body["rate_limit"]
-        if not kwargs:
-            self._send_error(400, "No fields to update")
-            return
-        role = self.token_store.update_role(name, **kwargs)
-        self._send_json(
-            {
-                "name": role.name,
-                "scope": role.scope,
-                "top_k": role.top_k,
-                "rate_limit": role.rate_limit,
-            }
-        )
-
-    def _handle_delete_role(self, name: str):
-        self.token_store.delete_role(name)
-        self._send_json({"message": f"Deleted role '{name}'"})
-
-
-def start_admin_server(
-    store, host: str = DEFAULT_ADMIN_HOST, port: int = DEFAULT_ADMIN_PORT, health_servicer=None
-):
-    """Start the admin HTTP server in a daemon thread."""
-    AdminHandler.token_store = store
-    AdminHandler.health_servicer = health_servicer
-    server = HTTPServer((host, port), AdminHandler)
-    thread = threading.Thread(target=server.serve_forever, daemon=True, name="admin-server")
-    thread.start()
-    logger.info("Admin server started on %s:%d", host, port)
-    return server
diff --git a/vault/audit.py b/vault/audit.py
deleted file mode 100644
index cdb639a..0000000
--- a/vault/audit.py
+++ /dev/null
@@ -1,153 +0,0 @@
-"""
-Structured audit logging for Rune-Vault operations.
-
-Emits one JSON line per gRPC request to a dedicated audit log,
-separate from the application log. Supports file-based daily rotation
-and stdout JSON mode for container environments.
-
-Configuration via VAULT_AUDIT_LOG env var:
-  (empty)        disabled
-  file           /var/log/rune-vault/audit.log, daily rotation, 30-day retention
-  file:/path     custom file path
-  stdout         JSON lines to stdout
-  file+stdout    both
-"""
-
-import json
-import logging
-import os
-import sys
-from logging.handlers import TimedRotatingFileHandler
-from typing import Any
-
-_DEFAULT_AUDIT_PATH = "/var/log/rune-vault/audit.log"
-
-# ---------------------------------------------------------------------------
-# Configuration parsing
-# ---------------------------------------------------------------------------
-
-
-def _parse_audit_config(env_value: str) -> dict:
-    """Parse VAULT_AUDIT_LOG into {"file": path | None, "stdout": bool}."""
-    if not env_value:
-        return {"file": None, "stdout": False}
-
-    parts = [p.strip() for p in env_value.split("+")]
-    config: dict[str, Any] = {"file": None, "stdout": False}
-
-    for part in parts:
-        lowered = part.lower()
-        if lowered == "stdout":
-            config["stdout"] = True
-        elif lowered == "file":
-            config["file"] = _DEFAULT_AUDIT_PATH
-        elif lowered.startswith("file:"):
-            config["file"] = part.split(":", 1)[1].strip()
-
-    return config
-
-
-# ---------------------------------------------------------------------------
-# Source IP extraction
-# ---------------------------------------------------------------------------
-
-
-def extract_source_ip(context) -> str:
-    """Extract client IP from gRPC context.peer().
-
-    peer() returns strings like:
-      'ipv4:10.0.0.1:12345'
-      'ipv6:[::1]:12345'
-      'unix:/path/to/socket'
-    """
-    try:
-        peer = context.peer()
-        if peer is None:
-            return "unknown"
-        if peer.startswith("ipv4:"):
-            # ipv4:10.0.0.1:12345 -> 10.0.0.1
-            return peer[5:].rsplit(":", 1)[0]
-        if peer.startswith("ipv6:"):
-            addr = peer[5:]
-            if addr.startswith("["):
-                # [::1]:12345 -> [::1]
-                return addr.split("]", 1)[0] + "]"
-            return addr.rsplit(":", 1)[0]
-        return peer
-    except Exception:
-        return "unknown"
-
-
-# ---------------------------------------------------------------------------
-# AuditLogger
-# ---------------------------------------------------------------------------
-
-
-class AuditLogger:
-    """JSON-structured audit logger with file rotation and stdout support."""
-
-    def __init__(self, config: dict):
-        self._logger = logging.getLogger("rune.vault.audit")
-        self._logger.setLevel(logging.INFO)
-        self._logger.propagate = False
-
-        # Close and remove any pre-existing handlers (e.g. during tests)
-        for h in self._logger.handlers[:]:
-            h.close()
-            self._logger.removeHandler(h)
-
-        if config.get("file"):
-            handler = TimedRotatingFileHandler(
-                config["file"],
-                when="midnight",
-                backupCount=30,
-                utc=True,
-            )
-            handler.setFormatter(logging.Formatter("%(message)s"))
-            self._logger.addHandler(handler)
-
-        if config.get("stdout"):
-            handler = logging.StreamHandler(sys.stdout)
-            handler.setFormatter(logging.Formatter("%(message)s"))
-            self._logger.addHandler(handler)
-
-    @property
-    def enabled(self) -> bool:
-        return len(self._logger.handlers) > 0
-
-    def log(
-        self,
-        *,
-        timestamp: str,
-        user_id: str,
-        method: str,
-        top_k: int | None,
-        result_count: int,
-        status: str,
-        source_ip: str,
-        latency_ms: float,
-        error: str | None = None,
-    ) -> dict:
-        """Emit a single structured audit entry. Returns the entry dict."""
-        entry: dict[str, Any] = {
-            "timestamp": timestamp,
-            "user_id": user_id,
-            "method": method,
-            "top_k": top_k,
-            "result_count": result_count,
-            "status": status,
-            "source_ip": source_ip,
-            "latency_ms": round(latency_ms, 2),
-        }
-        if error is not None:
-            entry["error"] = error
-        self._logger.info(json.dumps(entry, separators=(",", ":")))
-        return entry
-
-
-# ---------------------------------------------------------------------------
-# Module-level singleton
-# ---------------------------------------------------------------------------
-
-_config = _parse_audit_config(os.environ.get("VAULT_AUDIT_LOG", ""))
-audit_logger = AuditLogger(_config)
diff --git a/vault/buf.gen.yaml b/vault/buf.gen.yaml
new file mode 100644
index 0000000..0497bba
--- /dev/null
+++ b/vault/buf.gen.yaml
@@ -0,0 +1,13 @@
+version: v2
+clean: true
+plugins:
+  - remote: buf.build/protocolbuffers/go
+    out: pkg/vaultpb
+    opt:
+      - module=github.com/CryptoLabInc/rune-admin/vault/pkg/vaultpb
+      - Mvault_service.proto=github.com/CryptoLabInc/rune-admin/vault/pkg/vaultpb;vaultpb
+  - remote: buf.build/grpc/go
+    out: pkg/vaultpb
+    opt:
+      - module=github.com/CryptoLabInc/rune-admin/vault/pkg/vaultpb
+      - Mvault_service.proto=github.com/CryptoLabInc/rune-admin/vault/pkg/vaultpb;vaultpb
diff --git a/vault/docker-compose.yml b/vault/docker-compose.yml
deleted file mode 100644
index 1b5d598..0000000
--- a/vault/docker-compose.yml
+++ /dev/null
@@ -1,62 +0,0 @@
-services:
-  vault:
-    build:
-      context: .
-      dockerfile: Dockerfile
-    image: ghcr.io/cryptolabinc/rune-vault:${RUNE_VAULT_TAG:-latest}
-    container_name: rune-vault
-
-    volumes:
-      - vault-keys:/app/vault_keys:rw
-      - ./certs:/app/certs:rw
-      - ./backups:/secure/backups:rw
-      - ./logs:/var/log/rune-vault:rw
-      - ./vault-roles.yml:/app/config/vault-roles.yml:rw
-      - ./vault-tokens.yml:/app/config/vault-tokens.yml:rw
-
-    environment:
-      - VAULT_TEAM_SECRET=${VAULT_TEAM_SECRET:-}
-      # Migrating from VAULT_TOKENS? Copy the value to VAULT_TEAM_SECRET in .env.
-      # See .env.example for details.
-      - VAULT_TLS_CERT=${VAULT_TLS_CERT:-}
-      - VAULT_TLS_KEY=${VAULT_TLS_KEY:-}
-      - VAULT_TLS_DISABLE=${VAULT_TLS_DISABLE:-}
-      - VAULT_INDEX_NAME=${VAULT_INDEX_NAME:-runecontext}
-      - ENVECTOR_ENDPOINT=${ENVECTOR_ENDPOINT:-}
-      - ENVECTOR_API_KEY=${ENVECTOR_API_KEY:-}
-      - EMBEDDING_DIM=${EMBEDDING_DIM:-1024}
-      - VAULT_AUDIT_LOG=${VAULT_AUDIT_LOG:-file}
-
-    networks:
-      - vault-net
-
-    ports:
-      - "0.0.0.0:50051:50051"
-
-    security_opt:
-      - no-new-privileges:true
-
-    restart: unless-stopped
-
-    healthcheck:
-      test: ["CMD", "curl", "-sf", "http://localhost:8081/health"]
-      interval: 30s
-      timeout: 10s
-      retries: 3
-
-    deploy:
-      resources:
-        limits:
-          memory: 1G
-          cpus: "1.0"
-        reservations:
-          memory: 512M
-          cpus: "0.5"
-
-
-networks:
-  vault-net:
-    driver: bridge
-
-volumes:
-  vault-keys:
diff --git a/vault/docker-entrypoint.sh b/vault/docker-entrypoint.sh
deleted file mode 100755
index ae1dd25..0000000
--- a/vault/docker-entrypoint.sh
+++ /dev/null
@@ -1,80 +0,0 @@
-#!/bin/sh
-#
-# Docker entrypoint for Rune-Vault.
-# Auto-generates self-signed certificates if none are provided.
-
-set -e
-
-CERT_DIR="/app/certs"
-
-# Skip auto-generation if TLS is disabled
-if [ "${VAULT_TLS_DISABLE:-}" = "true" ]; then
-    echo "[entrypoint] TLS disabled — skipping certificate generation."
-    chown -R vault:vault /app/vault_keys /app/config /secure /var/log/rune-vault 2>/dev/null || true
-    exec gosu vault python3 vault_grpc_server.py "$@"
-fi
-
-# Auto-generate self-signed cert if no cert exists and env vars not set
-if [ -z "${VAULT_TLS_CERT:-}" ] && [ ! -f "$CERT_DIR/server.pem" ]; then
-    echo "[entrypoint] No TLS certificate found — generating self-signed cert..."
-    mkdir -p "$CERT_DIR"
-
-    # Generate CA
-    openssl genrsa -out "$CERT_DIR/ca.key" 4096 2>/dev/null
-    openssl req -new -x509 \
-        -key "$CERT_DIR/ca.key" \
-        -out "$CERT_DIR/ca.pem" \
-        -days 3650 \
-        -subj "/CN=Rune-Vault CA" \
-        -sha256
-
-    # Generate server cert with SANs
-    openssl genrsa -out "$CERT_DIR/server.key" 2048 2>/dev/null
-
-    TMPCONF=$(mktemp)
-    cat > "$TMPCONF" <<EOF
-[req]
-distinguished_name = req_dn
-req_extensions = v3_req
-prompt = no
-
-[req_dn]
-CN = rune-vault
-
-[v3_req]
-subjectAltName = DNS:localhost,DNS:vault,DNS:rune-vault,IP:127.0.0.1
-EOF
-
-    openssl req -new \
-        -key "$CERT_DIR/server.key" \
-        -out "$CERT_DIR/server.csr" \
-        -config "$TMPCONF"
-
-    openssl x509 -req \
-        -in "$CERT_DIR/server.csr" \
-        -CA "$CERT_DIR/ca.pem" \
-        -CAkey "$CERT_DIR/ca.key" \
-        -CAcreateserial \
-        -out "$CERT_DIR/server.pem" \
-        -days 825 \
-        -sha256 \
-        -extfile "$TMPCONF" \
-        -extensions v3_req \
-        2>/dev/null
-
-    rm -f "$TMPCONF" "$CERT_DIR/server.csr" "$CERT_DIR/ca.srl"
-    chmod 600 "$CERT_DIR/ca.key" "$CERT_DIR/server.key"
-
-    echo "[entrypoint] Self-signed certificates generated in $CERT_DIR/"
-    echo "[entrypoint] Distribute ca.pem to clients for verification."
-fi
-
-# Default to auto-generated certs if env vars not set
-export VAULT_TLS_CERT="${VAULT_TLS_CERT:-$CERT_DIR/server.pem}"
-export VAULT_TLS_KEY="${VAULT_TLS_KEY:-$CERT_DIR/server.key}"
-
-# Fix ownership on mounted volumes so the vault user can read them
-chown -R vault:vault /app/certs /app/vault_keys /app/config /secure /var/log/rune-vault 2>/dev/null || true
-
-# Drop privileges and run as vault user
-exec gosu vault python3 vault_grpc_server.py "$@"
diff --git a/vault/go.mod b/vault/go.mod
new file mode 100644
index 0000000..879b4d4
--- /dev/null
+++ b/vault/go.mod
@@ -0,0 +1,29 @@
+module github.com/CryptoLabInc/rune-admin/vault
+
+go 1.25.9
+
+require (
+	buf.build/gen/go/bufbuild/protovalidate/protocolbuffers/go v1.36.11-20260415201107-50325440f8f2.1
+	github.com/CryptoLabInc/envector-go-sdk v0.1.0
+	github.com/spf13/cobra v1.8.1
+	golang.org/x/crypto v0.47.0
+	google.golang.org/grpc v1.80.0
+	google.golang.org/protobuf v1.36.11
+	gopkg.in/natefinch/lumberjack.v2 v2.2.1
+	gopkg.in/yaml.v3 v3.0.1
+)
+
+require (
+	buf.build/go/protovalidate v1.2.0 // indirect
+	cel.dev/expr v0.25.1 // indirect
+	github.com/antlr4-go/antlr/v4 v4.13.1 // indirect
+	github.com/google/cel-go v0.28.0 // indirect
+	github.com/inconshreveable/mousetrap v1.1.0 // indirect
+	github.com/spf13/pflag v1.0.5 // indirect
+	golang.org/x/exp v0.0.0-20250813145105-42675adae3e6 // indirect
+	golang.org/x/net v0.49.0 // indirect
+	golang.org/x/sys v0.40.0 // indirect
+	golang.org/x/text v0.33.0 // indirect
+	google.golang.org/genproto/googleapis/api v0.0.0-20260120221211-b8f7ae30c516 // indirect
+	google.golang.org/genproto/googleapis/rpc v0.0.0-20260120221211-b8f7ae30c516 // indirect
+)
diff --git a/vault/go.sum b/vault/go.sum
new file mode 100644
index 0000000..d7411b4
--- /dev/null
+++ b/vault/go.sum
@@ -0,0 +1,71 @@
+buf.build/gen/go/bufbuild/protovalidate/protocolbuffers/go v1.36.11-20260415201107-50325440f8f2.1 h1:s6hzCXtND/ICdGPTMGk7C+/BFlr2Jg5GyH0NKf4XGXg=
+buf.build/gen/go/bufbuild/protovalidate/protocolbuffers/go v1.36.11-20260415201107-50325440f8f2.1/go.mod h1:tvtbpgaVXZX4g6Pn+AnzFycuRK3MOz5HJfEGeEllXYM=
+buf.build/go/protovalidate v1.2.0 h1:DQVrUWkmGTBij+kOYv/x2LLxwcLaGKMdzShj1/6/3H0=
+buf.build/go/protovalidate v1.2.0/go.mod h1:7rYiQEhqvAipoazpVNBBH2S2f8bjG4huMVy1V2Yofn4=
+cel.dev/expr v0.25.1 h1:1KrZg61W6TWSxuNZ37Xy49ps13NUovb66QLprthtwi4=
+cel.dev/expr v0.25.1/go.mod h1:hrXvqGP6G6gyx8UAHSHJ5RGk//1Oj5nXQ2NI02Nrsg4=
+github.com/CryptoLabInc/envector-go-sdk v0.1.0 h1:EaPiFtvLh33mrS1Nfjb/sF5tmDlOIHpjj3TJ6QIIFgM=
+github.com/CryptoLabInc/envector-go-sdk v0.1.0/go.mod h1:jXVwGkqUOmQUnJiEshq7sG2x0nveFCNlAU5J7xc7CDw=
+github.com/antlr4-go/antlr/v4 v4.13.1 h1:SqQKkuVZ+zWkMMNkjy5FZe5mr5WURWnlpmOuzYWrPrQ=
+github.com/antlr4-go/antlr/v4 v4.13.1/go.mod h1:GKmUxMtwp6ZgGwZSva4eWPC5mS6vUAmOABFgjdkM7Nw=
+github.com/cespare/xxhash/v2 v2.3.0 h1:UL815xU9SqsFlibzuggzjXhog7bL6oX9BbNZnL2UFvs=
+github.com/cespare/xxhash/v2 v2.3.0/go.mod h1:VGX0DQ3Q6kWi7AoAeZDth3/j3BFtOZR5XLFGgcrjCOs=
+github.com/cpuguy83/go-md2man/v2 v2.0.4/go.mod h1:tgQtvFlXSQOSOSIRvRPT7W67SCa46tRHOmNcaadrF8o=
+github.com/go-logr/logr v1.4.3 h1:CjnDlHq8ikf6E492q6eKboGOC0T8CDaOvkHCIg8idEI=
+github.com/go-logr/logr v1.4.3/go.mod h1:9T104GzyrTigFIr8wt5mBrctHMim0Nb2HLGrmQ40KvY=
+github.com/go-logr/stdr v1.2.2 h1:hSWxHoqTgW2S2qGc0LTAI563KZ5YKYRhT3MFKZMbjag=
+github.com/go-logr/stdr v1.2.2/go.mod h1:mMo/vtBO5dYbehREoey6XUKy/eSumjCCveDpRre4VKE=
+github.com/golang/protobuf v1.5.4 h1:i7eJL8qZTpSEXOPTxNKhASYpMn+8e5Q6AdndVa1dWek=
+github.com/golang/protobuf v1.5.4/go.mod h1:lnTiLA8Wa4RWRcIUkrtSVa5nRhsEGBg48fD6rSs7xps=
+github.com/google/cel-go v0.28.0 h1:KjSWstCpz/MN5t4a8gnGJNIYUsJRpdi/r97xWDphIQc=
+github.com/google/cel-go v0.28.0/go.mod h1:X0bD6iVNR8pkROSOoHVdgTkzmRcosof7WQqCD6wcMc8=
+github.com/google/go-cmp v0.7.0 h1:wk8382ETsv4JYUZwIsn6YpYiWiBsYLSJiTsyBybVuN8=
+github.com/google/go-cmp v0.7.0/go.mod h1:pXiqmnSA92OHEEa9HXL2W4E7lf9JzCmGVUdgjX3N/iU=
+github.com/google/uuid v1.6.0 h1:NIvaJDMOsjHA8n1jAhLSgzrAzy1Hgr+hNrb57e+94F0=
+github.com/google/uuid v1.6.0/go.mod h1:TIyPZe4MgqvfeYDBFedMoGGpEw/LqOeaOT+nhxU+yHo=
+github.com/inconshreveable/mousetrap v1.1.0 h1:wN+x4NVGpMsO7ErUn/mUI3vEoE6Jt13X2s0bqwp9tc8=
+github.com/inconshreveable/mousetrap v1.1.0/go.mod h1:vpF70FUmC8bwa3OWnCshd2FqLfsEA9PFc4w1p2J65bw=
+github.com/russross/blackfriday/v2 v2.1.0/go.mod h1:+Rmxgy9KzJVeS9/2gXHxylqXiyQDYRxCVz55jmeOWTM=
+github.com/spf13/cobra v1.8.1 h1:e5/vxKd/rZsfSJMUX1agtjeTDf+qv1/JdBF8gg5k9ZM=
+github.com/spf13/cobra v1.8.1/go.mod h1:wHxEcudfqmLYa8iTfL+OuZPbBZkmvliBWKIezN3kD9Y=
+github.com/spf13/pflag v1.0.5 h1:iy+VFUOCP1a+8yFto/drg2CJ5u0yRoB7fZw3DKv/JXA=
+github.com/spf13/pflag v1.0.5/go.mod h1:McXfInJRrz4CZXVZOBLb0bTZqETkiAhM9Iw0y3An2Bg=
+go.opentelemetry.io/auto/sdk v1.2.1 h1:jXsnJ4Lmnqd11kwkBV2LgLoFMZKizbCi5fNZ/ipaZ64=
+go.opentelemetry.io/auto/sdk v1.2.1/go.mod h1:KRTj+aOaElaLi+wW1kO/DZRXwkF4C5xPbEe3ZiIhN7Y=
+go.opentelemetry.io/otel v1.39.0 h1:8yPrr/S0ND9QEfTfdP9V+SiwT4E0G7Y5MO7p85nis48=
+go.opentelemetry.io/otel v1.39.0/go.mod h1:kLlFTywNWrFyEdH0oj2xK0bFYZtHRYUdv1NklR/tgc8=
+go.opentelemetry.io/otel/metric v1.39.0 h1:d1UzonvEZriVfpNKEVmHXbdf909uGTOQjA0HF0Ls5Q0=
+go.opentelemetry.io/otel/metric v1.39.0/go.mod h1:jrZSWL33sD7bBxg1xjrqyDjnuzTUB0x1nBERXd7Ftcs=
+go.opentelemetry.io/otel/sdk v1.39.0 h1:nMLYcjVsvdui1B/4FRkwjzoRVsMK8uL/cj0OyhKzt18=
+go.opentelemetry.io/otel/sdk v1.39.0/go.mod h1:vDojkC4/jsTJsE+kh+LXYQlbL8CgrEcwmt1ENZszdJE=
+go.opentelemetry.io/otel/sdk/metric v1.39.0 h1:cXMVVFVgsIf2YL6QkRF4Urbr/aMInf+2WKg+sEJTtB8=
+go.opentelemetry.io/otel/sdk/metric v1.39.0/go.mod h1:xq9HEVH7qeX69/JnwEfp6fVq5wosJsY1mt4lLfYdVew=
+go.opentelemetry.io/otel/trace v1.39.0 h1:2d2vfpEDmCJ5zVYz7ijaJdOF59xLomrvj7bjt6/qCJI=
+go.opentelemetry.io/otel/trace v1.39.0/go.mod h1:88w4/PnZSazkGzz/w84VHpQafiU4EtqqlVdxWy+rNOA=
+golang.org/x/crypto v0.47.0 h1:V6e3FRj+n4dbpw86FJ8Fv7XVOql7TEwpHapKoMJ/GO8=
+golang.org/x/crypto v0.47.0/go.mod h1:ff3Y9VzzKbwSSEzWqJsJVBnWmRwRSHt/6Op5n9bQc4A=
+golang.org/x/exp v0.0.0-20250813145105-42675adae3e6 h1:SbTAbRFnd5kjQXbczszQ0hdk3ctwYf3qBNH9jIsGclE=
+golang.org/x/exp v0.0.0-20250813145105-42675adae3e6/go.mod h1:4QTo5u+SEIbbKW1RacMZq1YEfOBqeXa19JeshGi+zc4=
+golang.org/x/net v0.49.0 h1:eeHFmOGUTtaaPSGNmjBKpbng9MulQsJURQUAfUwY++o=
+golang.org/x/net v0.49.0/go.mod h1:/ysNB2EvaqvesRkuLAyjI1ycPZlQHM3q01F02UY/MV8=
+golang.org/x/sys v0.40.0 h1:DBZZqJ2Rkml6QMQsZywtnjnnGvHza6BTfYFWY9kjEWQ=
+golang.org/x/sys v0.40.0/go.mod h1:OgkHotnGiDImocRcuBABYBEXf8A9a87e/uXjp9XT3ks=
+golang.org/x/text v0.33.0 h1:B3njUFyqtHDUI5jMn1YIr5B0IE2U0qck04r6d4KPAxE=
+golang.org/x/text v0.33.0/go.mod h1:LuMebE6+rBincTi9+xWTY8TztLzKHc/9C1uBCG27+q8=
+gonum.org/v1/gonum v0.17.0 h1:VbpOemQlsSMrYmn7T2OUvQ4dqxQXU+ouZFQsZOx50z4=
+gonum.org/v1/gonum v0.17.0/go.mod h1:El3tOrEuMpv2UdMrbNlKEh9vd86bmQ6vqIcDwxEOc1E=
+google.golang.org/genproto/googleapis/api v0.0.0-20260120221211-b8f7ae30c516 h1:vmC/ws+pLzWjj/gzApyoZuSVrDtF1aod4u/+bbj8hgM=
+google.golang.org/genproto/googleapis/api v0.0.0-20260120221211-b8f7ae30c516/go.mod h1:p3MLuOwURrGBRoEyFHBT3GjUwaCQVKeNqqWxlcISGdw=
+google.golang.org/genproto/googleapis/rpc v0.0.0-20260120221211-b8f7ae30c516 h1:sNrWoksmOyF5bvJUcnmbeAmQi8baNhqg5IWaI3llQqU=
+google.golang.org/genproto/googleapis/rpc v0.0.0-20260120221211-b8f7ae30c516/go.mod h1:j9x/tPzZkyxcgEFkiKEEGxfvyumM01BEtsW8xzOahRQ=
+google.golang.org/grpc v1.80.0 h1:Xr6m2WmWZLETvUNvIUmeD5OAagMw3FiKmMlTdViWsHM=
+google.golang.org/grpc v1.80.0/go.mod h1:ho/dLnxwi3EDJA4Zghp7k2Ec1+c2jqup0bFkw07bwF4=
+google.golang.org/protobuf v1.36.11 h1:fV6ZwhNocDyBLK0dj+fg8ektcVegBBuEolpbTQyBNVE=
+google.golang.org/protobuf v1.36.11/go.mod h1:HTf+CrKn2C3g5S8VImy6tdcUvCska2kB7j23XfzDpco=
+gopkg.in/check.v1 v0.0.0-20161208181325-20d25e280405 h1:yhCVgyC4o1eVCa2tZl7eS0r+SDo693bJlVdllGtEeKM=
+gopkg.in/check.v1 v0.0.0-20161208181325-20d25e280405/go.mod h1:Co6ibVJAznAaIkqp8huTwlJQCZ016jof/cbN4VW5Yz0=
+gopkg.in/check.v1 v1.0.0-20190902080502-41f04d3bba15 h1:YR8cESwS4TdDjEe65xsg0ogRM/Nc3DYOhEAlW+xobZo=
+gopkg.in/natefinch/lumberjack.v2 v2.2.1 h1:bBRl1b0OH9s/DuPhuXpNl+VtCaJXFZ5/uEFST95x9zc=
+gopkg.in/natefinch/lumberjack.v2 v2.2.1/go.mod h1:YD8tP3GAjkrDg1eZH7EGmyESg/lsYskCTPBJVb9jqSc=
+gopkg.in/yaml.v3 v3.0.1 h1:fxVm/GzAzEWqLHuvctI91KS9hhNmmWOoWu0XTYJS7CA=
+gopkg.in/yaml.v3 v3.0.1/go.mod h1:K4uyk7z7BCEPqu6E+C64Yfv1cQ7kz7rIZviUmN+EgEM=
diff --git a/vault/internal/commands/adminclient.go b/vault/internal/commands/adminclient.go
new file mode 100644
index 0000000..eca2dfd
--- /dev/null
+++ b/vault/internal/commands/adminclient.go
@@ -0,0 +1,119 @@
+package commands
+
+import (
+	"bytes"
+	"context"
+	"encoding/json"
+	"errors"
+	"fmt"
+	"io"
+	"net"
+	"net/http"
+	"os"
+	"strings"
+	"time"
+
+	"github.com/CryptoLabInc/rune-admin/vault/internal/server"
+)
+
+// AdminClient talks to the Vault admin UDS server.
+type AdminClient struct {
+	socket string
+	hc     *http.Client
+}
+
+// NewAdminClient builds a client that dials the given UDS path.
+// Returns ErrSocketMissing if the socket file does not exist on disk —
+// gives the CLI a friendlier message than a connection-refused on the
+// first request.
+func NewAdminClient(socketPath string) (*AdminClient, error) {
+	if socketPath == "" {
+		return nil, errors.New("admin socket path is empty (set server.admin.socket or pass --admin-socket)")
+	}
+	if _, err := os.Stat(socketPath); err != nil {
+		if os.IsNotExist(err) {
+			return nil, fmt.Errorf("admin socket %s not found — is the daemon running?", socketPath)
+		}
+		return nil, err
+	}
+	hc := &http.Client{
+		Timeout: 30 * time.Second,
+		Transport: &http.Transport{
+			DialContext: func(ctx context.Context, _, _ string) (net.Conn, error) {
+				return (&net.Dialer{}).DialContext(ctx, "unix", socketPath)
+			},
+			DisableKeepAlives: true,
+		},
+	}
+	return &AdminClient{socket: socketPath, hc: hc}, nil
+}
+
+// adminError is what the server returns on 4xx/5xx.
+type adminError struct {
+	Status  int
+	Message string
+}
+
+func (e *adminError) Error() string { return e.Message }
+
+// Do sends a JSON request and decodes the response into dst (which may
+// be nil to discard). 4xx/5xx responses become *adminError.
+func (a *AdminClient) Do(method, path string, body, dst any) error {
+	var buf io.Reader
+	if body != nil {
+		b, err := json.Marshal(body)
+		if err != nil {
+			return err
+		}
+		buf = bytes.NewReader(b)
+	}
+	url := "http://admin" + path
+	req, err := http.NewRequest(method, url, buf)
+	if err != nil {
+		return err
+	}
+	if body != nil {
+		req.Header.Set("Content-Type", "application/json")
+	}
+	resp, err := a.hc.Do(req)
+	if err != nil {
+		return fmt.Errorf("admin: %w (socket: %s)", err, a.socket)
+	}
+	defer resp.Body.Close()
+	respBody, err := io.ReadAll(resp.Body)
+	if err != nil {
+		return err
+	}
+	if resp.StatusCode >= 400 {
+		var e struct {
+			Error string `json:"error"`
+		}
+		if jerr := json.Unmarshal(respBody, &e); jerr != nil || e.Error == "" {
+			return &adminError{Status: resp.StatusCode, Message: strings.TrimSpace(string(respBody))}
+		}
+		return &adminError{Status: resp.StatusCode, Message: e.Error}
+	}
+	if dst != nil && len(respBody) > 0 {
+		if err := json.Unmarshal(respBody, dst); err != nil {
+			return fmt.Errorf("admin: parse response: %w", err)
+		}
+	}
+	return nil
+}
+
+// resolveAdminClient returns an AdminClient using either the explicit
+// --admin-socket flag or the socket field from the resolved runevault.conf.
+func resolveAdminClient() (*AdminClient, error) {
+	socket := globals.adminSocket
+	if socket == "" {
+		cfg, err := server.LoadConfig(globals.configPath)
+		if err != nil {
+			return nil, err
+		}
+		socket = cfg.Server.Admin.Socket
+	}
+	if socket == "" {
+		return nil, errors.New("admin socket not configured (set server.admin.socket or pass --admin-socket)")
+	}
+	return NewAdminClient(socket)
+}
diff --git a/vault/internal/commands/adminclient_test.go b/vault/internal/commands/adminclient_test.go
new file mode 100644
index 0000000..461747b
--- /dev/null
+++ b/vault/internal/commands/adminclient_test.go
@@ -0,0 +1,120 @@
+package commands
+
+import (
+	"context"
+	"net"
+	"net/http"
+	"os"
+	"path/filepath"
+	"strings"
+	"testing"
+
+	"github.com/CryptoLabInc/rune-admin/vault/internal/server"
+	"github.com/CryptoLabInc/rune-admin/vault/internal/tokens"
+)
+
+// adminUDSFixture spins up a real UDS-backed admin server with a demo
+// store. Exposes the socket path so AdminClient can dial it.
+func adminUDSFixture(t *testing.T) (socket string, store *tokens.Store, shutdown func()) {
+	t.Helper()
+	// Darwin sun_path caps at ~104 bytes; t.TempDir() can overflow with
+	// long test names. Use a short MkdirTemp.
+	dir, err := os.MkdirTemp("", "vt-")
+	if err != nil {
+		t.Fatal(err)
+	}
+	t.Cleanup(func() { os.RemoveAll(dir) })
+	socket = filepath.Join(dir, "x.sock")
+
+	store = tokens.NewStore()
+	store.LoadDefaultsWithDemoToken()
+
+	cfg := &server.Config{
+		Server: server.ServerConfig{Admin: server.AdminConfig{Socket: socket}},
+		Tokens: server.TokensConfig{TeamSecret: "test-secret"},
+		Keys:   server.KeysConfig{Path: t.TempDir(), EmbeddingDim: 1024},
+	}
+	audit, _ := server.NewAuditLogger(server.AuditConfig{Mode: ""})
+	v := server.NewVault(cfg, store, nil, audit)
+
+	stop, err := server.AdminFromConfig(context.Background(), v)
+	if err != nil {
+		t.Fatal(err)
+	}
+	shutdown = func() { _ = stop(context.Background()) }
+	t.Cleanup(shutdown)
+	return socket, store, shutdown
+}
+
+func TestAdminClientHealth(t *testing.T) {
+	socket, _, _ := adminUDSFixture(t)
+	c, err := NewAdminClient(socket)
+	if err != nil {
+		t.Fatal(err)
+	}
+	var status struct {
+		Status string `json:"status"`
+	}
+	if err := c.Do("GET", "/health", nil, &status); err != nil {
+		t.Fatal(err)
+	}
+	if status.Status != "ok" {
+		t.Errorf("status = %q", status.Status)
+	}
+}
+
+func TestAdminClientIssueAndList(t *testing.T) {
+	socket, _, _ := adminUDSFixture(t)
+	c, _ := NewAdminClient(socket)
+
+	var issued tokenResult
+	if err := c.Do("POST", "/tokens", map[string]any{"user": "alice", "role": "member"}, &issued); err != nil {
+		t.Fatal(err)
+	}
+	if !strings.HasPrefix(issued.Token, "evt_") {
+		t.Errorf("token = %q", issued.Token)
+	}
+
+	var listResp struct {
+		Tokens []map[string]any `json:"tokens"`
+	}
+	if err := c.Do("GET", "/tokens", nil, &listResp); err != nil {
+		t.Fatal(err)
+	}
+	found := false
+	for _, t := range listResp.Tokens {
+		if t["user"] == "alice" {
+			found = true
+		}
+	}
+	if !found {
+		t.Errorf("alice not in list: %+v", listResp.Tokens)
+	}
+}
+
+func TestAdminClientErrorBubblesUp(t *testing.T) {
+	socket, _, _ := adminUDSFixture(t)
+	c, _ := NewAdminClient(socket)
+	err := c.Do("POST", "/tokens", map[string]any{}, nil)
+	if err == nil {
+		t.Fatal("expected error for missing fields")
+	}
+	if !strings.Contains(err.Error(), "Missing required") {
+		t.Errorf("err = %v", err)
+	}
+}
+
+func TestAdminClientMissingSocket(t *testing.T) {
+	_, err := NewAdminClient("/tmp/no-such-socket")
+	if err == nil {
+		t.Fatal("expected error for missing socket")
+	}
+	if !strings.Contains(err.Error(), "not found") {
+		t.Errorf("err = %v", err)
+	}
+}
+
+// silence unused import if running tests in isolation
+var _ = net.Listen
+var _ = http.StatusOK
+var _ = os.Stat
diff --git a/vault/internal/commands/duration.go b/vault/internal/commands/duration.go
new file mode 100644
index 0000000..200181e
--- /dev/null
+++ b/vault/internal/commands/duration.go
@@ -0,0 +1,27 @@
+package commands
+
+import (
+	"fmt"
+	"regexp"
+	"strconv"
+)
+
+var durationRE = regexp.MustCompile(`^(\d+)([dwm])$`)
+
+// parseDuration converts strings like "90d", "12w", "6m" into days.
+// Mirrors vault_admin_cli.py:_parse_duration (m = 30 days approximation).
+func parseDuration(value string) (int, error) {
+	m := durationRE.FindStringSubmatch(value)
+	if m == nil {
+		return 0, fmt.Errorf("Invalid duration '%s'. Use <number><d|w|m> (e.g. 90d, 12w, 6m)", value)
+	}
+	n, _ := strconv.Atoi(m[1])
+	switch m[2] {
+	case "d":
+		return n, nil
+	case "w":
+		return n * 7, nil
+	default:
+		return n * 30, nil
+	}
+}
diff --git a/vault/internal/commands/role.go b/vault/internal/commands/role.go
new file mode 100644
index 0000000..bb6df14
--- /dev/null
+++ b/vault/internal/commands/role.go
@@ -0,0 +1,172 @@
+package commands
+
+import (
+	"fmt"
+	"strings"
+
+	"github.com/spf13/cobra"
+)
+
+func newRoleCmd() *cobra.Command {
+	cmd := &cobra.Command{
+		Use:   "role",
+		Short: "Manage authorization roles",
+	}
+	cmd.AddCommand(
+		newRoleListCmd(),
+		newRoleCreateCmd(),
+		newRoleUpdateCmd(),
+		newRoleDeleteCmd(),
+	)
+	return cmd
+}
+
+type roleResult struct {
+	Name      string   `json:"name"`
+	Scope     []string `json:"scope"`
+	TopK      int      `json:"top_k"`
+	RateLimit string   `json:"rate_limit"`
+}
+
+func newRoleListCmd() *cobra.Command {
+	return &cobra.Command{
+		Use:   "list",
+		Short: "List all roles",
+		RunE: func(cmd *cobra.Command, _ []string) error {
+			ac, err := resolveAdminClient()
+			if err != nil {
+				return err
+			}
+			var result struct {
+				Roles []roleResult `json:"roles"`
+			}
+			if err := ac.Do("GET", "/roles", nil, &result); err != nil {
+				return err
+			}
+			out := cmd.OutOrStdout()
+			if len(result.Roles) == 0 {
+				fmt.Fprintln(out, "No roles defined.")
+				return nil
+			}
+			// "{:<12} {:<50} {:>6} {:>10}" — match vault_admin_cli.py
+			fmt.Fprintf(out, "%-12s %-50s %6s %10s\n", "ROLE", "SCOPE", "TOP_K", "RATE")
+			for _, r := range result.Roles {
+				fmt.Fprintf(out, "%-12s %-50s %6d %10s\n",
+					r.Name, formatScope(r.Scope), r.TopK, r.RateLimit)
+			}
+			return nil
+		},
+	}
+}
+
+func newRoleCreateCmd() *cobra.Command {
+	var name, scope, rateLimit string
+	var topK int
+	cmd := &cobra.Command{
+		Use:   "create",
+		Short: "Create a new role",
+		RunE: func(cmd *cobra.Command, _ []string) error {
+			scopeList := splitCSV(scope)
+			body := map[string]any{
+				"name":       name,
+				"scope":      scopeList,
+				"top_k":      topK,
+				"rate_limit": rateLimit,
+			}
+			ac, err := resolveAdminClient()
+			if err != nil {
+				return err
+			}
+			if err := ac.Do("POST", "/roles", body, nil); err != nil {
+				return err
+			}
+			fmt.Fprintf(cmd.OutOrStdout(), "Role '%s' created.\n", name)
+			return nil
+		},
+	}
+	cmd.Flags().StringVar(&name, "name", "", "Role name")
+	cmd.Flags().StringVar(&scope, "scope", "", "Comma-separated scope list")
+	cmd.Flags().IntVar(&topK, "top-k", 0, "Max top_k")
+	cmd.Flags().StringVar(&rateLimit, "rate-limit", "", "Rate limit (e.g. 30/60s)")
+	_ = cmd.MarkFlagRequired("name")
+	_ = cmd.MarkFlagRequired("scope")
+	_ = cmd.MarkFlagRequired("top-k")
+	_ = cmd.MarkFlagRequired("rate-limit")
+	return cmd
+}
+
+func newRoleUpdateCmd() *cobra.Command {
+	var name, scope, rateLimit string
+	var topK int
+	var topKSet bool
+	cmd := &cobra.Command{
+		Use:   "update",
+		Short: "Update an existing role",
+		RunE: func(cmd *cobra.Command, _ []string) error {
+			body := map[string]any{}
+			if scope != "" {
+				body["scope"] = splitCSV(scope)
+			}
+			if topKSet {
+				body["top_k"] = topK
+			}
+			if rateLimit != "" {
+				body["rate_limit"] = rateLimit
+			}
+			if len(body) == 0 {
+				return fmt.Errorf("No fields to update.")
+			}
+			ac, err := resolveAdminClient()
+			if err != nil {
+				return err
+			}
+			if err := ac.Do("PUT", "/roles/"+name, body, nil); err != nil {
+				return err
+			}
+			fmt.Fprintf(cmd.OutOrStdout(),
+				"Role '%s' updated. Changes take effect immediately for all tokens with this role.\n", name)
+			return nil
+		},
+	}
+	cmd.Flags().StringVar(&name, "name", "", "Role name")
+	cmd.Flags().StringVar(&scope, "scope", "", "Comma-separated scope list")
+	cmd.Flags().IntVar(&topK, "top-k", 0, "Max top_k")
+	cmd.Flags().StringVar(&rateLimit, "rate-limit", "", "Rate limit (e.g. 30/60s)")
+	_ = cmd.MarkFlagRequired("name")
+	cmd.PreRun = func(c *cobra.Command, _ []string) {
+		topKSet = c.Flags().Changed("top-k")
+	}
+	return cmd
+}
+
+func newRoleDeleteCmd() *cobra.Command {
+	var name string
+	cmd := &cobra.Command{
+		Use:   "delete",
+		Short: "Delete a role",
+		RunE: func(cmd *cobra.Command, _ []string) error {
+			ac, err := resolveAdminClient()
+			if err != nil {
+				return err
+			}
+			if err := ac.Do("DELETE", "/roles/"+name, nil, nil); err != nil {
+				return err
+			}
+			fmt.Fprintf(cmd.OutOrStdout(), "Role '%s' deleted.\n", name)
+			return nil
+		},
+	}
+	cmd.Flags().StringVar(&name, "name", "", "Role name")
+	_ = cmd.MarkFlagRequired("name")
+	return cmd
+}
+
+func splitCSV(s string) []string {
+	out := []string{}
+	for _, p := range strings.Split(s, ",") {
+		if t := strings.TrimSpace(p); t != "" {
+			out = append(out, t)
+		}
+	}
+	return out
+}
diff --git a/vault/internal/commands/token.go b/vault/internal/commands/token.go
new file mode 100644
index 0000000..2be54a1
--- /dev/null
+++ b/vault/internal/commands/token.go
@@ -0,0 +1,192 @@
+package commands
+
+import (
+	"fmt"
+	"strings"
+
+	"github.com/spf13/cobra"
+)
+
+func newTokenCmd() *cobra.Command {
+	cmd := &cobra.Command{
+		Use:   "token",
+		Short: "Manage authentication tokens",
+	}
+	cmd.AddCommand(
+		newTokenIssueCmd(),
+		newTokenRevokeCmd(),
+		newTokenRotateCmd(),
+		newTokenListCmd(),
+	)
+	return cmd
+}
+
+type tokenResult struct {
+	User     string `json:"user"`
+	Token    string `json:"token"`
+	Role     string `json:"role"`
+	IssuedAt string `json:"issued_at"`
+	Expires  string `json:"expires"`
+}
+
+func newTokenIssueCmd() *cobra.Command {
+	var user, role, expires string
+	cmd := &cobra.Command{
+		Use:   "issue",
+		Short: "Issue a new token",
+		RunE: func(cmd *cobra.Command, _ []string) error {
+			if user == "" || role == "" {
+				return fmt.Errorf("--user and --role are required")
+			}
+			body := map[string]any{"user": user, "role": role}
+			if expires != "" {
+				days, err := parseDuration(expires)
+				if err != nil {
+					return err
+				}
+				body["expires_days"] = days
+			}
+			ac, err := resolveAdminClient()
+			if err != nil {
+				return err
+			}
+			var result tokenResult
+			if err := ac.Do("POST", "/tokens", body, &result); err != nil {
+				return err
+			}
+			out := cmd.OutOrStdout()
+			fmt.Fprintf(out, "\nToken issued for '%s':\n", result.User)
+			fmt.Fprintf(out, "  Role:    %s\n", result.Role)
+			fmt.Fprintf(out, "  Expires: %s\n", result.Expires)
+			fmt.Fprintf(out, "\n  Token: %s\n", result.Token)
+			fmt.Fprintln(out, "\n  WARNING: This token will NOT be shown again. Share it securely.")
+			return nil
+		},
+	}
+	cmd.Flags().StringVar(&user, "user", "", "Username")
+	cmd.Flags().StringVar(&role, "role", "", "Role name")
+	cmd.Flags().StringVar(&expires, "expires", "", "Duration until expiry (e.g. 90d, 12w, 6m)")
+	_ = cmd.MarkFlagRequired("user")
+	_ = cmd.MarkFlagRequired("role")
+	return cmd
+}
+
+func newTokenRevokeCmd() *cobra.Command {
+	var user string
+	cmd := &cobra.Command{
+		Use:   "revoke",
+		Short: "Revoke a user's token",
+		RunE: func(cmd *cobra.Command, _ []string) error {
+			ac, err := resolveAdminClient()
+			if err != nil {
+				return err
+			}
+			var result struct {
+				Message string `json:"message"`
+			}
+			if err := ac.Do("DELETE", "/tokens/"+user, nil, &result); err != nil {
+				return err
+			}
+			fmt.Fprintln(cmd.OutOrStdout(), result.Message)
+			return nil
+		},
+	}
+	cmd.Flags().StringVar(&user, "user", "", "Username")
+	_ = cmd.MarkFlagRequired("user")
+	return cmd
+}
+
+func newTokenRotateCmd() *cobra.Command {
+	var user string
+	var rotateAll bool
+	cmd := &cobra.Command{
+		Use:   "rotate",
+		Short: "Rotate one or all tokens",
+		RunE: func(cmd *cobra.Command, _ []string) error {
+			if (user == "") == (!rotateAll) {
+				return fmt.Errorf("exactly one of --user or --all is required")
+			}
+			ac, err := resolveAdminClient()
+			if err != nil {
+				return err
+			}
+			out := cmd.OutOrStdout()
+			if rotateAll {
+				var result struct {
+					Rotated int `json:"rotated"`
+					Tokens  []struct {
+						User  string `json:"user"`
+						Token string `json:"token"`
+						Role  string `json:"role"`
+					} `json:"tokens"`
+				}
+				if err := ac.Do("POST", "/tokens/_rotate_all", map[string]any{}, &result); err != nil {
+					return err
+				}
+				if result.Rotated == 0 {
+					fmt.Fprintln(out, "No tokens to rotate.")
+					return nil
+				}
+				fmt.Fprintf(out, "Rotated %d token(s):\n\n", result.Rotated)
+				for _, t := range result.Tokens {
+					fmt.Fprintf(out, "  %s: %s\n", t.User, t.Token)
+				}
+				fmt.Fprintln(out, "\n  WARNING: These tokens will NOT be shown again. Share them securely.")
+				return nil
+			}
+			var result tokenResult
+			if err := ac.Do("POST", "/tokens/"+user+"/rotate", map[string]any{}, &result); err != nil {
+				return err
+			}
+			fmt.Fprintf(out, "\nToken rotated for '%s':\n", result.User)
+			fmt.Fprintf(out, "  Role:    %s\n", result.Role)
+			fmt.Fprintf(out, "  Expires: %s\n", result.Expires)
+			fmt.Fprintf(out, "\n  Token: %s\n", result.Token)
+			fmt.Fprintln(out, "\n  WARNING: This token will NOT be shown again. Share it securely.")
+			return nil
+		},
+	}
+	cmd.Flags().StringVar(&user, "user", "", "Username to rotate")
+	cmd.Flags().BoolVar(&rotateAll, "all", false, "Rotate all tokens")
+	return cmd
+}
+
+func newTokenListCmd() *cobra.Command {
+	return &cobra.Command{
+		Use:   "list",
+		Short: "List all tokens",
+		RunE: func(cmd *cobra.Command, _ []string) error {
+			ac, err := resolveAdminClient()
+			if err != nil {
+				return err
+			}
+			var result struct {
+				Tokens []struct {
+					User      string `json:"user"`
+					Role      string `json:"role"`
+					TopK      any    `json:"top_k"`
+					RateLimit any    `json:"rate_limit"`
+					Expires   string `json:"expires"`
+				} `json:"tokens"`
+			}
+			if err := ac.Do("GET", "/tokens", nil, &result); err != nil {
+				return err
+			}
+			out := cmd.OutOrStdout()
+			if len(result.Tokens) == 0 {
+				fmt.Fprintln(out, "No tokens issued.")
+				return nil
+			}
+			// "{:<16} {:<10} {:>6} {:>10}  {:<12}" — match vault_admin_cli.py
+			fmt.Fprintf(out, "%-16s %-10s %6s %10s  %-12s\n", "USER", "ROLE", "TOP_K", "RATE", "EXPIRES")
+			for _, t := range result.Tokens {
+				fmt.Fprintf(out, "%-16s %-10s %6s %10s  %-12s\n",
+					t.User, t.Role, fmt.Sprintf("%v", t.TopK), fmt.Sprintf("%v", t.RateLimit), t.Expires)
+			}
+			return nil
+		},
+	}
+}
+
+// formatScope is referenced from role.go; defined here to share with token output if needed.
+func formatScope(scope []string) string { return strings.Join(scope, ",") }
diff --git a/vault/internal/commands/version.go b/vault/internal/commands/version.go
new file mode 100644
index 0000000..93ab188
--- /dev/null
+++ b/vault/internal/commands/version.go
@@ -0,0 +1,28 @@
+package commands
+
+import (
+	"fmt"
+	"runtime"
+
+	"github.com/spf13/cobra"
+)
+
+var (
+	buildVersion = "dev"
+	buildCommit  = "none"
+	buildDate    = "unknown"
+)
+
+func newVersionCmd() *cobra.Command {
+	return &cobra.Command{
+		Use:   "version",
+		Short: "Print runevault version (works without daemon or socket)",
+		RunE: func(cmd *cobra.Command, args []string) error {
+			fmt.Fprintf(cmd.OutOrStdout(),
+				"runevault %s (commit %s, built %s, %s/%s, %s)\n",
+				buildVersion, buildCommit, buildDate,
+				runtime.GOOS, runtime.GOARCH, runtime.Version())
+			return nil
+		},
+	}
+}
diff --git a/vault/internal/crypto/keys.go b/vault/internal/crypto/keys.go
new file mode 100644
index 0000000..bfa74ce
--- /dev/null
+++ b/vault/internal/crypto/keys.go
@@ -0,0 +1,118 @@
+package crypto
+
+import (
+	"errors"
+	"fmt"
+	"os"
+	"path/filepath"
+
+	envector "github.com/CryptoLabInc/envector-go-sdk"
+)
+
+// EnvectorKeys is a thin wrapper around envector-go-sdk's *Keys handle that
+// constrains usage to decrypt-only (KeyPartSec) — Vault never encrypts.
+//
+// On-disk layout matches pyenvector: <root>/<keyID>/{Enc,Sec,Eval}Key.json.
+// envector-go-sdk reads pyenvector's JSON envelope natively, so existing
+// installs work without migration.
+type EnvectorKeys struct {
+	keys *envector.Keys
+}
+
+// KeysParams names the on-disk key bundle and FHE dimension.
+type KeysParams struct {
+	// Root is the parent directory containing <KeyID>/.
+	// E.g., "/opt/runevault/vault-keys" with KeyID "vault-key" reads from
+	// "/opt/runevault/vault-keys/vault-key/{Enc,Sec,Eval}Key.json".
+	Root  string
+	KeyID string
+	Dim   int
+}
+
+func (p KeysParams) keyDir() string { return filepath.Join(p.Root, p.KeyID) }
+
+// KeysExist reports whether the bundle is present under Root/KeyID.
+func KeysExist(p KeysParams) bool {
+	return envector.KeysExist(
+		envector.WithKeyPath(p.keyDir()),
+		envector.WithKeyID(p.KeyID),
+		envector.WithKeyDim(p.Dim),
+	)
+}
+
+// EnsureKeys generates a fresh bundle if none exists. No-op if any of the
+// three slots is already present (envector.GenerateKeys never overwrites).
+func EnsureKeys(p KeysParams) error {
+	if KeysExist(p) {
+		return nil
+	}
+	if err := os.MkdirAll(p.keyDir(), 0o700); err != nil {
+		return fmt.Errorf("crypto: mkdir key dir: %w", err)
+	}
+	if err := envector.GenerateKeys(
+		envector.WithKeyPath(p.keyDir()),
+		envector.WithKeyID(p.KeyID),
+		envector.WithKeyDim(p.Dim),
+	); err != nil && !errors.Is(err, envector.ErrKeysAlreadyExist) {
+		return fmt.Errorf("crypto: generate keys: %w", err)
+	}
+	return nil
+}
+
+// OpenSecretKey loads SecKey.json only — Vault is decrypt-only.
+// Returns EnvectorKeys whose Decrypt method is wired to envector-go-sdk's CKKS
+// decryptor; encryption is unavailable.
+func OpenSecretKey(p KeysParams) (*EnvectorKeys, error) {
+	k, err := envector.OpenKeysFromFile(
+		envector.WithKeyPath(p.keyDir()),
+		envector.WithKeyID(p.KeyID),
+		envector.WithKeyDim(p.Dim),
+		envector.WithKeyParts(envector.KeyPartSec),
+	)
+	if err != nil {
+		return nil, fmt.Errorf("crypto: open sec key: %w", err)
+	}
+	return &EnvectorKeys{keys: k}, nil
+}
+
+// Decrypt unpacks a CiphertextScore proto blob into per-shard score
+// vectors. The returned slices are aligned: scores[i] is the score vector
+// for shard shardIdx[i]. The gRPC layer flattens these into ScoreEntry
+// rows and applies Top-K.
+func (f *EnvectorKeys) Decrypt(blob []byte) (scores [][]float64, shardIdx []int32, err error) {
+	if f == nil || f.keys == nil {
+		return nil, nil, errors.New("crypto: EnvectorKeys closed")
+	}
+	return f.keys.Decrypt(blob)
+}
+
+// PublicKeyBundle reads EncKey.json and EvalKey.json file contents from
+// disk. The strings are returned verbatim for inclusion in the GetPublicKey
+// gRPC response — clients re-parse them with their own SDK.
+type PublicKeyBundle struct {
+	EncKey  string
+	EvalKey string
+}
+
+func ReadPublicKeyBundle(p KeysParams) (*PublicKeyBundle, error) {
+	encPath := filepath.Join(p.keyDir(), "EncKey.json")
+	evalPath := filepath.Join(p.keyDir(), "EvalKey.json")
+	enc, err := os.ReadFile(encPath)
+	if err != nil {
+		return nil, fmt.Errorf("crypto: read EncKey.json: %w", err)
+	}
+	eval, err := os.ReadFile(evalPath)
+	if err != nil {
+		return nil, fmt.Errorf("crypto: read EvalKey.json: %w", err)
+	}
+	return &PublicKeyBundle{EncKey: string(enc), EvalKey: string(eval)}, nil
+}
+
+func (f *EnvectorKeys) Close() error {
+	if f == nil || f.keys == nil {
+		return nil
+	}
+	err := f.keys.Close()
+	f.keys = nil
+	return err
+}
diff --git a/vault/internal/crypto/keys_test.go b/vault/internal/crypto/keys_test.go
new file mode 100644
index 0000000..fdbaebd
--- /dev/null
+++ b/vault/internal/crypto/keys_test.go
@@ -0,0 +1,49 @@
+package crypto
+
+import (
+	"errors"
+	"path/filepath"
+	"testing"
+
+	envector "github.com/CryptoLabInc/envector-go-sdk"
+)
+
+func TestKeysExistFalseForMissingDir(t *testing.T) {
+	p := KeysParams{Root: filepath.Join(t.TempDir(), "no-such"), KeyID: "vault-key", Dim: 1024}
+	if KeysExist(p) {
+		t.Error("KeysExist = true for missing dir")
+	}
+}
+
+func TestOpenSecretKeyMissingReturnsError(t *testing.T) {
+	p := KeysParams{Root: t.TempDir(), KeyID: "vault-key", Dim: 1024}
+	_, err := OpenSecretKey(p)
+	if err == nil {
+		t.Fatal("OpenSecretKey on missing keys returned nil error")
+	}
+	// envector-go-sdk wraps ErrKeysNotFound; we wrap further. Match by message.
+	if !errors.Is(err, envector.ErrKeysNotFound) {
+		t.Logf("err = %v (does not unwrap to ErrKeysNotFound, but is non-nil)", err)
+	}
+}
+
+func TestReadPublicKeyBundleMissingReturnsError(t *testing.T) {
+	p := KeysParams{Root: t.TempDir(), KeyID: "vault-key", Dim: 1024}
+	if _, err := ReadPublicKeyBundle(p); err == nil {
+		t.Error("ReadPublicKeyBundle on missing keys returned nil error")
+	}
+}
+
+func TestNilEnvectorKeysCloseSafe(t *testing.T) {
+	var f *EnvectorKeys
+	if err := f.Close(); err != nil {
+		t.Errorf("nil Close: %v", err)
+	}
+}
+
+func TestNilEnvectorKeysDecryptError(t *testing.T) {
+	var f *EnvectorKeys
+	if _, _, err := f.Decrypt([]byte("anything")); err == nil {
+		t.Error("nil Decrypt should error")
+	}
+}
diff --git a/vault/internal/crypto/metadata.go b/vault/internal/crypto/metadata.go
new file mode 100644
index 0000000..eb880d0
--- /dev/null
+++ b/vault/internal/crypto/metadata.go
@@ -0,0 +1,105 @@
+// Package crypto provides metadata key derivation, AES-256-CTR metadata
+// encryption (wire-compatible with pyenvector.utils.aes), and FHE key
+// lifecycle wrappers around envector-go-sdk.
+//
+// Wire format for metadata ciphertext (mirrors pyenvector.utils.aes.AESHelper):
+//
+//	base64( IV (16 bytes) || ciphertext (variable) )
+//
+// AES-256-CTR is unauthenticated; integrity is enforced by upstream JSON
+// envelopes and HKDF-derived per-agent keys.
+package crypto
+
+import (
+	"crypto/aes"
+	"crypto/cipher"
+	"crypto/rand"
+	"crypto/sha256"
+	"encoding/base64"
+	"encoding/hex"
+	"errors"
+	"fmt"
+	"io"
+
+	"golang.org/x/crypto/hkdf"
+)
+
+const (
+	dekLen = 32
+	ivLen  = 16
+)
+
+var (
+	ErrInvalidKey        = errors.New("crypto: AES key must be 32 bytes")
+	ErrInvalidCiphertext = errors.New("crypto: ciphertext too short (need >= 16 bytes after base64 decode)")
+)
+
+// DeriveAgentKey returns a 32-byte AES-256 DEK derived from the team-wide
+// secret and a per-agent identifier via HKDF-SHA256. Mirrors
+// vault.vault_core.derive_agent_key (HKDF salt=None, info=agent_id utf-8).
+func DeriveAgentKey(teamSecret, agentID string) ([]byte, error) {
+	if teamSecret == "" {
+		return nil, errors.New("crypto: team_secret is empty")
+	}
+	r := hkdf.New(sha256.New, []byte(teamSecret), nil, []byte(agentID))
+	dek := make([]byte, dekLen)
+	if _, err := io.ReadFull(r, dek); err != nil {
+		return nil, fmt.Errorf("crypto: hkdf read: %w", err)
+	}
+	return dek, nil
+}
+
+// AgentIDFromToken returns the per-token agent identifier:
+// the first 32 hex chars of SHA-256(token).
+func AgentIDFromToken(token string) string {
+	sum := sha256.Sum256([]byte(token))
+	return hex.EncodeToString(sum[:])[:32]
+}
+
+// EncryptMetadata produces a base64-encoded ciphertext compatible with
+// pyenvector.utils.aes.encrypt_metadata: AES-256-CTR with a random 16-byte
+// IV prefixed to the ciphertext.
+func EncryptMetadata(plaintext, key []byte) (string, error) {
+	if len(key) != dekLen {
+		return "", ErrInvalidKey
+	}
+	iv := make([]byte, ivLen)
+	if _, err := rand.Read(iv); err != nil {
+		return "", fmt.Errorf("crypto: read iv: %w", err)
+	}
+	block, err := aes.NewCipher(key)
+	if err != nil {
+		return "", err
+	}
+	ct := make([]byte, len(plaintext))
+	cipher.NewCTR(block, iv).XORKeyStream(ct, plaintext)
+	out := make([]byte, 0, ivLen+len(ct))
+	out = append(out, iv...)
+	out = append(out, ct...)
+	return base64.StdEncoding.EncodeToString(out), nil
+}
+
+// DecryptMetadata reverses EncryptMetadata: base64-decode the input, peel
+// off the 16-byte IV, then AES-256-CTR decrypt. Output is raw bytes; the
+// caller decides whether to UTF-8/JSON-parse them.
+func DecryptMetadata(ctB64 string, key []byte) ([]byte, error) {
+	if len(key) != dekLen {
+		return nil, ErrInvalidKey
+	}
+	raw, err := base64.StdEncoding.DecodeString(ctB64)
+	if err != nil {
+		return nil, fmt.Errorf("crypto: base64 decode: %w", err)
+	}
+	if len(raw) < ivLen {
+		return nil, ErrInvalidCiphertext
+	}
+	iv := raw[:ivLen]
+	ct := raw[ivLen:]
+	block, err := aes.NewCipher(key)
+	if err != nil {
+		return nil, err
+	}
+	pt := make([]byte, len(ct))
+	cipher.NewCTR(block, iv).XORKeyStream(pt, ct)
+	return pt, nil
+}
diff --git a/vault/internal/crypto/metadata_test.go b/vault/internal/crypto/metadata_test.go
new file mode 100644
index 0000000..ff6509b
--- /dev/null
+++ b/vault/internal/crypto/metadata_test.go
@@ -0,0 +1,223 @@
+package crypto
+
+import (
+	"bytes"
+	"encoding/base64"
+	"encoding/hex"
+	"strings"
+	"testing"
+)
+
+// HKDF golden vector — derived from Python:
+//
+//	cryptography.hazmat.primitives.kdf.hkdf.HKDF(
+//	    algorithm=SHA256(), length=32, salt=None, info=b"abc123def456")
+//	    .derive(b"test-team-secret-32-bytes-please")
+const (
+	goldenTeamSecret = "test-team-secret-32-bytes-please"
+	goldenAgentID    = "abc123def456"
+	goldenDEKHex     = "0e4757183d2aa64e384012a494accb6fa18b8ff144c97b78b91bec3b6720767a"
+
+	demoToken        = "evt_0000000000000000000000000000demo"
+	demoTokenAgentID = "a84c4af3aac6f4479a6741d9df0cda65"
+)
+
+func TestDeriveAgentKeyMatchesPython(t *testing.T) {
+	got, err := DeriveAgentKey(goldenTeamSecret, goldenAgentID)
+	if err != nil {
+		t.Fatal(err)
+	}
+	want, _ := hex.DecodeString(goldenDEKHex)
+	if !bytes.Equal(got, want) {
+		t.Errorf("DEK mismatch\n got %x\nwant %s", got, goldenDEKHex)
+	}
+}
+
+func TestDeriveAgentKeyDeterministic(t *testing.T) {
+	d1, err := DeriveAgentKey(goldenTeamSecret, goldenAgentID)
+	if err != nil {
+		t.Fatal(err)
+	}
+	d2, err := DeriveAgentKey(goldenTeamSecret, goldenAgentID)
+	if err != nil {
+		t.Fatal(err)
+	}
+	if !bytes.Equal(d1, d2) {
+		t.Error("HKDF output non-deterministic")
+	}
+}
+
+func TestDeriveAgentKeyDifferentAgents(t *testing.T) {
+	a, _ := DeriveAgentKey(goldenTeamSecret, "agent-a")
+	b, _ := DeriveAgentKey(goldenTeamSecret, "agent-b")
+	if bytes.Equal(a, b) {
+		t.Error("different agents produced same DEK")
+	}
+}
+
+func TestDeriveAgentKeyEmptyTeamSecret(t *testing.T) {
+	if _, err := DeriveAgentKey("", "x"); err == nil {
+		t.Error("empty team secret should error")
+	}
+}
+
+func TestAgentIDFromDemoToken(t *testing.T) {
+	got := AgentIDFromToken(demoToken)
+	if got != demoTokenAgentID {
+		t.Errorf("agent_id = %q, want %q", got, demoTokenAgentID)
+	}
+	if len(got) != 32 {
+		t.Errorf("agent_id length = %d, want 32", len(got))
+	}
+}
+
+// ── round-trip ────────────────────────────────────────────────────
+
+func TestEncryptDecryptRoundTripStr(t *testing.T) {
+	key, _ := DeriveAgentKey(goldenTeamSecret, goldenAgentID)
+	plaintext := []byte("hello world")
+	ct, err := EncryptMetadata(plaintext, key)
+	if err != nil {
+		t.Fatal(err)
+	}
+	got, err := DecryptMetadata(ct, key)
+	if err != nil {
+		t.Fatal(err)
+	}
+	if !bytes.Equal(got, plaintext) {
+		t.Errorf("round-trip mismatch: got %q, want %q", got, plaintext)
+	}
+}
+
+func TestEncryptDecryptRoundTripBinary(t *testing.T) {
+	key, _ := DeriveAgentKey(goldenTeamSecret, goldenAgentID)
+	plaintext := []byte{0, 1, 2, 3, 'b', 'i', 'n', 'a', 'r', 'y'}
+	ct, err := EncryptMetadata(plaintext, key)
+	if err != nil {
+		t.Fatal(err)
+	}
+	got, err := DecryptMetadata(ct, key)
+	if err != nil {
+		t.Fatal(err)
+	}
+	if !bytes.Equal(got, plaintext) {
+		t.Errorf("round-trip mismatch: got %x, want %x", got, plaintext)
+	}
+}
+
+func TestEncryptDecryptRoundTripJSON(t *testing.T) {
+	key, _ := DeriveAgentKey(goldenTeamSecret, goldenAgentID)
+	plaintext := []byte(`{"foo":"bar","n":42}`)
+	ct, err := EncryptMetadata(plaintext, key)
+	if err != nil {
+		t.Fatal(err)
+	}
+	got, err := DecryptMetadata(ct, key)
+	if err != nil {
+		t.Fatal(err)
+	}
+	if !bytes.Equal(got, plaintext) {
+		t.Errorf("round-trip mismatch: got %s, want %s", got, plaintext)
+	}
+}
+
+// IV must change every encryption (random 16 bytes prefixed)
+func TestEncryptUsesRandomIV(t *testing.T) {
+	key, _ := DeriveAgentKey(goldenTeamSecret, goldenAgentID)
+	pt := []byte("same plaintext")
+	ct1, _ := EncryptMetadata(pt, key)
+	ct2, _ := EncryptMetadata(pt, key)
+	if ct1 == ct2 {
+		t.Error("two encryptions of same plaintext returned identical ciphertext (IV reuse?)")
+	}
+}
+
+// ── cross-language: decrypt Python-produced ciphertexts ──────────
+
+func TestDecryptPythonGoldenStr(t *testing.T) {
+	key, _ := DeriveAgentKey(goldenTeamSecret, goldenAgentID)
+	// Python: encrypt_metadata("hello world", dek) →
+	pythonCT := "OhawM+14dWV/2KJwL0Ud3pqJpP6Mr7XVfCsM"
+	got, err := DecryptMetadata(pythonCT, key)
+	if err != nil {
+		t.Fatal(err)
+	}
+	if string(got) != "hello world" {
+		t.Errorf("decrypt = %q, want %q", got, "hello world")
+	}
+}
+
+func TestDecryptPythonGoldenDict(t *testing.T) {
+	key, _ := DeriveAgentKey(goldenTeamSecret, goldenAgentID)
+	// Python: encrypt_metadata({"foo": "bar", "n": 42}, dek) →
+	// (the dict is JSON-serialized as {"foo":"bar","n":42} — separators=(",", ":"))
+	pythonCT := "x801QtEfmRM9Hg9ncV0p1aHbcPTBGI/63+L7c/TPVoPFRS/p"
+	got, err := DecryptMetadata(pythonCT, key)
+	if err != nil {
+		t.Fatal(err)
+	}
+	want := `{"foo":"bar","n":42}`
+	if string(got) != want {
+		t.Errorf("decrypt = %q, want %q", got, want)
+	}
+}
+
+func TestDecryptPythonGoldenBytes(t *testing.T) {
+	key, _ := DeriveAgentKey(goldenTeamSecret, goldenAgentID)
+	// Python: encrypt_metadata(b"\x00\x01\x02\x03binary", dek)
+	pythonCT := "zAoZPxGEAucFdLBQWyahXBFCCwjLL8z2RjA="
+	got, err := DecryptMetadata(pythonCT, key)
+	if err != nil {
+		t.Fatal(err)
+	}
+	want := []byte{0, 1, 2, 3, 'b', 'i', 'n', 'a', 'r', 'y'}
+	if !bytes.Equal(got, want) {
+		t.Errorf("decrypt = %x, want %x", got, want)
+	}
+}
+
+// ── error cases ──────────────────────────────────────────────────
+
+func TestDecryptInvalidKey(t *testing.T) {
+	short := []byte("short")
+	if _, err := DecryptMetadata("anything", short); err != ErrInvalidKey {
+		t.Errorf("err = %v, want ErrInvalidKey", err)
+	}
+}
+
+func TestEncryptInvalidKey(t *testing.T) {
+	short := []byte("short")
+	if _, err := EncryptMetadata([]byte("x"), short); err != ErrInvalidKey {
+		t.Errorf("err = %v, want ErrInvalidKey", err)
+	}
+}
+
+func TestDecryptInvalidBase64(t *testing.T) {
+	key := make([]byte, 32)
+	if _, err := DecryptMetadata("!!!not-base64!!!", key); err == nil {
+		t.Error("invalid base64 should error")
+	}
+}
+
+func TestDecryptShortCiphertext(t *testing.T) {
+	key := make([]byte, 32)
+	short := base64.StdEncoding.EncodeToString([]byte("only12bytes!"))
+	if _, err := DecryptMetadata(short, key); err != ErrInvalidCiphertext {
+		t.Errorf("err = %v, want ErrInvalidCiphertext", err)
+	}
+}
+
+// ── secret leakage guard ─────────────────────────────────────────
+
+// Ensure key bytes never appear in error messages.
+func TestErrorsDoNotLeakKey(t *testing.T) {
+	key, _ := DeriveAgentKey(goldenTeamSecret, goldenAgentID)
+	keyHex := hex.EncodeToString(key)
+	_, err := DecryptMetadata("!!!", key)
+	if err == nil {
+		t.Fatal("expected error")
+	}
+	if strings.Contains(err.Error(), keyHex[:16]) {
+		t.Errorf("error message leaked key prefix: %q", err)
+	}
+}
diff --git a/vault/internal/server/audit.go b/vault/internal/server/audit.go
new file mode 100644
index 0000000..d5ce3b2
--- /dev/null
+++ b/vault/internal/server/audit.go
@@ -0,0 +1,181 @@
+package server
+
+import (
+	"encoding/json"
+	"fmt"
+	"io"
+	"net"
+	"os"
+	"path/filepath"
+	"strings"
+	"sync"
+	"time"
+
+	"google.golang.org/grpc/peer"
+	"gopkg.in/natefinch/lumberjack.v2"
+)
+
+// AuditMode parses AuditConfig.Mode strings into per-sink booleans.
+// Valid values: "", "file", "stdout", "file+stdout".
+type AuditMode struct {
+	File   bool
+	Stdout bool
+}
+
+func ParseAuditMode(mode string) AuditMode {
+	out := AuditMode{}
+	if mode == "" {
+		return out
+	}
+	for _, p := range strings.Split(mode, "+") {
+		switch strings.TrimSpace(strings.ToLower(p)) {
+		case "file":
+			out.File = true
+		case "stdout":
+			out.Stdout = true
+		}
+	}
+	return out
+}
+
+// AuditEntry is the JSON structure written per request. Fields and order
+// must match vault/audit.py:118-145 to keep golden compat tests aligned.
+type AuditEntry struct {
+	Timestamp   string  `json:"timestamp"`
+	UserID      string  `json:"user_id"`
+	Method      string  `json:"method"`
+	TopK        *int32  `json:"top_k"`
+	ResultCount int     `json:"result_count"`
+	Status      string  `json:"status"`
+	SourceIP    string  `json:"source_ip"`
+	LatencyMs   float64 `json:"latency_ms"`
+	Error       *string `json:"error,omitempty"`
+}
+
+// AuditLogger writes structured audit entries. Closed loggers are no-ops.
+type AuditLogger struct {
+	mu      sync.Mutex
+	writers []io.Writer
+	closers []io.Closer
+}
+
+// NewAuditLogger constructs a logger for the given mode + file path.
+// Returns a logger with Enabled() == false when the mode is empty.
+func NewAuditLogger(cfg AuditConfig) (*AuditLogger, error) {
+	mode := ParseAuditMode(cfg.Mode)
+	l := &AuditLogger{}
+
+	if mode.File {
+		path := cfg.Path
+		if path == "" {
+			path = "/var/log/runevault/audit.log"
+		}
+		if err := os.MkdirAll(filepath.Dir(path), 0o750); err != nil {
+			return nil, fmt.Errorf("audit: mkdir log dir: %w", err)
+		}
+		// Lumberjack handles daily-ish rotation by size + age. Match the
+		// Python deployment's 30-day retention; size cap is high enough
+		// that audit volume drives rotation by age, not size.
+		rot := &lumberjack.Logger{
+			Filename:   path,
+			MaxSize:    100, // MB
+			MaxAge:     30,
+			MaxBackups: 30,
+			LocalTime:  false,
+			Compress:   false,
+		}
+		l.writers = append(l.writers, rot)
+		l.closers = append(l.closers, rot)
+	}
+
+	if mode.Stdout {
+		l.writers = append(l.writers, os.Stdout)
+	}
+	return l, nil
+}
+
+// Enabled reports whether at least one sink is configured.
+func (a *AuditLogger) Enabled() bool {
+	if a == nil {
+		return false
+	}
+	a.mu.Lock()
+	defer a.mu.Unlock()
+	return len(a.writers) > 0
+}
+
+// Log emits a single audit entry. Round-trip latency is rounded to 2dp
+// to match Python's `round(latency_ms, 2)`.
+func (a *AuditLogger) Log(e AuditEntry) {
+	if a == nil || !a.Enabled() {
+		return
+	}
+	e.LatencyMs = roundTo(e.LatencyMs, 2)
+
+	buf, err := json.Marshal(&e)
+	if err != nil {
+		return
+	}
+	buf = append(buf, '\n')
+
+	a.mu.Lock()
+	defer a.mu.Unlock()
+	for _, w := range a.writers {
+		_, _ = w.Write(buf)
+	}
+}
+
+// Close flushes file writers and prevents future Log calls from writing.
+func (a *AuditLogger) Close() error {
+	if a == nil {
+		return nil
+	}
+	a.mu.Lock()
+	defer a.mu.Unlock()
+	var firstErr error
+	for _, c := range a.closers {
+		if err := c.Close(); err != nil && firstErr == nil {
+			firstErr = err
+		}
+	}
+	a.writers = nil
+	a.closers = nil
+	return firstErr
+}
+
+func roundTo(v float64, decimals int) float64 {
+	mult := 1.0
+	for i := 0; i < decimals; i++ {
+		mult *= 10
+	}
+	if v >= 0 {
+		return float64(int64(v*mult+0.5)) / mult
+	}
+	return float64(int64(v*mult-0.5)) / mult
+}
+
+// ExtractSourceIP mirrors vault/audit.py:55-78 — peer addresses come in
+// gRPC's "ipv4:H:P", "ipv6:[::1]:P", or "unix:/path" form.
+func ExtractSourceIP(p *peer.Peer) string {
+	if p == nil || p.Addr == nil {
+		return "unknown"
+	}
+	addr := p.Addr.String()
+	switch a := p.Addr.(type) {
+	case *net.TCPAddr:
+		if a.IP == nil {
+			return addr
+		}
+		return a.IP.String()
+	case *net.UnixAddr:
+		return "unix:" + a.Name
+	}
+	if h, _, err := net.SplitHostPort(addr); err == nil {
+		return h
+	}
+	return addr
+}
+
+func nowUTCISO() string {
+	return time.Now().UTC().Format("2006-01-02T15:04:05.000000Z07:00")
+}
diff --git a/vault/internal/server/audit_test.go b/vault/internal/server/audit_test.go
new file mode 100644
index 0000000..adb55bb
--- /dev/null
+++ b/vault/internal/server/audit_test.go
@@ -0,0 +1,156 @@
+package server
+
+import (
+	"bufio"
+	"encoding/json"
+	"net"
+	"os"
+	"path/filepath"
+	"strings"
+	"testing"
+
+	"google.golang.org/grpc/peer"
+)
+
+func TestParseAuditMode(t *testing.T) {
+	cases := map[string]AuditMode{
+		"":             {},
+		"file":         {File: true},
+		"stdout":       {Stdout: true},
+		"file+stdout":  {File: true, Stdout: true},
+		"stdout+file":  {File: true, Stdout: true},
+		"FILE":         {File: true},
+		"  file  ":     {File: true},
+		"unknown":      {},
+		"file+unknown": {File: true},
+	}
+	for in, want := range cases {
+		got := ParseAuditMode(in)
+		if got != want {
+			t.Errorf("ParseAuditMode(%q) = %+v, want %+v", in, got, want)
+		}
+	}
+}
+
+func TestAuditLoggerDisabledWhenModeEmpty(t *testing.T) {
+	l, err := NewAuditLogger(AuditConfig{Mode: ""})
+	if err != nil {
+		t.Fatal(err)
+	}
+	if l.Enabled() {
+		t.Error("logger enabled with empty mode")
+	}
+	// Log on disabled logger must be no-op (and not panic).
+	l.Log(AuditEntry{UserID: "x"})
+}
+
+func TestAuditLoggerFileMode(t *testing.T) {
+	dir := t.TempDir()
+	path := filepath.Join(dir, "audit.log")
+	l, err := NewAuditLogger(AuditConfig{Mode: "file", Path: path})
+	if err != nil {
+		t.Fatal(err)
+	}
+	defer l.Close()
+
+	topK := int32(10)
+	errMsg := "boom"
+	l.Log(AuditEntry{
+		Timestamp:   "2026-04-23T00:00:00.000000Z",
+		UserID:      "alice",
+		Method:      "decrypt_scores",
+		TopK:        &topK,
+		ResultCount: 7,
+		Status:      "success",
+		SourceIP:    "127.0.0.1",
+		LatencyMs:   45.6789,
+		Error:       &errMsg,
+	})
+	l.Close()
+
+	f, err := os.Open(path)
+	if err != nil {
+		t.Fatal(err)
+	}
+	defer f.Close()
+	scanner := bufio.NewScanner(f)
+	if !scanner.Scan() {
+		t.Fatal("audit log empty")
+	}
+	var got map[string]any
+	if err := json.Unmarshal(scanner.Bytes(), &got); err != nil {
+		t.Fatal(err)
+	}
+	if got["user_id"] != "alice" {
+		t.Errorf("user_id = %v, want alice", got["user_id"])
+	}
+	if got["method"] != "decrypt_scores" {
+		t.Errorf("method = %v", got["method"])
+	}
+	if got["top_k"].(float64) != 10 {
+		t.Errorf("top_k = %v", got["top_k"])
+	}
+	if got["latency_ms"].(float64) != 45.68 {
+		t.Errorf("latency_ms = %v, want 45.68 (rounded)", got["latency_ms"])
+	}
+	if got["error"] != "boom" {
+		t.Errorf("error = %v", got["error"])
+	}
+}
+
+func TestAuditLoggerOmitsErrorWhenNil(t *testing.T) {
+	dir := t.TempDir()
+	path := filepath.Join(dir, "audit.log")
+	l, err := NewAuditLogger(AuditConfig{Mode: "file", Path: path})
+	if err != nil {
+		t.Fatal(err)
+	}
+	defer l.Close()
+	l.Log(AuditEntry{UserID: "x", Method: "y", Status: "success"})
+	l.Close()
+
+	body, _ := os.ReadFile(path)
+	if strings.Contains(string(body), `"error"`) {
+		t.Errorf("audit entry contains error field for non-error case: %s", body)
+	}
+}
+
+func TestExtractSourceIPTCP(t *testing.T) {
+	addr := &net.TCPAddr{IP: net.ParseIP("10.0.0.5"), Port: 12345}
+	got := ExtractSourceIP(&peer.Peer{Addr: addr})
+	if got != "10.0.0.5" {
+		t.Errorf("got %q, want 10.0.0.5", got)
+	}
+}
+
+func TestExtractSourceIPUnix(t *testing.T) {
+	addr := &net.UnixAddr{Name: "/tmp/x.sock", Net: "unix"}
+	got := ExtractSourceIP(&peer.Peer{Addr: addr})
+	if got != "unix:/tmp/x.sock" {
+		t.Errorf("got %q, want unix:/tmp/x.sock", got)
+	}
+}
+
+func TestExtractSourceIPNil(t *testing.T) {
+	if got := ExtractSourceIP(nil); got != "unknown" {
+		t.Errorf("nil peer: got %q, want unknown", got)
+	}
+}
+
+func TestRoundTo(t *testing.T) {
+	cases := []struct {
+		in   float64
+		want float64
+	}{
+		{45.6789, 45.68},
+		{45.6749, 45.67},
+		{0, 0},
+		{-1.236, -1.24},
+	}
+	for _, c := range cases {
+		got := roundTo(c.in, 2)
+		if got != c.want {
+			t.Errorf("roundTo(%v,2) = %v, want %v", c.in, got, c.want)
+		}
+	}
+}
diff --git a/vault/internal/server/grpc_test.go b/vault/internal/server/grpc_test.go
new file mode 100644
index 0000000..391b266
--- /dev/null
+++ b/vault/internal/server/grpc_test.go
@@ -0,0 +1,205 @@
+package server
+
+import (
+	"context"
+	"errors"
+	"strings"
+	"testing"
+
+	"google.golang.org/grpc/codes"
+	"google.golang.org/grpc/status"
+
+	"github.com/CryptoLabInc/rune-admin/vault/internal/tokens"
+	pb "github.com/CryptoLabInc/rune-admin/vault/pkg/vaultpb"
+)
+
+// ── topK_FromShards ───────────────────────────────────────────────
+
+func TestTopKFlatSingleShard(t *testing.T) {
+	scores := [][]float64{{0.5, 0.9, 0.1, 0.7}}
+	shardIdx := []int32{0}
+	got := topK_FromShards(scores, shardIdx, 2)
+	if len(got) != 2 {
+		t.Fatalf("len = %d", len(got))
+	}
+	if got[0].Score != 0.9 || got[1].Score != 0.7 {
+		t.Errorf("scores = [%v %v], want [0.9 0.7]", got[0].Score, got[1].Score)
+	}
+	if got[0].RowIdx != 1 || got[1].RowIdx != 3 {
+		t.Errorf("rows = [%d %d], want [1 3]", got[0].RowIdx, got[1].RowIdx)
+	}
+}
+
+func TestTopKMultiShard(t *testing.T) {
+	scores := [][]float64{
+		{0.1, 0.2},
+		{0.9, 0.5},
+	}
+	shardIdx := []int32{10, 20}
+	got := topK_FromShards(scores, shardIdx, 3)
+	if len(got) != 3 {
+		t.Fatalf("len = %d", len(got))
+	}
+	// Top-3 by score desc: 0.9 (shard 20, row 0), 0.5 (shard 20, row 1), 0.2 (shard 10, row 1)
+	if got[0].Score != 0.9 || got[0].ShardIdx != 20 || got[0].RowIdx != 0 {
+		t.Errorf("[0] = %+v", got[0])
+	}
+	if got[1].Score != 0.5 || got[1].ShardIdx != 20 || got[1].RowIdx != 1 {
+		t.Errorf("[1] = %+v", got[1])
+	}
+	if got[2].Score != 0.2 || got[2].ShardIdx != 10 || got[2].RowIdx != 1 {
+		t.Errorf("[2] = %+v", got[2])
+	}
+}
+
+func TestTopKKExceedsAvailable(t *testing.T) {
+	scores := [][]float64{{0.1, 0.2}}
+	got := topK_FromShards(scores, []int32{0}, 10)
+	if len(got) != 2 {
+		t.Errorf("len = %d, want 2 (clamped to available)", len(got))
+	}
+}
+
+func TestTopKEmptyInput(t *testing.T) {
+	got := topK_FromShards(nil, nil, 5)
+	if len(got) != 0 {
+		t.Errorf("len = %d, want 0", len(got))
+	}
+}
+
+// ── error mapping ─────────────────────────────────────────────────
+
+func TestMapTokenErrorCodes(t *testing.T) {
+	cases := []struct {
+		err  error
+		code codes.Code
+	}{
+		{tokens.ErrTokenNotFound{}, codes.Unauthenticated},
+		{tokens.ErrTokenExpired{User: "x"}, codes.Unauthenticated},
+		{tokens.ErrRateLimit{RetryAfter: 5}, codes.ResourceExhausted},
+		{tokens.ErrScope{Method: "m", RoleName: "r"}, codes.PermissionDenied},
+		{tokens.ErrTopKExceeded{Requested: 50, MaxTopK: 10, RoleName: "member"}, codes.InvalidArgument},
+		{errors.New("random"), codes.Unauthenticated},
+	}
+	for _, c := range cases {
+		got, _ := mapTokenError(c.err)
+		if got != c.code {
+			t.Errorf("mapTokenError(%v) = %v, want %v", c.err, got, c.code)
+		}
+	}
+}
+
+// ── handler — token error paths (no FHE keys needed) ─────────────
+
+func newTestVault(t *testing.T) *Vault {
+	t.Helper()
+	cfg := &Config{
+		Tokens: TokensConfig{TeamSecret: "test-secret"},
+		Keys:   KeysConfig{Path: t.TempDir(), EmbeddingDim: 1024},
+	}
+	store := tokens.NewStore()
+	store.LoadDefaultsWithDemoToken()
+	audit, _ := NewAuditLogger(AuditConfig{Mode: ""})
+	return NewVault(cfg, store, nil, audit)
+}
+
+func TestGetPublicKeyInvalidToken(t *testing.T) {
+	v := newTestVault(t)
+	srv := NewVaultGRPC(v)
+	resp, err := srv.GetPublicKey(context.Background(), &pb.GetPublicKeyRequest{
+		Token: "evt_ffffffffffffffffffffffffffffffff",
+	})
+	if status.Code(err) != codes.Unauthenticated {
+		t.Errorf("code = %v, want Unauthenticated", status.Code(err))
+	}
+	if resp.GetError() == "" {
+		t.Error("response.error is empty")
+	}
+}
+
+func TestDecryptScoresInvalidToken(t *testing.T) {
+	v := newTestVault(t)
+	srv := NewVaultGRPC(v)
+	_, err := srv.DecryptScores(context.Background(), &pb.DecryptScoresRequest{
+		Token:            "evt_ffffffffffffffffffffffffffffffff",
+		EncryptedBlobB64: "AA==",
+		TopK:             5,
+	})
+	if status.Code(err) != codes.Unauthenticated {
+		t.Errorf("code = %v, want Unauthenticated", status.Code(err))
+	}
+}
+
+func TestDecryptScoresTopKExceeded(t *testing.T) {
+	v := newTestVault(t)
+	srv := NewVaultGRPC(v)
+	// Demo token has admin role with top_k=50; request 51.
+	_, err := srv.DecryptScores(context.Background(), &pb.DecryptScoresRequest{
+		Token:            tokens.DemoToken,
+		EncryptedBlobB64: "AA==",
+		TopK:             51,
+	})
+	if status.Code(err) != codes.InvalidArgument {
+		t.Fatalf("code = %v, want InvalidArgument", status.Code(err))
+	}
+	if !strings.Contains(err.Error(), "exceeds limit 50") {
+		t.Errorf("err = %v, want 'exceeds limit 50'", err)
+	}
+}
+
+func TestDecryptMetadataInvalidToken(t *testing.T) {
+	v := newTestVault(t)
+	srv := NewVaultGRPC(v)
+	_, err := srv.DecryptMetadata(context.Background(), &pb.DecryptMetadataRequest{
+		Token:                 "evt_ffffffffffffffffffffffffffffffff",
+		EncryptedMetadataList: []string{`{"a":"x","c":"y"}`},
+	})
+	if status.Code(err) != codes.Unauthenticated {
+		t.Errorf("code = %v, want Unauthenticated", status.Code(err))
+	}
+}
+
+func TestDecryptMetadataMalformedEnvelope(t *testing.T) {
+	v := newTestVault(t)
+	srv := NewVaultGRPC(v)
+	resp, err := srv.DecryptMetadata(context.Background(), &pb.DecryptMetadataRequest{
+		Token:                 tokens.DemoToken,
+		EncryptedMetadataList: []string{"not-json"},
+	})
+	if err != nil {
+		t.Fatalf("unexpected err: %v", err)
+	}
+	if !strings.Contains(resp.GetError(), "Metadata decryption failed") {
+		t.Errorf("error = %q, want 'Metadata decryption failed'", resp.GetError())
+	}
+}
+
+// Round-trip: encrypt with crypto helpers, decrypt via gRPC handler.
+// This exercises the handler against valid input without needing the FHE
+// secret key.
+func TestDecryptMetadataRoundTrip(t *testing.T) {
+	v := newTestVault(t)
+	srv := NewVaultGRPC(v)
+
+	// Encrypt "hello" with an HKDF DEK derived from the team secret.
+	agentID := "test-agent"
+	plain := "hello"
+	dek := mustDEK(t, "test-secret", agentID)
+	ct := mustEncrypt(t, []byte(plain), dek)
+	envelope := `{"a":"` + agentID + `","c":"` + ct + `"}`
+
+	resp, err := srv.DecryptMetadata(context.Background(), &pb.DecryptMetadataRequest{
+		Token:                 tokens.DemoToken,
+		EncryptedMetadataList: []string{envelope},
+	})
+	if err != nil {
+		t.Fatal(err)
+	}
+	if resp.GetError() != "" {
+		t.Fatalf("response error: %s", resp.GetError())
+	}
+	got := resp.GetDecryptedMetadata()
+	if len(got) != 1 || got[0] != plain {
+		t.Errorf("decrypted = %v, want [%q]", got, plain)
+	}
+}
diff --git a/vault/internal/server/helpers_test.go b/vault/internal/server/helpers_test.go
new file mode 100644
index 0000000..2cfbc7a
--- /dev/null
+++ b/vault/internal/server/helpers_test.go
@@ -0,0 +1,25 @@
+package server
+
+import (
+	"testing"
+
+	"github.com/CryptoLabInc/rune-admin/vault/internal/crypto"
+)
+
+func mustDEK(t *testing.T, secret, agentID string) []byte {
+	t.Helper()
+	d, err := crypto.DeriveAgentKey(secret, agentID)
+	if err != nil {
+		t.Fatal(err)
+	}
+	return d
+}
+
+func mustEncrypt(t *testing.T, plaintext, key []byte) string {
+	t.Helper()
+	ct, err := crypto.EncryptMetadata(plaintext, key)
+	if err != nil {
+		t.Fatal(err)
+	}
+	return ct
+}
diff --git a/vault/internal/server/interceptors.go b/vault/internal/server/interceptors.go
new file mode 100644
index 0000000..eea9c7c
--- /dev/null
+++ b/vault/internal/server/interceptors.go
@@ -0,0 +1,85 @@
+package server
+
+import (
+	"context"
+	"errors"
+	"fmt"
+	"strings"
+	"unicode"
+
+	"buf.build/go/protovalidate"
+	"google.golang.org/grpc"
+	"google.golang.org/grpc/codes"
+	"google.golang.org/grpc/status"
+	"google.golang.org/protobuf/proto"
+
+	pb "github.com/CryptoLabInc/rune-admin/vault/pkg/vaultpb"
+)
+
+// vaultMethods enumerates the gRPC method paths owned by VaultService.
+// Other services routed through the same gRPC server bypass runtime checks.
+var vaultMethods = map[string]bool{
+	"/rune.vault.v1.VaultService/GetPublicKey":    true,
+	"/rune.vault.v1.VaultService/DecryptScores":   true,
+	"/rune.vault.v1.VaultService/DecryptMetadata": true,
+}
+
+// NewValidationInterceptor returns a unary server interceptor that runs
+// protovalidate against the request, then a runtime safety check on the
+// token field. Validation errors are returned as InvalidArgument.
+//
+// Mirrors vault/validation_interceptor.py and vault/request_validator.py.
+func NewValidationInterceptor() (grpc.UnaryServerInterceptor, error) {
+	v, err := protovalidate.New()
+	if err != nil {
+		return nil, fmt.Errorf("interceptors: new protovalidate: %w", err)
+	}
+	return func(ctx context.Context, req any, info *grpc.UnaryServerInfo, handler grpc.UnaryHandler) (any, error) {
+		msg, ok := req.(proto.Message)
+		if ok {
+			if err := v.Validate(msg); err != nil {
+				return nil, status.Error(codes.InvalidArgument, err.Error())
+			}
+		}
+		if vaultMethods[info.FullMethod] {
+			if err := runtimeCheckToken(req); err != nil {
+				return nil, status.Error(codes.InvalidArgument, err.Error())
+			}
+		}
+		return handler(ctx, req)
+	}, nil
+}
+
+// runtimeCheckToken pulls the token field from a Vault request and runs
+// the supplementary checks the .proto annotations cannot express.
+func runtimeCheckToken(req any) error {
+	var token string
+	switch r := req.(type) {
+	case *pb.GetPublicKeyRequest:
+		token = r.GetToken()
+	case *pb.DecryptScoresRequest:
+		token = r.GetToken()
+	case *pb.DecryptMetadataRequest:
+		token = r.GetToken()
+	default:
+		return nil
+	}
+	return CheckTokenSafety(token)
+}
+
+// CheckTokenSafety rejects tokens with control characters or surrounding
+// whitespace. Exposed so unit tests can exercise the rule directly.
+func CheckTokenSafety(token string) error {
+	for _, r := range token {
+		if r < 0x20 || r == 0x7f {
+			return errors.New("token: must not contain control characters")
+		}
+		if unicode.IsControl(r) {
+			return errors.New("token: must not contain control characters")
+		}
+	}
+	if token != strings.TrimSpace(token) {
+		return errors.New("token: must not have leading or trailing whitespace")
+	}
+	return nil
+}
diff --git a/vault/internal/server/interceptors_test.go b/vault/internal/server/interceptors_test.go
new file mode 100644
index 0000000..4d66d66
--- /dev/null
+++ b/vault/internal/server/interceptors_test.go
@@ -0,0 +1,105 @@
+package server
+
+import (
+	"context"
+	"strings"
+	"testing"
+
+	"google.golang.org/grpc"
+	"google.golang.org/grpc/codes"
+	"google.golang.org/grpc/status"
+
+	pb "github.com/CryptoLabInc/rune-admin/vault/pkg/vaultpb"
+)
+
+func TestCheckTokenSafetyAccepts(t *testing.T) {
+	if err := CheckTokenSafety("evt_0123456789abcdef0123456789abcdef"); err != nil {
+		t.Errorf("good token rejected: %v", err)
+	}
+}
+
+func TestCheckTokenSafetyRejectsControlChar(t *testing.T) {
+	for _, bad := range []string{"\x00token", "tok\x01en", "tok\x1fen", "tok\x7fen"} {
+		if err := CheckTokenSafety(bad); err == nil {
+			t.Errorf("control char accepted: %q", bad)
+		}
+	}
+}
+
+func TestCheckTokenSafetyRejectsWhitespace(t *testing.T) {
+	for _, bad := range []string{" token", "token ", "\ttoken", "token\n"} {
+		if err := CheckTokenSafety(bad); err == nil {
+			t.Errorf("whitespace accepted: %q", bad)
+		}
+	}
+}
+
+// noopHandler is a grpc.UnaryHandler that returns the request unchanged.
+func noopHandler(_ context.Context, req any) (any, error) { return req, nil }
+
+func mustInterceptor(t *testing.T) grpc.UnaryServerInterceptor {
+	t.Helper()
+	ic, err := NewValidationInterceptor()
+	if err != nil {
+		t.Fatal(err)
+	}
+	return ic
+}
+
+func vaultMethodInfo(name string) *grpc.UnaryServerInfo {
+	return &grpc.UnaryServerInfo{FullMethod: "/rune.vault.v1.VaultService/" + name}
+}
+
+func TestInterceptorPassesValidRequest(t *testing.T) {
+	ic := mustInterceptor(t)
+	req := &pb.GetPublicKeyRequest{Token: "evt_0123456789abcdef0123456789abcdef"}
+	out, err := ic(context.Background(), req, vaultMethodInfo("GetPublicKey"), noopHandler)
+	if err != nil {
+		t.Fatalf("err = %v, want nil", err)
+	}
+	if out != req {
+		t.Errorf("interceptor mutated request")
+	}
+}
+
+func TestInterceptorRejectsBadProtovalidate(t *testing.T) {
+	ic := mustInterceptor(t)
+	// Token shorter than 36 fails the proto-level constraint.
+	req := &pb.GetPublicKeyRequest{Token: "too_short"}
+	_, err := ic(context.Background(), req, vaultMethodInfo("GetPublicKey"), noopHandler)
+	if err == nil {
+		t.Fatal("err = nil, want validation error")
+	}
+	if status.Code(err) != codes.InvalidArgument {
+		t.Errorf("code = %v, want InvalidArgument", status.Code(err))
+	}
+}
+
+func TestInterceptorRejectsControlCharToken(t *testing.T) {
+	ic := mustInterceptor(t)
+	// 36-char token containing a control byte (\x00) inside.
+	// protovalidate only checks length, so the runtime layer catches this.
+	req := &pb.GetPublicKeyRequest{Token: "evt_0123456789abcdef0123456789abc\x00ef"}
+	if len(req.Token) != 36 {
+		t.Fatalf("test setup: token length = %d, want 36", len(req.Token))
+	}
+	_, err := ic(context.Background(), req, vaultMethodInfo("GetPublicKey"), noopHandler)
+	if err == nil {
+		t.Fatal("err = nil, want runtime error")
+	}
+	if !strings.Contains(err.Error(), "control") {
+		t.Errorf("err = %v, want 'control characters' message", err)
+	}
+}
+
+func TestInterceptorAllowsNonVaultMethod(t *testing.T) {
+	ic := mustInterceptor(t)
+	// Whitespace-around token would normally fail runtime check, but
+	// non-Vault methods skip runtime checks (and the proto for this
+	// dummy message doesn't apply).
+	req := &pb.GetPublicKeyRequest{Token: "evt_0123456789abcdef0123456789abcdef"}
+	info := &grpc.UnaryServerInfo{FullMethod: "/grpc.health.v1.Health/Check"}
+	if _, err := ic(context.Background(), req, info, noopHandler); err != nil {
+		t.Errorf("non-vault method blocked: %v", err)
+	}
+}
diff --git a/vault/internal/tests/decrypt_pipeline_test.go b/vault/internal/tests/decrypt_pipeline_test.go
new file mode 100644
index 0000000..7310e32
--- /dev/null
+++ b/vault/internal/tests/decrypt_pipeline_test.go
@@ -0,0 +1,316 @@
+package tests
+
+import (
+	"context"
+	"encoding/json"
+	"math"
+	"os"
+	"path/filepath"
+	"sort"
+	"strings"
+	"testing"
+
+	"github.com/CryptoLabInc/rune-admin/vault/internal/crypto"
+	"github.com/CryptoLabInc/rune-admin/vault/internal/server"
+	"github.com/CryptoLabInc/rune-admin/vault/internal/tokens"
+	pb "github.com/CryptoLabInc/rune-admin/vault/pkg/vaultpb"
+)
+
+type fixtureBundle struct {
+	Config    fixtureConfig
+	Envelope  []string
+	Expected  []any // any: JSON object/array/string per envelope
+	ScoresB64 string
+	ScoreExp  fixtureScoreExpected
+	KeysDir   string
+}
+
+type fixtureConfig struct {
+	TeamSecret string `json:"team_secret"`
+	AgentID    string `json:"agent_id"`
+	Token      string `json:"token"`
+	Dim        int    `json:"dim"`
+}
+
+type fixtureScoreExpected struct {
+	Score    [][]float64 `json:"score"`
+	ShardIdx []int32     `json:"shard_idx"`
+}
+
+func loadFixtures(t *testing.T) *fixtureBundle {
+	t.Helper()
+	if !FixturesAvailable() {
+		t.Skip(SkipReason)
+	}
+	dir := FixturesDir()
+
+	var fb fixtureBundle
+	mustJSON(t, filepath.Join(dir, "config.json"), &fb.Config)
+	scoresExp := mustReadFile(t, filepath.Join(dir, "expected_scores.json"))
+	if err := json.Unmarshal(scoresExp, &fb.ScoreExp); err != nil {
+		t.Fatal(err)
+	}
+	fb.ScoresB64 = strings.TrimSpace(string(mustReadFile(t, filepath.Join(dir, "ciphertext_score.b64"))))
+	mustJSON(t, filepath.Join(dir, "metadata_envelopes.json"), &fb.Envelope)
+	mustJSON(t, filepath.Join(dir, "expected_metadata.json"), &fb.Expected)
+	fb.KeysDir = filepath.Join(dir, "keys")
+	return &fb
+}
+
+func mustJSON(t *testing.T, path string, dst any) {
+	t.Helper()
+	body := mustReadFile(t, path)
+	if err := json.Unmarshal(body, dst); err != nil {
+		t.Fatalf("parse %s: %v", path, err)
+	}
+}
+
+func mustReadFile(t *testing.T, path string) []byte {
+	t.Helper()
+	b, err := os.ReadFile(path)
+	if err != nil {
+		t.Fatalf("read %s: %v", path, err)
+	}
+	return b
+}
+
+// fixtureVault wires a Vault around the decrypted fixture bundle.
+// keys.path points at the temp dir copy of fixture keys so envector-go-sdk
+// can stage the bundle without touching the read-only fixture tree.
+func fixtureVault(t *testing.T, fb *fixtureBundle) *server.Vault {
+	t.Helper()
+	keyDir := t.TempDir()
+	for _, name := range []string{"EncKey.json", "EvalKey.json", "SecKey.json"} {
+		src := filepath.Join(fb.KeysDir, name)
+		if _, err := os.Stat(src); err != nil {
+			t.Skipf("fixture key %s missing: %v", name, err)
+		}
+		body, _ := os.ReadFile(src)
+		if err := os.WriteFile(filepath.Join(keyDir, name), body, 0o600); err != nil {
+			t.Fatal(err)
+		}
+	}
+	// envector.OpenKeysFromFile expects WithKeyPath = directory containing
+	// the JSON envelopes; use keyDir directly + KeyID = "vault-key" so the
+	// joined path matches.
+	keysParams := crypto.KeysParams{Root: filepath.Dir(keyDir), KeyID: filepath.Base(keyDir), Dim: fb.Config.Dim}
+	keys, err := crypto.OpenSecretKey(keysParams)
+	if err != nil {
+		t.Fatalf("OpenSecretKey: %v", err)
+	}
+	t.Cleanup(func() { keys.Close() })
+
+	cfg := &server.Config{
+		Tokens: server.TokensConfig{TeamSecret: fb.Config.TeamSecret},
+		Keys:   server.KeysConfig{Path: filepath.Dir(keyDir), EmbeddingDim: fb.Config.Dim},
+	}
+	store := tokens.NewStore()
+	store.LoadDefaultsWithDemoToken()
+	// Replace the demo token with the fixture's token so the test can
+	// authenticate without re-keying every envelope.
+	if fb.Config.Token != "" && fb.Config.Token != tokens.DemoToken {
+		// Inject manually via a minimal hack: load defaults then add user.
+		_, _ = store.AddRole("fixture", []string{"get_public_key", "decrypt_scores", "decrypt_metadata"}, 1000, "10000/60s")
+		// AddToken would generate a new token; we need the fixture's exact
+		// token string. The store has no public "InsertToken" — for tests
+		// we resort to LoadFromFiles via tempfiles.
+		injectFixtureToken(t, store, fb.Config.Token)
+	}
+	audit, _ := server.NewAuditLogger(server.AuditConfig{Mode: ""})
+	return server.NewVault(cfg, store, keys, audit)
+}
+
+func injectFixtureToken(t *testing.T, store *tokens.Store, token string) {
+	t.Helper()
+	dir := t.TempDir()
+	rolesPath := filepath.Join(dir, "roles.yml")
+	tokensPath := filepath.Join(dir, "tokens.yml")
+	if err := os.WriteFile(rolesPath, []byte(`roles:
+  fixture:
+    scope: [get_public_key, decrypt_scores, decrypt_metadata]
+    top_k: 1000
+    rate_limit: 10000/60s
+`), 0o600); err != nil {
+		t.Fatal(err)
+	}
+	if err := os.WriteFile(tokensPath, []byte(`tokens:
+  - user: fixture
+    token: `+token+`
+    role: fixture
+    issued_at: "2026-01-01"
+`), 0o600); err != nil {
+		t.Fatal(err)
+	}
+	if err := store.LoadFromFiles(rolesPath, tokensPath); err != nil {
+		t.Fatal(err)
+	}
+}
+
+// ── decrypt_scores via gRPC handler ───────────────────────────────
+
+func TestDecryptScoresAgainstFixture(t *testing.T) {
+	fb := loadFixtures(t)
+	v := fixtureVault(t, fb)
+	srv := server.NewVaultGRPC(v)
+
+	totalScores := 0
+	for _, row := range fb.ScoreExp.Score {
+		totalScores += len(row)
+	}
+	resp, err := srv.DecryptScores(context.Background(), &pb.DecryptScoresRequest{
+		Token:            fb.Config.Token,
+		EncryptedBlobB64: fb.ScoresB64,
+		TopK:             int32(totalScores),
+	})
+	if err != nil {
+		t.Fatal(err)
+	}
+	if resp.GetError() != "" {
+		t.Fatalf("error: %s", resp.GetError())
+	}
+
+	expectedFlat := make([]struct {
+		shard int32
+		row   int32
+		score float64
+	}, 0)
+	for i, row := range fb.ScoreExp.Score {
+		shard := int32(i)
+		if i < len(fb.ScoreExp.ShardIdx) {
+			shard = fb.ScoreExp.ShardIdx[i]
+		}
+		for j, s := range row {
+			expectedFlat = append(expectedFlat, struct {
+				shard int32
+				row   int32
+				score float64
+			}{shard, int32(j), s})
+		}
+	}
+	sort.SliceStable(expectedFlat, func(i, j int) bool {
+		return expectedFlat[i].score > expectedFlat[j].score
+	})
+
+	if len(resp.Results) != len(expectedFlat) {
+		t.Fatalf("len(results) = %d, want %d", len(resp.Results), len(expectedFlat))
+	}
+	for i, got := range resp.Results {
+		want := expectedFlat[i]
+		if got.ShardIdx != want.shard || got.RowIdx != want.row {
+			t.Errorf("[%d] shard/row = (%d,%d), want (%d,%d)", i, got.ShardIdx, got.RowIdx, want.shard, want.row)
+		}
+		if math.Abs(got.Score-want.score) > 1e-6 {
+			t.Errorf("[%d] score = %v, want %v", i, got.Score, want.score)
+		}
+	}
+}
+
+func TestDecryptScoresTopKAgainstFixture(t *testing.T) {
+	fb := loadFixtures(t)
+	v := fixtureVault(t, fb)
+	srv := server.NewVaultGRPC(v)
+
+	allScores := []float64{}
+	for _, row := range fb.ScoreExp.Score {
+		allScores = append(allScores, row...)
+	}
+	sort.Sort(sort.Reverse(sort.Float64Slice(allScores)))
+	topN := 3
+	if len(allScores) < topN {
+		topN = len(allScores)
+	}
+	resp, err := srv.DecryptScores(context.Background(), &pb.DecryptScoresRequest{
+		Token:            fb.Config.Token,
+		EncryptedBlobB64: fb.ScoresB64,
+		TopK:             int32(topN),
+	})
+	if err != nil {
+		t.Fatal(err)
+	}
+	if len(resp.Results) != topN {
+		t.Fatalf("len = %d, want %d", len(resp.Results), topN)
+	}
+	for i, got := range resp.Results {
+		if math.Abs(got.Score-allScores[i]) > 1e-6 {
+			t.Errorf("[%d] score = %v, want %v", i, got.Score, allScores[i])
+		}
+	}
+	for i := 1; i < len(resp.Results); i++ {
+		if resp.Results[i].Score > resp.Results[i-1].Score {
+			t.Errorf("results not descending at %d", i)
+		}
+	}
+}
+
+// ── decrypt_metadata via gRPC handler ─────────────────────────────
+
+func TestDecryptMetadataSingleAgainstFixture(t *testing.T) {
+	fb := loadFixtures(t)
+	v := fixtureVault(t, fb)
+	srv := server.NewVaultGRPC(v)
+
+	if len(fb.Envelope) == 0 {
+		t.Skip("no envelopes in fixture")
+	}
+	resp, err := srv.DecryptMetadata(context.Background(), &pb.DecryptMetadataRequest{
+		Token:                 fb.Config.Token,
+		EncryptedMetadataList: []string{fb.Envelope[0]},
+	})
+	if err != nil {
+		t.Fatal(err)
+	}
+	if resp.GetError() != "" {
+		t.Fatalf("error: %s", resp.GetError())
+	}
+	if len(resp.DecryptedMetadata) != 1 {
+		t.Fatalf("len = %d", len(resp.DecryptedMetadata))
+	}
+	got := decodeAny(t, resp.DecryptedMetadata[0])
+	want := fb.Expected[0]
+	if !jsonEq(got, want) {
+		t.Errorf("metadata mismatch\n got %#v\nwant %#v", got, want)
+	}
+}
+
+func TestDecryptMetadataMultipleAgainstFixture(t *testing.T) {
+	fb := loadFixtures(t)
+	v := fixtureVault(t, fb)
+	srv := server.NewVaultGRPC(v)
+
+	resp, err := srv.DecryptMetadata(context.Background(), &pb.DecryptMetadataRequest{
+		Token:                 fb.Config.Token,
+		EncryptedMetadataList: fb.Envelope,
+	})
+	if err != nil {
+		t.Fatal(err)
+	}
+	if resp.GetError() != "" {
+		t.Fatalf("error: %s", resp.GetError())
+	}
+	if len(resp.DecryptedMetadata) != len(fb.Expected) {
+		t.Fatalf("len = %d, want %d", len(resp.DecryptedMetadata), len(fb.Expected))
+	}
+	for i, raw := range resp.DecryptedMetadata {
+		got := decodeAny(t, raw)
+		if !jsonEq(got, fb.Expected[i]) {
+			t.Errorf("[%d] mismatch\n got %#v\nwant %#v", i, got, fb.Expected[i])
+		}
+	}
+}
+
+// decodeAny tries to JSON-parse a string; returns the raw string on failure.
+func decodeAny(_ *testing.T, raw string) any {
+	var v any
+	if err := json.Unmarshal([]byte(raw), &v); err == nil {
+		return v
+	}
+	return raw
+}
+
+// jsonEq compares two values by re-serialising to JSON. Handles float vs
+// int promotion that comes out of encoding/json's default decoding.
+func jsonEq(a, b any) bool {
+	ja, _ := json.Marshal(a)
+	jb, _ := json.Marshal(b)
+	return string(ja) == string(jb)
+}
diff --git a/vault/internal/tests/fixtures.go b/vault/internal/tests/fixtures.go
new file mode 100644
index 0000000..f23574d
--- /dev/null
+++ b/vault/internal/tests/fixtures.go
@@ -0,0 +1,36 @@
+// Package tests provides shared helpers and hosts cross-package end-to-end tests.
+// Integration tests require the GPG-encrypted fixtures to be decrypted into
+// tests/fixtures/ first (run `mise run fixtures:decrypt`).
+package tests
+
+import (
+	"os"
+	"path/filepath"
+	"runtime"
+)
+
+// RepoRoot returns the absolute path to the rune-admin repository root,
+// resolved relative to this source file. Works regardless of the test's
+// cwd, so tests can locate tests/fixtures/ from any subpackage.
+func RepoRoot() string {
+	_, thisFile, _, _ := runtime.Caller(0)
+	// thisFile = .../vault/internal/tests/fixtures.go → repo root is 3 levels up.
+	return filepath.Clean(filepath.Join(filepath.Dir(thisFile), "..", "..", ".."))
+}
+
+// FixturesDir returns the absolute path to tests/fixtures/.
+func FixturesDir() string {
+	return filepath.Join(RepoRoot(), "tests", "fixtures")
+}
+
+// FixturesAvailable reports whether the GPG-encrypted fixtures have been
+// decrypted into tests/fixtures/. Use as a guard in TestMain or as the
+// condition for t.Skip in integration tests.
+func FixturesAvailable() bool {
+	_, err := os.Stat(filepath.Join(FixturesDir(), "config.json"))
+	return err == nil
+}
+
+// SkipReason returns the standard skip message for tests that require
+// decrypted fixtures.
+const SkipReason = "fixtures not decrypted — run `mise run fixtures:decrypt` (requires FIXTURES_GPG_PASSPHRASE)"
diff --git a/vault/internal/tokens/errors.go b/vault/internal/tokens/errors.go
new file mode 100644
index 0000000..ba464a0
--- /dev/null
+++ b/vault/internal/tokens/errors.go
@@ -0,0 +1,43 @@
+package tokens
+
+import "fmt"
+
+type ErrTokenNotFound struct{}
+
+func (ErrTokenNotFound) Error() string { return "Invalid authentication token" }
+
+type ErrTokenExpired struct {
+	User string
+}
+
+func (e ErrTokenExpired) Error() string {
+	return fmt.Sprintf("Token expired for user '%s'", e.User)
+}
+
+type ErrRateLimit struct {
+	RetryAfter int
+}
+
+func (e ErrRateLimit) Error() string {
+	return fmt.Sprintf("Rate limit exceeded. Retry after %ds", e.RetryAfter)
+}
+
+type ErrTopKExceeded struct {
+	Requested int
+	MaxTopK   int
+	RoleName  string
+}
+
+func (e ErrTopKExceeded) Error() string {
+	return fmt.Sprintf("top_k %d exceeds limit %d for role '%s'",
+		e.Requested, e.MaxTopK, e.RoleName)
+}
+
+type ErrScope struct {
+	Method   string
+	RoleName string
+}
+
+func (e ErrScope) Error() string {
+	return fmt.Sprintf("Method '%s' not permitted for role '%s'", e.Method, e.RoleName)
+}
diff --git a/vault/internal/tokens/ratelimit.go b/vault/internal/tokens/ratelimit.go
new file mode 100644
index 0000000..bf0d15d
--- /dev/null
+++ b/vault/internal/tokens/ratelimit.go
@@ -0,0 +1,72 @@
+package tokens
+
+import (
+	"sync"
+	"time"
+)
+
+type RateLimiter struct {
+	maxRequests int
+	window      time.Duration
+	now         func() time.Time
+
+	mu       sync.Mutex
+	requests map[string][]time.Time
+}
+
+func NewRateLimiter(maxRequests int, window time.Duration) *RateLimiter {
+	return &RateLimiter{
+		maxRequests: maxRequests,
+		window:      window,
+		now:         time.Now,
+		requests:    make(map[string][]time.Time),
+	}
+}
+
+func (rl *RateLimiter) IsAllowed(clientID string) bool {
+	now := rl.now()
+	cutoff := now.Add(-rl.window)
+
+	rl.mu.Lock()
+	defer rl.mu.Unlock()
+
+	kept := rl.requests[clientID][:0]
+	for _, t := range rl.requests[clientID] {
+		if t.After(cutoff) {
+			kept = append(kept, t)
+		}
+	}
+	if len(kept) >= rl.maxRequests {
+		rl.requests[clientID] = kept
+		return false
+	}
+	rl.requests[clientID] = append(kept, now)
+	return true
+}
+
+func (rl *RateLimiter) RetryAfter(clientID string) int {
+	rl.mu.Lock()
+	defer rl.mu.Unlock()
+
+	reqs := rl.requests[clientID]
+	if len(reqs) == 0 {
+		return 0
+	}
+	oldest := reqs[0]
+	for _, t := range reqs[1:] {
+		if t.Before(oldest) {
+			oldest = t
+		}
+	}
+	remaining := rl.window - rl.now().Sub(oldest)
+	if remaining < 0 {
+		return 0
+	}
+	return int(remaining.Seconds())
+}
+
+func (rl *RateLimiter) Remove(clientID string) {
+	rl.mu.Lock()
+	defer rl.mu.Unlock()
+	delete(rl.requests, clientID)
+}
diff --git a/vault/internal/tokens/ratelimit_test.go b/vault/internal/tokens/ratelimit_test.go
new file mode 100644
index 0000000..7d607bd
--- /dev/null
+++ b/vault/internal/tokens/ratelimit_test.go
@@ -0,0 +1,88 @@
+package tokens
+
+import (
+	"sync"
+	"testing"
+	"time"
+)
+
+func TestRateLimiterAllowsUnderLimit(t *testing.T) {
+	rl := NewRateLimiter(3, time.Minute)
+	for i := 0; i < 3; i++ {
+		if !rl.IsAllowed("u") {
+			t.Fatalf("request %d denied, want allowed", i+1)
+		}
+	}
+}
+
+func TestRateLimiterDeniesOverLimit(t *testing.T) {
+	rl := NewRateLimiter(2, time.Minute)
+	rl.IsAllowed("u")
+	rl.IsAllowed("u")
+	if rl.IsAllowed("u") {
+		t.Error("3rd request allowed, want denied")
+	}
+}
+
+func TestRateLimiterPerClient(t *testing.T) {
+	rl := NewRateLimiter(1, time.Minute)
+	if !rl.IsAllowed("a") {
+		t.Fatal("a denied")
+	}
+	if !rl.IsAllowed("b") {
+		t.Fatal("b denied — should be tracked separately")
+	}
+	if rl.IsAllowed("a") {
+		t.Error("a 2nd request allowed, want denied")
+	}
+}
+
+func TestRateLimiterRetryAfter(t *testing.T) {
+	rl := NewRateLimiter(1, 10*time.Second)
+	now := time.Date(2026, 4, 23, 0, 0, 0, 0, time.UTC)
+	rl.now = func() time.Time { return now }
+	rl.IsAllowed("u")
+	rl.now = func() time.Time { return now.Add(3 * time.Second) }
+	got := rl.RetryAfter("u")
+	if got < 6 || got > 7 {
+		t.Errorf("RetryAfter = %d, want ~7", got)
+	}
+}
+
+func TestRateLimiterRemove(t *testing.T) {
+	rl := NewRateLimiter(1, time.Minute)
+	rl.IsAllowed("u")
+	rl.Remove("u")
+	if !rl.IsAllowed("u") {
+		t.Error("after Remove, request should be allowed again")
+	}
+}
+
+func TestRateLimiterConcurrent(t *testing.T) {
+	rl := NewRateLimiter(100, time.Minute)
+	var wg sync.WaitGroup
+	for i := 0; i < 50; i++ {
+		wg.Add(1)
+		go func() {
+			defer wg.Done()
+			rl.IsAllowed("u")
+		}()
+	}
+	wg.Wait()
+}
+
+func TestRateLimiterWindowEvicts(t *testing.T) {
+	rl := NewRateLimiter(1, 5*time.Second)
+	now := time.Date(2026, 4, 23, 0, 0, 0, 0, time.UTC)
+	rl.now = func() time.Time { return now }
+	if !rl.IsAllowed("u") {
+		t.Fatal("first denied")
+	}
+	if rl.IsAllowed("u") {
+		t.Fatal("second allowed inside window")
+	}
+	rl.now = func() time.Time { return now.Add(6 * time.Second) }
+	if !rl.IsAllowed("u") {
+		t.Error("after window, request should be allowed")
+	}
+}
diff --git a/vault/internal/tokens/role.go b/vault/internal/tokens/role.go
new file mode 100644
index 0000000..52ea586
--- /dev/null
+++ b/vault/internal/tokens/role.go
@@ -0,0 +1,66 @@
+package tokens
+
+import (
+	"fmt"
+	"regexp"
+	"strconv"
+	"time"
+)
+
+type Role struct {
+	Name      string   `yaml:"-"`
+	Scope     []string `yaml:"scope"`
+	TopK      int      `yaml:"top_k"`
+	RateLimit string   `yaml:"rate_limit"`
+}
+
+var rateLimitRE = regexp.MustCompile(`^(\d+)/(\d+)s$`)
+
+func (r *Role) RateLimitParsed() (max int, window time.Duration, err error) {
+	m := rateLimitRE.FindStringSubmatch(r.RateLimit)
+	if m == nil {
+		return 0, 0, fmt.Errorf("invalid rate_limit format %q (expected '<max>/<window>s')", r.RateLimit)
+	}
+	maxReq, _ := strconv.Atoi(m[1])
+	winSec, _ := strconv.Atoi(m[2])
+	return maxReq, time.Duration(winSec) * time.Second, nil
+}
+
+func (r *Role) CheckScope(method string) error {
+	for _, s := range r.Scope {
+		if s == method {
+			return nil
+		}
+	}
+	return ErrScope{Method: method, RoleName: r.Name}
+}
+
+func validateRateLimit(s string) error {
+	if !rateLimitRE.MatchString(s) {
+		return fmt.Errorf("invalid rate_limit format %q (expected '<max>/<window>s')", s)
+	}
+	return nil
+}
+
+const DemoToken = "evt_0000000000000000000000000000demo"
+
+func DefaultRoles() map[string]*Role {
+	return map[string]*Role{
+		"admin": {
+			Name:      "admin",
+			Scope:     []string{"get_public_key", "decrypt_scores", "decrypt_metadata", "manage_tokens"},
+			TopK:      50,
+			RateLimit: "150/60s",
+		},
+		"member": {
+			Name:      "member",
+			Scope:     []string{"get_public_key", "decrypt_scores", "decrypt_metadata"},
+			TopK:      10,
+			RateLimit: "30/60s",
+		},
+	}
+}
+
+func isDefaultRoleName(name string) bool {
+	return name == "admin" || name == "member"
+}
diff --git a/vault/internal/tokens/store.go b/vault/internal/tokens/store.go
new file mode 100644
index 0000000..9f90ecf
--- /dev/null
+++ b/vault/internal/tokens/store.go
@@ -0,0 +1,612 @@
+package tokens
+
+import (
+	"crypto/rand"
+	"encoding/hex"
+	"fmt"
+	"os"
+	"path/filepath"
+	"sort"
+	"sync"
+	"time"
+
+	"gopkg.in/yaml.v3"
+)
+
+const persistDebounce = 100 * time.Millisecond
+
+type Store struct {
+	mu           sync.RWMutex
+	tokens       map[string]*Token // keyed by token string
+	tokensByUser map[string]*Token // keyed by username
+	roles        map[string]*Role
+	rateLimiters map[string]*RateLimiter // keyed by username
+	rolesPath    string
+	tokensPath   string
+
+	now func() time.Time
+
+	persistMu     sync.Mutex
+	persistTimer  *time.Timer
+	persistWG     sync.WaitGroup
+	persistClosed bool
+}
+
+func NewStore() *Store {
+	return &Store{
+		tokens:       make(map[string]*Token),
+		tokensByUser: make(map[string]*Token),
+		roles:        make(map[string]*Role),
+		rateLimiters: make(map[string]*RateLimiter),
+		now:          func() time.Time { return time.Now().UTC() },
+	}
+}
+
+// LoadFromFiles reads roles and tokens from YAML at startup.
+// Missing files cause defaults to be loaded and an immediate persist scheduled.
+func (s *Store) LoadFromFiles(rolesPath, tokensPath string) error {
+	s.mu.Lock()
+	s.rolesPath = rolesPath
+	s.tokensPath = tokensPath
+
+	// Roles
+	if data, err := os.ReadFile(rolesPath); err == nil {
+		var doc struct {
+			Roles map[string]struct {
+				Scope     []string `yaml:"scope"`
+				TopK      int      `yaml:"top_k"`
+				RateLimit string   `yaml:"rate_limit"`
+			} `yaml:"roles"`
+		}
+		if err := yaml.Unmarshal(data, &doc); err != nil {
+			s.mu.Unlock()
+			return fmt.Errorf("parse roles file %s: %w", rolesPath, err)
+		}
+		for name, cfg := range doc.Roles {
+			topK := cfg.TopK
+			if topK == 0 {
+				topK = 5
+			}
+			rl := cfg.RateLimit
+			if rl == "" {
+				rl = "30/60s"
+			}
+			s.roles[name] = &Role{Name: name, Scope: cfg.Scope, TopK: topK, RateLimit: rl}
+		}
+	} else if !os.IsNotExist(err) {
+		s.mu.Unlock()
+		return fmt.Errorf("read roles file %s: %w", rolesPath, err)
+	} else {
+		for name, role := range DefaultRoles() {
+			s.roles[name] = role
+		}
+	}
+	for name, role := range DefaultRoles() {
+		if _, ok := s.roles[name]; !ok {
+			s.roles[name] = role
+		}
+	}
+
+	// Tokens
+	rolesMissing := false
+	if _, err := os.Stat(rolesPath); os.IsNotExist(err) {
+		rolesMissing = true
+	}
+	tokensMissing := false
+	if data, err := os.ReadFile(tokensPath); err == nil {
+		var doc struct {
+			Tokens []struct {
+				User     string `yaml:"user"`
+				Token    string `yaml:"token"`
+				Role     string `yaml:"role"`
+				IssuedAt string `yaml:"issued_at"`
+				Created  string `yaml:"created"`
+				Expires  string `yaml:"expires"`
+			} `yaml:"tokens"`
+		}
+		if err := yaml.Unmarshal(data, &doc); err != nil {
+			s.mu.Unlock()
+			return fmt.Errorf("parse tokens file %s: %w", tokensPath, err)
+		}
+		for _, e := range doc.Tokens {
+			issued := e.IssuedAt
+			if issued == "" {
+				issued = e.Created
+			}
+			tok := &Token{
+				User:     e.User,
+				Token:    e.Token,
+				Role:     e.Role,
+				IssuedAt: issued,
+				Expires:  e.Expires,
+			}
+			s.tokens[tok.Token] = tok
+			s.tokensByUser[tok.User] = tok
+		}
+	} else if !os.IsNotExist(err) {
+		s.mu.Unlock()
+		return fmt.Errorf("read tokens file %s: %w", tokensPath, err)
+	} else {
+		tokensMissing = true
+	}
+	s.mu.Unlock()
+
+	if rolesMissing || tokensMissing {
+		s.schedulePersist()
+	}
+	return nil
+}
+
+// LoadDefaultsWithDemoToken seeds the store with default roles and the demo token.
+// Useful for dev/CI bootstraps that don't ship persisted state.
+func (s *Store) LoadDefaultsWithDemoToken() {
+	s.mu.Lock()
+	defer s.mu.Unlock()
+	for name, role := range DefaultRoles() {
+		s.roles[name] = role
+	}
+	tok := &Token{
+		User:     "demo",
+		Token:    DemoToken,
+		Role:     "admin",
+		IssuedAt: s.now().Format(dateFormat),
+	}
+	s.tokens[tok.Token] = tok
+	s.tokensByUser[tok.User] = tok
+}
+
+func (s *Store) Validate(tokenStr string) (string, *Role, error) {
+	s.mu.Lock()
+	tok, ok := s.tokens[tokenStr]
+	if !ok {
+		s.mu.Unlock()
+		return "", nil, ErrTokenNotFound{}
+	}
+	if tok.IsExpiredAt(s.now()) {
+		user := tok.User
+		s.mu.Unlock()
+		return "", nil, ErrTokenExpired{User: user}
+	}
+	role, ok := s.roles[tok.Role]
+	if !ok {
+		s.mu.Unlock()
+		return "", nil, ErrTokenNotFound{}
+	}
+	limiter, err := s.getOrCreateLimiterLocked(tok.User, role)
+	s.mu.Unlock()
+	if err != nil {
+		return "", nil, err
+	}
+	if !limiter.IsAllowed(tok.User) {
+		return "", nil, ErrRateLimit{RetryAfter: limiter.RetryAfter(tok.User)}
+	}
+	return tok.User, role, nil
+}
+
+func (s *Store) GetUsername(tokenStr string) string {
+	s.mu.RLock()
+	defer s.mu.RUnlock()
+	if tok, ok := s.tokens[tokenStr]; ok {
+		return tok.User
+	}
+	return ""
+}
+
+func (s *Store) getOrCreateLimiterLocked(user string, role *Role) (*RateLimiter, error) {
+	if l, ok := s.rateLimiters[user]; ok {
+		return l, nil
+	}
+	maxReq, window, err := role.RateLimitParsed()
+	if err != nil {
+		return nil, err
+	}
+	l := NewRateLimiter(maxReq, window)
+	s.rateLimiters[user] = l
+	return l, nil
+}
+
+func (s *Store) AddToken(user, roleName string, expiresDays *int) (*Token, error) {
+	s.mu.Lock()
+	if _, ok := s.roles[roleName]; !ok {
+		s.mu.Unlock()
+		return nil, fmt.Errorf("role '%s' does not exist", roleName)
+	}
+	if _, ok := s.tokensByUser[user]; ok {
+		s.mu.Unlock()
+		return nil, fmt.Errorf("token already exists for user '%s'", user)
+	}
+	tokStr, err := newTokenString()
+	if err != nil {
+		s.mu.Unlock()
+		return nil, err
+	}
+	today := s.now()
+	tok := &Token{
+		User:     user,
+		Token:    tokStr,
+		Role:     roleName,
+		IssuedAt: today.Format(dateFormat),
+		Expires:  expiryDate(today, expiresDays),
+	}
+	s.tokens[tok.Token] = tok
+	s.tokensByUser[tok.User] = tok
+	s.mu.Unlock()
+	s.schedulePersist()
+	return tok, nil
+}
+
+func (s *Store) RevokeToken(user string) bool {
+	s.mu.Lock()
+	tok, ok := s.tokensByUser[user]
+	if !ok {
+		s.mu.Unlock()
+		return false
+	}
+	delete(s.tokensByUser, user)
+	delete(s.tokens, tok.Token)
+	if l, ok := s.rateLimiters[user]; ok {
+		delete(s.rateLimiters, user)
+		l.Remove(user)
+	}
+	s.mu.Unlock()
+	s.schedulePersist()
+	return true
+}
+
+func (s *Store) RotateToken(user string) (*Token, error) {
+	s.mu.Lock()
+	old, ok := s.tokensByUser[user]
+	if !ok {
+		s.mu.Unlock()
+		return nil, fmt.Errorf("no token found for user '%s'", user)
+	}
+	var expiresDays *int
+	if old.Expires != "" {
+		issued, errIss := time.Parse(dateFormat, old.IssuedAt)
+		exp, errExp := time.Parse(dateFormat, old.Expires)
+		if errIss == nil && errExp == nil {
+			d := int(exp.Sub(issued).Hours() / 24)
+			expiresDays = &d
+		}
+	}
+	delete(s.tokens, old.Token)
+	delete(s.tokensByUser, user)
+	if l, ok := s.rateLimiters[user]; ok {
+		delete(s.rateLimiters, user)
+		l.Remove(user)
+	}
+	tokStr, err := newTokenString()
+	if err != nil {
+		s.mu.Unlock()
+		return nil, err
+	}
+	today := s.now()
+	newTok := &Token{
+		User:     user,
+		Token:    tokStr,
+		Role:     old.Role,
+		IssuedAt: today.Format(dateFormat),
+		Expires:  expiryDate(today, expiresDays),
+	}
+	s.tokens[newTok.Token] = newTok
+	s.tokensByUser[user] = newTok
+	s.mu.Unlock()
+	s.schedulePersist()
+	return newTok, nil
+}
+
+func (s *Store) RotateAllTokens() ([]*Token, error) {
+	s.mu.RLock()
+	users := make([]string, 0, len(s.tokensByUser))
+	for u := range s.tokensByUser {
+		users = append(users, u)
+	}
+	s.mu.RUnlock()
+	sort.Strings(users)
+
+	result := make([]*Token, 0, len(users))
+	for _, u := range users {
+		tok, err := s.RotateToken(u)
+		if err != nil {
+			return result, err
+		}
+		result = append(result, tok)
+	}
+	return result, nil
+}
+
+type TokenInfo struct {
+	User      string `json:"user" yaml:"user"`
+	Role      string `json:"role" yaml:"role"`
+	TopK      any    `json:"top_k" yaml:"top_k"`
+	RateLimit any    `json:"rate_limit" yaml:"rate_limit"`
+	Expires   string `json:"expires" yaml:"expires"`
+}
+
+func (s *Store) ListTokens() []TokenInfo {
+	s.mu.RLock()
+	defer s.mu.RUnlock()
+
+	users := make([]string, 0, len(s.tokensByUser))
+	for u := range s.tokensByUser {
+		users = append(users, u)
+	}
+	sort.Strings(users)
+
+	out := make([]TokenInfo, 0, len(users))
+	for _, u := range users {
+		tok := s.tokensByUser[u]
+		info := TokenInfo{User: tok.User, Role: tok.Role, Expires: "never"}
+		if tok.Expires != "" {
+			info.Expires = tok.Expires
+		}
+		if role, ok := s.roles[tok.Role]; ok {
+			info.TopK = role.TopK
+			info.RateLimit = role.RateLimit
+		} else {
+			info.TopK = "?"
+			info.RateLimit = "?"
+		}
+		out = append(out, info)
+	}
+	return out
+}
+
+type RoleInfo struct {
+	Name      string   `json:"name" yaml:"name"`
+	Scope     []string `json:"scope" yaml:"scope"`
+	TopK      int      `json:"top_k" yaml:"top_k"`
+	RateLimit string   `json:"rate_limit" yaml:"rate_limit"`
+}
+
+func (s *Store) AddRole(name string, scope []string, topK int, rateLimit string) (*Role, error) {
+	if err := validateRateLimit(rateLimit); err != nil {
+		return nil, err
+	}
+	s.mu.Lock()
+	if _, ok := s.roles[name]; ok {
+		s.mu.Unlock()
+		return nil, fmt.Errorf("role '%s' already exists", name)
+	}
+	role := &Role{Name: name, Scope: scope, TopK: topK, RateLimit: rateLimit}
+	s.roles[name] = role
+	s.mu.Unlock()
+	s.schedulePersist()
+	return role, nil
+}
+
+type UpdateRoleOpts struct {
+	Scope     *[]string
+	TopK      *int
+	RateLimit *string
+}
+
+func (s *Store) UpdateRole(name string, opts UpdateRoleOpts) (*Role, error) {
+	if opts.RateLimit != nil {
+		if err := validateRateLimit(*opts.RateLimit); err != nil {
+			return nil, err
+		}
+	}
+	s.mu.Lock()
+	role, ok := s.roles[name]
+	if !ok {
+		s.mu.Unlock()
+		return nil, fmt.Errorf("role '%s' does not exist", name)
+	}
+	if opts.Scope != nil {
+		role.Scope = *opts.Scope
+	}
+	if opts.TopK != nil {
+		role.TopK = *opts.TopK
+	}
+	if opts.RateLimit != nil {
+		role.RateLimit = *opts.RateLimit
+		for _, tok := range s.tokensByUser {
+			if tok.Role == name {
+				delete(s.rateLimiters, tok.User)
+			}
+		}
+	}
+	s.mu.Unlock()
+	s.schedulePersist()
+	return role, nil
+}
+
+func (s *Store) DeleteRole(name string) error {
+	if isDefaultRoleName(name) {
+		return fmt.Errorf("Cannot delete default role '%s'", name)
+	}
+	s.mu.Lock()
+	if _, ok := s.roles[name]; !ok {
+		s.mu.Unlock()
+		return fmt.Errorf("role '%s' does not exist", name)
+	}
+	for _, tok := range s.tokensByUser {
+		if tok.Role == name {
+			s.mu.Unlock()
+			return fmt.Errorf("Cannot delete role '%s': token for user '%s' is assigned to it", name, tok.User)
+		}
+	}
+	delete(s.roles, name)
+	s.mu.Unlock()
+	s.schedulePersist()
+	return nil
+}
+
+func (s *Store) ListRoles() []RoleInfo {
+	s.mu.RLock()
+	defer s.mu.RUnlock()
+	names := make([]string, 0, len(s.roles))
+	for n := range s.roles {
+		names = append(names, n)
+	}
+	sort.Strings(names)
+	out := make([]RoleInfo, 0, len(names))
+	for _, n := range names {
+		r := s.roles[n]
+		scope := append([]string(nil), r.Scope...)
+		out = append(out, RoleInfo{Name: r.Name, Scope: scope, TopK: r.TopK, RateLimit: r.RateLimit})
+	}
+	return out
+}
+
+// Shutdown cancels any pending persist and waits for in-flight writes to finish.
+// Use Flush instead when you want pending changes to be written before exit.
+func (s *Store) Shutdown() {
+	s.persistMu.Lock()
+	s.persistClosed = true
+	if s.persistTimer != nil {
+		s.persistTimer.Stop()
+		s.persistTimer = nil
+	}
+	s.persistMu.Unlock()
+	s.persistWG.Wait()
+}
+
+// Flush forces any pending debounced persist to run synchronously,
+// then blocks until in-flight writes complete.
+func (s *Store) Flush() {
+	s.persistMu.Lock()
+	pending := false
+	if s.persistTimer != nil {
+		if s.persistTimer.Stop() {
+			pending = true
+		}
+		s.persistTimer = nil
+	}
+	s.persistMu.Unlock()
+	if pending {
+		s.doPersist()
+	}
+	s.persistWG.Wait()
+}
+
+func (s *Store) schedulePersist() {
+	s.persistMu.Lock()
+	defer s.persistMu.Unlock()
+	if s.persistClosed {
+		return
+	}
+	if s.rolesPath == "" || s.tokensPath == "" {
+		return
+	}
+	if s.persistTimer != nil {
+		s.persistTimer.Stop()
+	}
+	s.persistTimer = time.AfterFunc(persistDebounce, func() {
+		s.persistMu.Lock()
+		s.persistTimer = nil
+		closed := s.persistClosed
+		s.persistMu.Unlock()
+		if closed {
+			return
+		}
+		s.doPersist()
+	})
+}
+
+func (s *Store) doPersist() {
+	s.persistWG.Add(1)
+	defer s.persistWG.Done()
+
+	s.mu.RLock()
+	rolesPath := s.rolesPath
+	tokensPath := s.tokensPath
+
+	rolesDoc := struct {
+		Roles map[string]struct {
+			Scope     []string `yaml:"scope"`
+			TopK      int      `yaml:"top_k"`
+			RateLimit string   `yaml:"rate_limit"`
+		} `yaml:"roles"`
+	}{Roles: make(map[string]struct {
+		Scope     []string `yaml:"scope"`
+		TopK      int      `yaml:"top_k"`
+		RateLimit string   `yaml:"rate_limit"`
+	})}
+	for n, r := range s.roles {
+		rolesDoc.Roles[n] = struct {
+			Scope     []string `yaml:"scope"`
+			TopK      int      `yaml:"top_k"`
+			RateLimit string   `yaml:"rate_limit"`
+		}{Scope: append([]string(nil), r.Scope...), TopK: r.TopK, RateLimit: r.RateLimit}
+	}
+
+	tokensDoc := struct {
+		Tokens []map[string]string `yaml:"tokens"`
+	}{Tokens: make([]map[string]string, 0, len(s.tokensByUser))}
+	users := make([]string, 0, len(s.tokensByUser))
+	for u := range s.tokensByUser {
+		users = append(users, u)
+	}
+	sort.Strings(users)
+	for _, u := range users {
+		t := s.tokensByUser[u]
+		entry := map[string]string{
+			"user":      t.User,
+			"token":     t.Token,
+			"role":      t.Role,
+			"issued_at": t.IssuedAt,
+		}
+		if t.Expires != "" {
+			entry["expires"] = t.Expires
+		}
+		tokensDoc.Tokens = append(tokensDoc.Tokens, entry)
+	}
+	s.mu.RUnlock()
+
+	if err := atomicWriteYAML(rolesPath, rolesDoc); err != nil {
+		fmt.Fprintf(os.Stderr, "tokens: persist roles failed: %v\n", err)
+	}
+	if err := atomicWriteYAML(tokensPath, tokensDoc); err != nil {
+		fmt.Fprintf(os.Stderr, "tokens: persist tokens failed: %v\n", err)
+	}
+}
+
+func atomicWriteYAML(path string, data any) error {
+	dir := filepath.Dir(path)
+	if dir == "" {
+		dir = "."
+	}
+	if err := os.MkdirAll(dir, 0o750); err != nil {
+		return err
+	}
+	tmp, err := os.CreateTemp(dir, ".persist-*.tmp")
+	if err != nil {
+		return err
+	}
+	tmpPath := tmp.Name()
+	enc := yaml.NewEncoder(tmp)
+	enc.SetIndent(2)
+	if err := enc.Encode(data); err != nil {
+		_ = enc.Close()
+		_ = tmp.Close()
+		_ = os.Remove(tmpPath)
+		return err
+	}
+	if err := enc.Close(); err != nil {
+		_ = tmp.Close()
+		_ = os.Remove(tmpPath)
+		return err
+	}
+	if err := tmp.Close(); err != nil {
+		_ = os.Remove(tmpPath)
+		return err
+	}
+	return os.Rename(tmpPath, path)
+}
+
+func newTokenString() (string, error) {
+	b := make([]byte, 16)
+	if _, err := rand.Read(b); err != nil {
+		return "", err
+	}
+	return "evt_" + hex.EncodeToString(b), nil
+}
+
+func expiryDate(today time.Time, days *int) string {
+	if days == nil {
+		return ""
+	}
+	return today.AddDate(0, 0, *days).Format(dateFormat)
+}
diff --git a/vault/internal/tokens/store_test.go b/vault/internal/tokens/store_test.go
new file mode 100644
index 0000000..58c16eb
--- /dev/null
+++ b/vault/internal/tokens/store_test.go
@@ -0,0 +1,563 @@
+package tokens
+
+import (
+	"errors"
+	"os"
+	"path/filepath"
+	"strings"
+	"testing"
+	"time"
+)
+
+func newTestStore(t *testing.T) *Store {
+	t.Helper()
+	s := NewStore()
+	for n, r := range DefaultRoles() {
+		s.roles[n] = r
+	}
+	return s
+}
+
+func intp(v int) *int { return &v }
+
+// ── add / validate / revoke ────────────────────────────────────────
+
+func TestAddAndValidateToken(t *testing.T) {
+	s := newTestStore(t)
+	tok, err := s.AddToken("alice", "member", intp(90))
+	if err != nil {
+		t.Fatalf("AddToken: %v", err)
+	}
+	if tok.User != "alice" {
+		t.Errorf("user = %q, want alice", tok.User)
+	}
+	if !strings.HasPrefix(tok.Token, "evt_") {
+		t.Errorf("token = %q, want evt_ prefix", tok.Token)
+	}
+	if len(tok.Token) != 36 {
+		t.Errorf("token length = %d, want 36", len(tok.Token))
+	}
+	if tok.Role != "member" {
+		t.Errorf("role = %q, want member", tok.Role)
+	}
+
+	user, role, err := s.Validate(tok.Token)
+	if err != nil {
+		t.Fatalf("Validate: %v", err)
+	}
+	if user != "alice" || role.Name != "member" {
+		t.Errorf("got (%q, %q), want (alice, member)", user, role.Name)
+	}
+}
+
+func TestInvalidTokenRaises(t *testing.T) {
+	s := newTestStore(t)
+	_, _, err := s.Validate("nonexistent_token")
+	if !errors.Is(err, ErrTokenNotFound{}) {
+		t.Errorf("err = %v, want ErrTokenNotFound", err)
+	}
+}
+
+func TestExpiredTokenRaises(t *testing.T) {
+	s := newTestStore(t)
+	tok, err := s.AddToken("bob", "member", intp(1))
+	if err != nil {
+		t.Fatalf("AddToken: %v", err)
+	}
+	tok.Expires = time.Now().AddDate(0, 0, -1).Format(dateFormat)
+
+	_, _, err = s.Validate(tok.Token)
+	var exp ErrTokenExpired
+	if !errors.As(err, &exp) {
+		t.Fatalf("err = %v, want ErrTokenExpired", err)
+	}
+	if exp.User != "bob" {
+		t.Errorf("user = %q, want bob", exp.User)
+	}
+}
+
+func TestRevokeToken(t *testing.T) {
+	s := newTestStore(t)
+	tok, _ := s.AddToken("charlie", "member", nil)
+	if !s.RevokeToken("charlie") {
+		t.Fatal("RevokeToken returned false")
+	}
+	_, _, err := s.Validate(tok.Token)
+	if !errors.Is(err, ErrTokenNotFound{}) {
+		t.Errorf("err after revoke = %v, want ErrTokenNotFound", err)
+	}
+}
+
+func TestRevokeNonexistentReturnsFalse(t *testing.T) {
+	s := newTestStore(t)
+	if s.RevokeToken("nobody") {
+		t.Error("RevokeToken(nobody) = true, want false")
+	}
+}
+
+func TestDuplicateUserRejected(t *testing.T) {
+	s := newTestStore(t)
+	if _, err := s.AddToken("alice", "member", nil); err != nil {
+		t.Fatalf("first AddToken: %v", err)
+	}
+	_, err := s.AddToken("alice", "member", nil)
+	if err == nil || !strings.Contains(err.Error(), "already exists") {
+		t.Errorf("err = %v, want 'already exists'", err)
+	}
+}
+
+func TestInvalidRoleRejected(t *testing.T) {
+	s := newTestStore(t)
+	_, err := s.AddToken("alice", "nonexistent_role", nil)
+	if err == nil || !strings.Contains(err.Error(), "does not exist") {
+		t.Errorf("err = %v, want 'does not exist'", err)
+	}
+}
+
+func TestListTokensHidesValues(t *testing.T) {
+	s := newTestStore(t)
+	if _, err := s.AddToken("alice", "member", intp(30)); err != nil {
+		t.Fatalf("AddToken: %v", err)
+	}
+	res := s.ListTokens()
+	if len(res) != 1 {
+		t.Fatalf("len = %d, want 1", len(res))
+	}
+	if res[0].User != "alice" {
+		t.Errorf("user = %q, want alice", res[0].User)
+	}
+	// TokenInfo struct intentionally has no Token field.
+}
+
+func TestRateLimitingPerUser(t *testing.T) {
+	s := newTestStore(t)
+	if _, err := s.AddRole("limited", []string{"get_public_key"}, 5, "2/60s"); err != nil {
+		t.Fatalf("AddRole: %v", err)
+	}
+	tok, err := s.AddToken("ratelimited_user", "limited", nil)
+	if err != nil {
+		t.Fatalf("AddToken: %v", err)
+	}
+	if _, _, err := s.Validate(tok.Token); err != nil {
+		t.Fatalf("first Validate: %v", err)
+	}
+	if _, _, err := s.Validate(tok.Token); err != nil {
+		t.Fatalf("second Validate: %v", err)
+	}
+	_, _, err = s.Validate(tok.Token)
+	var rl ErrRateLimit
+	if !errors.As(err, &rl) {
+		t.Fatalf("third Validate err = %v, want ErrRateLimit", err)
+	}
+}
+
+func TestTopKFromRole(t *testing.T) {
+	s := newTestStore(t)
+	tok, _ := s.AddToken("alice", "member", nil)
+	_, role, err := s.Validate(tok.Token)
+	if err != nil {
+		t.Fatal(err)
+	}
+	if role.TopK != 10 {
+		t.Errorf("top_k = %d, want 10", role.TopK)
+	}
+}
+
+func TestNeverExpiresToken(t *testing.T) {
+	s := newTestStore(t)
+	tok, err := s.AddToken("permanent_user", "admin", nil)
+	if err != nil {
+		t.Fatal(err)
+	}
+	if tok.Expires != "" {
+		t.Errorf("expires = %q, want empty", tok.Expires)
+	}
+	if tok.IsExpired() {
+		t.Error("IsExpired = true, want false")
+	}
+	user, _, err := s.Validate(tok.Token)
+	if err != nil {
+		t.Fatal(err)
+	}
+	if user != "permanent_user" {
+		t.Errorf("user = %q, want permanent_user", user)
+	}
+}
+
+func TestPersistAndReload(t *testing.T) {
+	dir := t.TempDir()
+	rolesPath := filepath.Join(dir, "roles.yml")
+	tokensPath := filepath.Join(dir, "tokens.yml")
+
+	s1 := NewStore()
+	if err := s1.LoadFromFiles(rolesPath, tokensPath); err != nil {
+		t.Fatalf("LoadFromFiles: %v", err)
+	}
+	if _, err := s1.AddRole("researcher", []string{"get_public_key", "decrypt_scores"}, 3, "10/60s"); err != nil {
+		t.Fatalf("AddRole: %v", err)
+	}
+	tok, err := s1.AddToken("alice", "member", intp(90))
+	if err != nil {
+		t.Fatalf("AddToken: %v", err)
+	}
+	s1.Flush()
+
+	s2 := NewStore()
+	if err := s2.LoadFromFiles(rolesPath, tokensPath); err != nil {
+		t.Fatalf("reload LoadFromFiles: %v", err)
+	}
+	user, role, err := s2.Validate(tok.Token)
+	if err != nil {
+		t.Fatalf("reload Validate: %v", err)
+	}
+	if user != "alice" || role.Name != "member" {
+		t.Errorf("got (%q, %q), want (alice, member)", user, role.Name)
+	}
+
+	roles := s2.ListRoles()
+	found := false
+	for _, r := range roles {
+		if r.Name == "researcher" {
+			found = true
+			break
+		}
+	}
+	if !found {
+		t.Error("researcher role missing after reload")
+	}
+}
+
+// ── rotation ───────────────────────────────────────────────────────
+
+func TestRotateToken(t *testing.T) {
+	s := newTestStore(t)
+	old, _ := s.AddToken("alice", "member", nil)
+	newTok, err := s.RotateToken("alice")
+	if err != nil {
+		t.Fatal(err)
+	}
+	if newTok.User != "alice" || newTok.Role != "member" {
+		t.Errorf("got (%q, %q), want (alice, member)", newTok.User, newTok.Role)
+	}
+	if !strings.HasPrefix(newTok.Token, "evt_") {
+		t.Errorf("token = %q, want evt_ prefix", newTok.Token)
+	}
+	if newTok.Token == old.Token {
+		t.Error("new token equals old token")
+	}
+}
+
+func TestRotatePreservesExpiry(t *testing.T) {
+	s := newTestStore(t)
+	if _, err := s.AddToken("alice", "member", intp(90)); err != nil {
+		t.Fatal(err)
+	}
+	newTok, err := s.RotateToken("alice")
+	if err != nil {
+		t.Fatal(err)
+	}
+	if newTok.Expires == "" {
+		t.Fatal("expires empty after rotation")
+	}
+	got, err := time.Parse(dateFormat, newTok.Expires)
+	if err != nil {
+		t.Fatal(err)
+	}
+	want := time.Now().UTC().AddDate(0, 0, 90).Format(dateFormat)
+	if got.Format(dateFormat) != want {
+		t.Errorf("expires = %s, want %s", got.Format(dateFormat), want)
+	}
+}
+
+func TestRotateInvalidatesOldToken(t *testing.T) {
+	s := newTestStore(t)
+	old, _ := s.AddToken("alice", "member", nil)
+	if _, err := s.RotateToken("alice"); err != nil {
+		t.Fatal(err)
+	}
+	if _, _, err := s.Validate(old.Token); !errors.Is(err, ErrTokenNotFound{}) {
+		t.Errorf("err = %v, want ErrTokenNotFound", err)
+	}
+}
+
+func TestRotateNewTokenValidates(t *testing.T) {
+	s := newTestStore(t)
+	if _, err := s.AddToken("alice", "member", nil); err != nil {
+		t.Fatal(err)
+	}
+	newTok, err := s.RotateToken("alice")
+	if err != nil {
+		t.Fatal(err)
+	}
+	user, role, err := s.Validate(newTok.Token)
+	if err != nil {
+		t.Fatal(err)
+	}
+	if user != "alice" || role.Name != "member" {
+		t.Errorf("got (%q, %q), want (alice, member)", user, role.Name)
+	}
+}
+
+func TestRotateNonexistentUserRaises(t *testing.T) {
+	s := newTestStore(t)
+	_, err := s.RotateToken("nobody")
+	if err == nil || !strings.Contains(err.Error(), "no token found") {
+		t.Errorf("err = %v, want 'no token found'", err)
+	}
+}
+
+func TestRotateAll(t *testing.T) {
+	s := newTestStore(t)
+	tokA, _ := s.AddToken("alice", "member", nil)
+	tokB, _ := s.AddToken("bob", "admin", nil)
+	res, err := s.RotateAllTokens()
+	if err != nil {
+		t.Fatal(err)
+	}
+	if len(res) != 2 {
+		t.Fatalf("len = %d, want 2", len(res))
+	}
+	got := map[string]bool{}
+	for _, tk := range res {
+		got[tk.User] = true
+	}
+	if !got["alice"] || !got["bob"] {
+		t.Errorf("got users = %v, want alice + bob", got)
+	}
+	if _, _, err := s.Validate(tokA.Token); !errors.Is(err, ErrTokenNotFound{}) {
+		t.Errorf("alice old token still valid")
+	}
+	if _, _, err := s.Validate(tokB.Token); !errors.Is(err, ErrTokenNotFound{}) {
+		t.Errorf("bob old token still valid")
+	}
+}
+
+func TestRotatePersists(t *testing.T) {
+	dir := t.TempDir()
+	rolesPath := filepath.Join(dir, "roles.yml")
+	tokensPath := filepath.Join(dir, "tokens.yml")
+
+	s1 := NewStore()
+	if err := s1.LoadFromFiles(rolesPath, tokensPath); err != nil {
+		t.Fatal(err)
+	}
+	if _, err := s1.AddToken("alice", "member", intp(30)); err != nil {
+		t.Fatal(err)
+	}
+	newTok, err := s1.RotateToken("alice")
+	if err != nil {
+		t.Fatal(err)
+	}
+	s1.Flush()
+
+	s2 := NewStore()
+	if err := s2.LoadFromFiles(rolesPath, tokensPath); err != nil {
+		t.Fatal(err)
+	}
+	user, role, err := s2.Validate(newTok.Token)
+	if err != nil {
+		t.Fatal(err)
+	}
+	if user != "alice" || role.Name != "member" {
+		t.Errorf("got (%q, %q), want (alice, member)", user, role.Name)
+	}
+}
+
+// ── role CRUD ──────────────────────────────────────────────────────
+
+func TestCreateRole(t *testing.T) {
+	s := newTestStore(t)
+	r, err := s.AddRole("researcher", []string{"get_public_key", "decrypt_scores"}, 3, "10/60s")
+	if err != nil {
+		t.Fatal(err)
+	}
+	if r.Name != "researcher" || r.TopK != 3 {
+		t.Errorf("got (%q, %d), want (researcher, 3)", r.Name, r.TopK)
+	}
+	if err := r.CheckScope("get_public_key"); err != nil {
+		t.Errorf("CheckScope(get_public_key): %v", err)
+	}
+}
+
+func TestCreateDuplicateRoleRejected(t *testing.T) {
+	s := newTestStore(t)
+	_, err := s.AddRole("admin", []string{"get_public_key"}, 5, "30/60s")
+	if err == nil || !strings.Contains(err.Error(), "already exists") {
+		t.Errorf("err = %v, want 'already exists'", err)
+	}
+}
+
+func TestUpdateRole(t *testing.T) {
+	s := newTestStore(t)
+	r, err := s.UpdateRole("member", UpdateRoleOpts{TopK: intp(8)})
+	if err != nil {
+		t.Fatal(err)
+	}
+	if r.TopK != 8 || r.Name != "member" {
+		t.Errorf("got (%q, %d), want (member, 8)", r.Name, r.TopK)
+	}
+}
+
+func TestUpdateNonexistentRoleRejected(t *testing.T) {
+	s := newTestStore(t)
+	_, err := s.UpdateRole("nonexistent", UpdateRoleOpts{TopK: intp(5)})
+	if err == nil || !strings.Contains(err.Error(), "does not exist") {
+		t.Errorf("err = %v, want 'does not exist'", err)
+	}
+}
+
+func TestDeleteCustomRole(t *testing.T) {
+	s := newTestStore(t)
+	if _, err := s.AddRole("temp", []string{"get_public_key"}, 1, "5/60s"); err != nil {
+		t.Fatal(err)
+	}
+	if err := s.DeleteRole("temp"); err != nil {
+		t.Fatal(err)
+	}
+	for _, r := range s.ListRoles() {
+		if r.Name == "temp" {
+			t.Error("temp role still present after delete")
+		}
+	}
+}
+
+func TestDeleteDefaultRoleRejected(t *testing.T) {
+	s := newTestStore(t)
+	for _, name := range []string{"admin", "member"} {
+		err := s.DeleteRole(name)
+		if err == nil || !strings.Contains(err.Error(), "Cannot delete default") {
+			t.Errorf("delete %s: err = %v, want 'Cannot delete default'", name, err)
+		}
+	}
+}
+
+func TestDeleteRoleWithActiveTokensRejected(t *testing.T) {
+	s := newTestStore(t)
+	if _, err := s.AddRole("temp", []string{"get_public_key"}, 1, "5/60s"); err != nil {
+		t.Fatal(err)
+	}
+	if _, err := s.AddToken("user1", "temp", nil); err != nil {
+		t.Fatal(err)
+	}
+	err := s.DeleteRole("temp")
+	if err == nil || !strings.Contains(err.Error(), "token for user") {
+		t.Errorf("err = %v, want 'token for user'", err)
+	}
+}
+
+func TestListRoles(t *testing.T) {
+	s := newTestStore(t)
+	roles := s.ListRoles()
+	if len(roles) < 2 {
+		t.Fatalf("len = %d, want >= 2", len(roles))
+	}
+	names := map[string]bool{}
+	for _, r := range roles {
+		names[r.Name] = true
+	}
+	if !names["admin"] || !names["member"] {
+		t.Errorf("missing default roles, got %v", names)
+	}
+}
+
+func TestUpdateRoleClearsRateLimiters(t *testing.T) {
+	s := newTestStore(t)
+	tok, _ := s.AddToken("alice", "member", nil)
+	if _, _, err := s.Validate(tok.Token); err != nil {
+		t.Fatal(err)
+	}
+	if _, ok := s.rateLimiters["alice"]; !ok {
+		t.Fatal("rate limiter not created on validate")
+	}
+	rl := "100/60s"
+	if _, err := s.UpdateRole("member", UpdateRoleOpts{RateLimit: &rl}); err != nil {
+		t.Fatal(err)
+	}
+	if _, ok := s.rateLimiters["alice"]; ok {
+		t.Error("rate limiter not cleared after rate_limit change")
+	}
+}
+
+func TestRoleRateLimitParsed(t *testing.T) {
+	r := &Role{Name: "test", RateLimit: "30/60s"}
+	maxReq, window, err := r.RateLimitParsed()
+	if err != nil {
+		t.Fatal(err)
+	}
+	if maxReq != 30 {
+		t.Errorf("max = %d, want 30", maxReq)
+	}
+	if window != 60*time.Second {
+		t.Errorf("window = %v, want 60s", window)
+	}
+}
+
+// ── scope check ────────────────────────────────────────────────────
+
+func TestScopeAllowsValidMethod(t *testing.T) {
+	r := &Role{Name: "member", Scope: []string{"get_public_key", "decrypt_scores"}}
+	if err := r.CheckScope("get_public_key"); err != nil {
+		t.Errorf("err = %v, want nil", err)
+	}
+}
+
+func TestScopeRejectsInvalidMethod(t *testing.T) {
+	r := &Role{Name: "limited", Scope: []string{"get_public_key"}}
+	err := r.CheckScope("decrypt_scores")
+	var se ErrScope
+	if !errors.As(err, &se) {
+		t.Fatalf("err = %v, want ErrScope", err)
+	}
+	if se.Method != "decrypt_scores" || se.RoleName != "limited" {
+		t.Errorf("got (%q, %q), want (decrypt_scores, limited)", se.Method, se.RoleName)
+	}
+}
+
+// ── TopKExceeded ───────────────────────────────────────────────────
+
+func TestTopKExceededMessage(t *testing.T) {
+	err := ErrTopKExceeded{Requested: 15, MaxTopK: 10, RoleName: "admin"}
+	msg := err.Error()
+	for _, want := range []string{"15", "10", "admin"} {
+		if !strings.Contains(msg, want) {
+			t.Errorf("msg = %q, missing %q", msg, want)
+		}
+	}
+}
+
+// ── demo token loader ─────────────────────────────────────────────
+
+func TestLoadDefaultsWithDemoToken(t *testing.T) {
+	s := NewStore()
+	s.LoadDefaultsWithDemoToken()
+	user, role, err := s.Validate(DemoToken)
+	if err != nil {
+		t.Fatal(err)
+	}
+	if user != "demo" || role.Name != "admin" {
+		t.Errorf("got (%q, %q), want (demo, admin)", user, role.Name)
+	}
+}
+
+// ── persistence file content sanity ──────────────────────────────
+
+func TestPersistedTokensFileContainsToken(t *testing.T) {
+	dir := t.TempDir()
+	rolesPath := filepath.Join(dir, "roles.yml")
+	tokensPath := filepath.Join(dir, "tokens.yml")
+
+	s := NewStore()
+	if err := s.LoadFromFiles(rolesPath, tokensPath); err != nil {
+		t.Fatal(err)
+	}
+	tok, _ := s.AddToken("alice", "member", intp(7))
+	s.Flush()
+
+	body, err := os.ReadFile(tokensPath)
+	if err != nil {
+		t.Fatal(err)
+	}
+	if !strings.Contains(string(body), tok.Token) {
+		t.Errorf("tokens.yml missing token %q", tok.Token)
+	}
+}
diff --git a/vault/internal/tokens/token.go b/vault/internal/tokens/token.go
new file mode 100644
index 0000000..563dbae
--- /dev/null
+++ b/vault/internal/tokens/token.go
@@ -0,0 +1,29 @@
+package tokens
+
+import "time"
+
+type Token struct {
+	User     string `yaml:"user"`
+	Token    string `yaml:"token"`
+	Role     string `yaml:"role"`
+	IssuedAt string `yaml:"issued_at"`         // ISO date
+	Expires  string `yaml:"expires,omitempty"` // ISO date, empty = never
+}
+
+const dateFormat = "2006-01-02"
+
+func (t *Token) IsExpired() bool {
+	return t.IsExpiredAt(time.Now().UTC())
+}
+
+func (t *Token) IsExpiredAt(now time.Time) bool {
+	if t.Expires == "" {
+		return false
+	}
+	exp, err := time.Parse(dateFormat, t.Expires)
+	if err != nil {
+		return false
+	}
+	today := time.Date(now.Year(), now.Month(), now.Day(), 0, 0, 0, 0, time.UTC)
+	return exp.Before(today)
+}
diff --git a/vault/pkg/vaultpb/vault_service.pb.go b/vault/pkg/vaultpb/vault_service.pb.go
new file mode 100644
index 0000000..e2ba23d
--- /dev/null
+++ b/vault/pkg/vaultpb/vault_service.pb.go
@@ -0,0 +1,499 @@
+// Code generated by protoc-gen-go. DO NOT EDIT.
+// versions:
+// 	protoc-gen-go v1.36.11
+// 	protoc        (unknown)
+// source: vault_service.proto
+
+package vaultpb
+
+import (
+	_ "buf.build/gen/go/bufbuild/protovalidate/protocolbuffers/go/buf/validate"
+	protoreflect "google.golang.org/protobuf/reflect/protoreflect"
+	protoimpl "google.golang.org/protobuf/runtime/protoimpl"
+	reflect "reflect"
+	sync "sync"
+	unsafe "unsafe"
+)
+
+const (
+	// Verify that this generated code is sufficiently up-to-date.
+	_ = protoimpl.EnforceVersion(20 - protoimpl.MinVersion)
+	// Verify that runtime/protoimpl is sufficiently up-to-date.
+	_ = protoimpl.EnforceVersion(protoimpl.MaxVersion - 20)
+)
+
+type GetPublicKeyRequest struct {
+	state protoimpl.MessageState `protogen:"open.v1"`
+	// Auth token. Required, Fixed 36 chars (evt_ + 32 hex).
+	Token         string `protobuf:"bytes,1,opt,name=token,proto3" json:"token,omitempty"`
+	unknownFields protoimpl.UnknownFields
+	sizeCache     protoimpl.SizeCache
+}
+
+func (x *GetPublicKeyRequest) Reset() {
+	*x = GetPublicKeyRequest{}
+	mi := &file_vault_service_proto_msgTypes[0]
+	ms := protoimpl.X.MessageStateOf(protoimpl.Pointer(x))
+	ms.StoreMessageInfo(mi)
+}
+
+func (x *GetPublicKeyRequest) String() string {
+	return protoimpl.X.MessageStringOf(x)
+}
+
+func (*GetPublicKeyRequest) ProtoMessage() {}
+
+func (x *GetPublicKeyRequest) ProtoReflect() protoreflect.Message {
+	mi := &file_vault_service_proto_msgTypes[0]
+	if x != nil {
+		ms := protoimpl.X.MessageStateOf(protoimpl.Pointer(x))
+		if ms.LoadMessageInfo() == nil {
+			ms.StoreMessageInfo(mi)
+		}
+		return ms
+	}
+	return mi.MessageOf(x)
+}
+
+// Deprecated: Use GetPublicKeyRequest.ProtoReflect.Descriptor instead.
+func (*GetPublicKeyRequest) Descriptor() ([]byte, []int) {
+	return file_vault_service_proto_rawDescGZIP(), []int{0}
+}
+
+func (x *GetPublicKeyRequest) GetToken() string {
+	if x != nil {
+		return x.Token
+	}
+	return ""
+}
+
+type GetPublicKeyResponse struct {
+	state protoimpl.MessageState `protogen:"open.v1"`
+	// JSON string: {"EncKey.json": "...", "EvalKey.json": "...", "index_name": "..."}
+	KeyBundleJson string `protobuf:"bytes,1,opt,name=key_bundle_json,json=keyBundleJson,proto3" json:"key_bundle_json,omitempty"`
+	Error         string `protobuf:"bytes,2,opt,name=error,proto3" json:"error,omitempty"` // Non-empty on error
+	unknownFields protoimpl.UnknownFields
+	sizeCache     protoimpl.SizeCache
+}
+
+func (x *GetPublicKeyResponse) Reset() {
+	*x = GetPublicKeyResponse{}
+	mi := &file_vault_service_proto_msgTypes[1]
+	ms := protoimpl.X.MessageStateOf(protoimpl.Pointer(x))
+	ms.StoreMessageInfo(mi)
+}
+
+func (x *GetPublicKeyResponse) String() string {
+	return protoimpl.X.MessageStringOf(x)
+}
+
+func (*GetPublicKeyResponse) ProtoMessage() {}
+
+func (x *GetPublicKeyResponse) ProtoReflect() protoreflect.Message {
+	mi := &file_vault_service_proto_msgTypes[1]
+	if x != nil {
+		ms := protoimpl.X.MessageStateOf(protoimpl.Pointer(x))
+		if ms.LoadMessageInfo() == nil {
+			ms.StoreMessageInfo(mi)
+		}
+		return ms
+	}
+	return mi.MessageOf(x)
+}
+
+// Deprecated: Use GetPublicKeyResponse.ProtoReflect.Descriptor instead.
+func (*GetPublicKeyResponse) Descriptor() ([]byte, []int) {
+	return file_vault_service_proto_rawDescGZIP(), []int{1}
+}
+
+func (x *GetPublicKeyResponse) GetKeyBundleJson() string {
+	if x != nil {
+		return x.KeyBundleJson
+	}
+	return ""
+}
+
+func (x *GetPublicKeyResponse) GetError() string {
+	if x != nil {
+		return x.Error
+	}
+	return ""
+}
+
+type DecryptScoresRequest struct {
+	state protoimpl.MessageState `protogen:"open.v1"`
+	// Auth token. Required, Fixed 36 chars (evt_ + 32 hex).
+	Token string `protobuf:"bytes,1,opt,name=token,proto3" json:"token,omitempty"`
+	// Base64-encoded CiphertextScore protobuf. Required.
+	EncryptedBlobB64 string `protobuf:"bytes,2,opt,name=encrypted_blob_b64,json=encryptedBlobB64,proto3" json:"encrypted_blob_b64,omitempty"`
+	// Number of top results to return.
+	// Per-role limits (e.g., admin=50, member=10) enforced at the business logic layer.
+	TopK          int32 `protobuf:"varint,3,opt,name=top_k,json=topK,proto3" json:"top_k,omitempty"`
+	unknownFields protoimpl.UnknownFields
+	sizeCache     protoimpl.SizeCache
+}
+
+func (x *DecryptScoresRequest) Reset() {
+	*x = DecryptScoresRequest{}
+	mi := &file_vault_service_proto_msgTypes[2]
+	ms := protoimpl.X.MessageStateOf(protoimpl.Pointer(x))
+	ms.StoreMessageInfo(mi)
+}
+
+func (x *DecryptScoresRequest) String() string {
+	return protoimpl.X.MessageStringOf(x)
+}
+
+func (*DecryptScoresRequest) ProtoMessage() {}
+
+func (x *DecryptScoresRequest) ProtoReflect() protoreflect.Message {
+	mi := &file_vault_service_proto_msgTypes[2]
+	if x != nil {
+		ms := protoimpl.X.MessageStateOf(protoimpl.Pointer(x))
+		if ms.LoadMessageInfo() == nil {
+			ms.StoreMessageInfo(mi)
+		}
+		return ms
+	}
+	return mi.MessageOf(x)
+}
+
+// Deprecated: Use DecryptScoresRequest.ProtoReflect.Descriptor instead.
+func (*DecryptScoresRequest) Descriptor() ([]byte, []int) {
+	return file_vault_service_proto_rawDescGZIP(), []int{2}
+}
+
+func (x *DecryptScoresRequest) GetToken() string {
+	if x != nil {
+		return x.Token
+	}
+	return ""
+}
+
+func (x *DecryptScoresRequest) GetEncryptedBlobB64() string {
+	if x != nil {
+		return x.EncryptedBlobB64
+	}
+	return ""
+}
+
+func (x *DecryptScoresRequest) GetTopK() int32 {
+	if x != nil {
+		return x.TopK
+	}
+	return 0
+}
+
+type ScoreEntry struct {
+	state         protoimpl.MessageState `protogen:"open.v1"`
+	ShardIdx      int32                  `protobuf:"varint,1,opt,name=shard_idx,json=shardIdx,proto3" json:"shard_idx,omitempty"`
+	RowIdx        int32                  `protobuf:"varint,2,opt,name=row_idx,json=rowIdx,proto3" json:"row_idx,omitempty"`
+	Score         float64                `protobuf:"fixed64,3,opt,name=score,proto3" json:"score,omitempty"`
+	unknownFields protoimpl.UnknownFields
+	sizeCache     protoimpl.SizeCache
+}
+
+func (x *ScoreEntry) Reset() {
+	*x = ScoreEntry{}
+	mi := &file_vault_service_proto_msgTypes[3]
+	ms := protoimpl.X.MessageStateOf(protoimpl.Pointer(x))
+	ms.StoreMessageInfo(mi)
+}
+
+func (x *ScoreEntry) String() string {
+	return protoimpl.X.MessageStringOf(x)
+}
+
+func (*ScoreEntry) ProtoMessage() {}
+
+func (x *ScoreEntry) ProtoReflect() protoreflect.Message {
+	mi := &file_vault_service_proto_msgTypes[3]
+	if x != nil {
+		ms := protoimpl.X.MessageStateOf(protoimpl.Pointer(x))
+		if ms.LoadMessageInfo() == nil {
+			ms.StoreMessageInfo(mi)
+		}
+		return ms
+	}
+	return mi.MessageOf(x)
+}
+
+// Deprecated: Use ScoreEntry.ProtoReflect.Descriptor instead.
+func (*ScoreEntry) Descriptor() ([]byte, []int) {
+	return file_vault_service_proto_rawDescGZIP(), []int{3}
+}
+
+func (x *ScoreEntry) GetShardIdx() int32 {
+	if x != nil {
+		return x.ShardIdx
+	}
+	return 0
+}
+
+func (x *ScoreEntry) GetRowIdx() int32 {
+	if x != nil {
+		return x.RowIdx
+	}
+	return 0
+}
+
+func (x *ScoreEntry) GetScore() float64 {
+	if x != nil {
+		return x.Score
+	}
+	return 0
+}
+
+type DecryptScoresResponse struct {
+	state         protoimpl.MessageState `protogen:"open.v1"`
+	Results       []*ScoreEntry          `protobuf:"bytes,1,rep,name=results,proto3" json:"results,omitempty"` // Top-K results sorted by score descending
+	Error         string                 `protobuf:"bytes,2,opt,name=error,proto3" json:"error,omitempty"`     // Non-empty on error
+	unknownFields protoimpl.UnknownFields
+	sizeCache     protoimpl.SizeCache
+}
+
+func (x *DecryptScoresResponse) Reset() {
+	*x = DecryptScoresResponse{}
+	mi := &file_vault_service_proto_msgTypes[4]
+	ms := protoimpl.X.MessageStateOf(protoimpl.Pointer(x))
+	ms.StoreMessageInfo(mi)
+}
+
+func (x *DecryptScoresResponse) String() string {
+	return protoimpl.X.MessageStringOf(x)
+}
+
+func (*DecryptScoresResponse) ProtoMessage() {}
+
+func (x *DecryptScoresResponse) ProtoReflect() protoreflect.Message {
+	mi := &file_vault_service_proto_msgTypes[4]
+	if x != nil {
+		ms := protoimpl.X.MessageStateOf(protoimpl.Pointer(x))
+		if ms.LoadMessageInfo() == nil {
+			ms.StoreMessageInfo(mi)
+		}
+		return ms
+	}
+	return mi.MessageOf(x)
+}
+
+// Deprecated: Use DecryptScoresResponse.ProtoReflect.Descriptor instead.
+func (*DecryptScoresResponse) Descriptor() ([]byte, []int) {
+	return file_vault_service_proto_rawDescGZIP(), []int{4}
+}
+
+func (x *DecryptScoresResponse) GetResults() []*ScoreEntry {
+	if x != nil {
+		return x.Results
+	}
+	return nil
+}
+
+func (x *DecryptScoresResponse) GetError() string {
+	if x != nil {
+		return x.Error
+	}
+	return ""
+}
+
+type DecryptMetadataRequest struct {
+	state protoimpl.MessageState `protogen:"open.v1"`
+	// Auth token. Required, Fixed 36 chars (evt_ + 32 hex).
+	Token string `protobuf:"bytes,1,opt,name=token,proto3" json:"token,omitempty"`
+	// Base64-encoded AES blobs. Required, max 1000 items, each non-empty.
+	EncryptedMetadataList []string `protobuf:"bytes,2,rep,name=encrypted_metadata_list,json=encryptedMetadataList,proto3" json:"encrypted_metadata_list,omitempty"`
+	unknownFields         protoimpl.UnknownFields
+	sizeCache             protoimpl.SizeCache
+}
+
+func (x *DecryptMetadataRequest) Reset() {
+	*x = DecryptMetadataRequest{}
+	mi := &file_vault_service_proto_msgTypes[5]
+	ms := protoimpl.X.MessageStateOf(protoimpl.Pointer(x))
+	ms.StoreMessageInfo(mi)
+}
+
+func (x *DecryptMetadataRequest) String() string {
+	return protoimpl.X.MessageStringOf(x)
+}
+
+func (*DecryptMetadataRequest) ProtoMessage() {}
+
+func (x *DecryptMetadataRequest) ProtoReflect() protoreflect.Message {
+	mi := &file_vault_service_proto_msgTypes[5]
+	if x != nil {
+		ms := protoimpl.X.MessageStateOf(protoimpl.Pointer(x))
+		if ms.LoadMessageInfo() == nil {
+			ms.StoreMessageInfo(mi)
+		}
+		return ms
+	}
+	return mi.MessageOf(x)
+}
+
+// Deprecated: Use DecryptMetadataRequest.ProtoReflect.Descriptor instead.
+func (*DecryptMetadataRequest) Descriptor() ([]byte, []int) {
+	return file_vault_service_proto_rawDescGZIP(), []int{5}
+}
+
+func (x *DecryptMetadataRequest) GetToken() string {
+	if x != nil {
+		return x.Token
+	}
+	return ""
+}
+
+func (x *DecryptMetadataRequest) GetEncryptedMetadataList() []string {
+	if x != nil {
+		return x.EncryptedMetadataList
+	}
+	return nil
+}
+
+type DecryptMetadataResponse struct {
+	state protoimpl.MessageState `protogen:"open.v1"`
+	// Each element is a JSON-serialized decrypted metadata object
+	DecryptedMetadata []string `protobuf:"bytes,1,rep,name=decrypted_metadata,json=decryptedMetadata,proto3" json:"decrypted_metadata,omitempty"`
+	Error             string   `protobuf:"bytes,2,opt,name=error,proto3" json:"error,omitempty"` // Non-empty on error
+	unknownFields     protoimpl.UnknownFields
+	sizeCache         protoimpl.SizeCache
+}
+
+func (x *DecryptMetadataResponse) Reset() {
+	*x = DecryptMetadataResponse{}
+	mi := &file_vault_service_proto_msgTypes[6]
+	ms := protoimpl.X.MessageStateOf(protoimpl.Pointer(x))
+	ms.StoreMessageInfo(mi)
+}
+
+func (x *DecryptMetadataResponse) String() string {
+	return protoimpl.X.MessageStringOf(x)
+}
+
+func (*DecryptMetadataResponse) ProtoMessage() {}
+
+func (x *DecryptMetadataResponse) ProtoReflect() protoreflect.Message {
+	mi := &file_vault_service_proto_msgTypes[6]
+	if x != nil {
+		ms := protoimpl.X.MessageStateOf(protoimpl.Pointer(x))
+		if ms.LoadMessageInfo() == nil {
+			ms.StoreMessageInfo(mi)
+		}
+		return ms
+	}
+	return mi.MessageOf(x)
+}
+
+// Deprecated: Use DecryptMetadataResponse.ProtoReflect.Descriptor instead.
+func (*DecryptMetadataResponse) Descriptor() ([]byte, []int) {
+	return file_vault_service_proto_rawDescGZIP(), []int{6}
+}
+
+func (x *DecryptMetadataResponse) GetDecryptedMetadata() []string {
+	if x != nil {
+		return x.DecryptedMetadata
+	}
+	return nil
+}
+
+func (x *DecryptMetadataResponse) GetError() string {
+	if x != nil {
+		return x.Error
+	}
+	return ""
+}
+
+var File_vault_service_proto protoreflect.FileDescriptor
+
+const file_vault_service_proto_rawDesc = "" +
+	"\n" +
+	"\x13vault_service.proto\x12\rrune.vault.v1\x1a\x1bbuf/validate/validate.proto\"6\n" +
+	"\x13GetPublicKeyRequest\x12\x1f\n" +
+	"\x05token\x18\x01 \x01(\tB\t\xbaH\x06r\x04\x10$\x18$R\x05token\"T\n" +
+	"\x14GetPublicKeyResponse\x12&\n" +
+	"\x0fkey_bundle_json\x18\x01 \x01(\tR\rkeyBundleJson\x12\x14\n" +
+	"\x05error\x18\x02 \x01(\tR\x05error\"\x8f\x01\n" +
+	"\x14DecryptScoresRequest\x12\x1f\n" +
+	"\x05token\x18\x01 \x01(\tB\t\xbaH\x06r\x04\x10$\x18$R\x05token\x125\n" +
+	"\x12encrypted_blob_b64\x18\x02 \x01(\tB\a\xbaH\x04r\x02\x10\x01R\x10encryptedBlobB64\x12\x1f\n" +
+	"\x05top_k\x18\x03 \x01(\x05B\n" +
+	"\xbaH\a\x1a\x05\x18\xac\x02(\x01R\x04topK\"X\n" +
+	"\n" +
+	"ScoreEntry\x12\x1b\n" +
+	"\tshard_idx\x18\x01 \x01(\x05R\bshardIdx\x12\x17\n" +
+	"\arow_idx\x18\x02 \x01(\x05R\x06rowIdx\x12\x14\n" +
+	"\x05score\x18\x03 \x01(\x01R\x05score\"b\n" +
+	"\x15DecryptScoresResponse\x123\n" +
+	"\aresults\x18\x01 \x03(\v2\x19.rune.vault.v1.ScoreEntryR\aresults\x12\x14\n" +
+	"\x05error\x18\x02 \x01(\tR\x05error\"\x84\x01\n" +
+	"\x16DecryptMetadataRequest\x12\x1f\n" +
+	"\x05token\x18\x01 \x01(\tB\t\xbaH\x06r\x04\x10$\x18$R\x05token\x12I\n" +
+	"\x17encrypted_metadata_list\x18\x02 \x03(\tB\x11\xbaH\x0e\x92\x01\v\b\x01\x10\xe8\a\"\x04r\x02\x10\x01R\x15encryptedMetadataList\"^\n" +
+	"\x17DecryptMetadataResponse\x12-\n" +
+	"\x12decrypted_metadata\x18\x01 \x03(\tR\x11decryptedMetadata\x12\x14\n" +
+	"\x05error\x18\x02 \x01(\tR\x05error2\xa5\x02\n" +
+	"\fVaultService\x12W\n" +
+	"\fGetPublicKey\x12\".rune.vault.v1.GetPublicKeyRequest\x1a#.rune.vault.v1.GetPublicKeyResponse\x12Z\n" +
+	"\rDecryptScores\x12#.rune.vault.v1.DecryptScoresRequest\x1a$.rune.vault.v1.DecryptScoresResponse\x12`\n" +
+	"\x0fDecryptMetadata\x12%.rune.vault.v1.DecryptMetadataRequest\x1a&.rune.vault.v1.DecryptMetadataResponseb\x06proto3"
+
+var (
+	file_vault_service_proto_rawDescOnce sync.Once
+	file_vault_service_proto_rawDescData []byte
+)
+
+func file_vault_service_proto_rawDescGZIP() []byte {
+	file_vault_service_proto_rawDescOnce.Do(func() {
+		file_vault_service_proto_rawDescData = protoimpl.X.CompressGZIP(unsafe.Slice(unsafe.StringData(file_vault_service_proto_rawDesc), len(file_vault_service_proto_rawDesc)))
+	})
+	return file_vault_service_proto_rawDescData
+}
+
+var file_vault_service_proto_msgTypes = make([]protoimpl.MessageInfo, 7)
+var file_vault_service_proto_goTypes = []any{
+	(*GetPublicKeyRequest)(nil),     // 0: rune.vault.v1.GetPublicKeyRequest
+	(*GetPublicKeyResponse)(nil),    // 1: rune.vault.v1.GetPublicKeyResponse
+	(*DecryptScoresRequest)(nil),    // 2: rune.vault.v1.DecryptScoresRequest
+	(*ScoreEntry)(nil),              // 3: rune.vault.v1.ScoreEntry
+	(*DecryptScoresResponse)(nil),   // 4: rune.vault.v1.DecryptScoresResponse
+	(*DecryptMetadataRequest)(nil),  // 5: rune.vault.v1.DecryptMetadataRequest
+	(*DecryptMetadataResponse)(nil), // 6: rune.vault.v1.DecryptMetadataResponse
+}
+var file_vault_service_proto_depIdxs = []int32{
+	3, // 0: rune.vault.v1.DecryptScoresResponse.results:type_name -> rune.vault.v1.ScoreEntry
+	0, // 1: rune.vault.v1.VaultService.GetPublicKey:input_type -> rune.vault.v1.GetPublicKeyRequest
+	2, // 2: rune.vault.v1.VaultService.DecryptScores:input_type -> rune.vault.v1.DecryptScoresRequest
+	5, // 3: rune.vault.v1.VaultService.DecryptMetadata:input_type -> rune.vault.v1.DecryptMetadataRequest
+	1, // 4: rune.vault.v1.VaultService.GetPublicKey:output_type -> rune.vault.v1.GetPublicKeyResponse
+	4, // 5: rune.vault.v1.VaultService.DecryptScores:output_type -> rune.vault.v1.DecryptScoresResponse
+	6, // 6: rune.vault.v1.VaultService.DecryptMetadata:output_type -> rune.vault.v1.DecryptMetadataResponse
+	4, // [4:7] is the sub-list for method output_type
+	1, // [1:4] is the sub-list for method input_type
+	1, // [1:1] is the sub-list for extension type_name
+	1, // [1:1] is the sub-list for extension extendee
+	0, // [0:1] is the sub-list for field type_name
+}
+
+func init() { file_vault_service_proto_init() }
+func file_vault_service_proto_init() {
+	if File_vault_service_proto != nil {
+		return
+	}
+	type x struct{}
+	out := protoimpl.TypeBuilder{
+		File: protoimpl.DescBuilder{
+			GoPackagePath: reflect.TypeOf(x{}).PkgPath(),
+			RawDescriptor: unsafe.Slice(unsafe.StringData(file_vault_service_proto_rawDesc), len(file_vault_service_proto_rawDesc)),
+			NumEnums:      0,
+			NumMessages:   7,
+			NumExtensions: 0,
+			NumServices:   1,
+		},
+		GoTypes:           file_vault_service_proto_goTypes,
+		DependencyIndexes: file_vault_service_proto_depIdxs,
+		MessageInfos:      file_vault_service_proto_msgTypes,
+	}.Build()
+	File_vault_service_proto = out.File
+	file_vault_service_proto_goTypes = nil
+	file_vault_service_proto_depIdxs = nil
+}
diff --git a/vault/pkg/vaultpb/vault_service_grpc.pb.go b/vault/pkg/vaultpb/vault_service_grpc.pb.go
new file mode 100644
index 0000000..7108750
--- /dev/null
+++ b/vault/pkg/vaultpb/vault_service_grpc.pb.go
@@ -0,0 +1,209 @@
+// Code generated by protoc-gen-go-grpc. DO NOT EDIT.
+// versions:
+// - protoc-gen-go-grpc v1.6.1
+// - protoc             (unknown)
+// source: vault_service.proto
+
+package vaultpb
+
+import (
+	context "context"
+	grpc "google.golang.org/grpc"
+	codes "google.golang.org/grpc/codes"
+	status "google.golang.org/grpc/status"
+)
+
+// This is a compile-time assertion to ensure that this generated file
+// is compatible with the grpc package it is being compiled against.
+// Requires gRPC-Go v1.64.0 or later.
+const _ = grpc.SupportPackageIsVersion9
+
+const (
+	VaultService_GetPublicKey_FullMethodName    = "/rune.vault.v1.VaultService/GetPublicKey"
+	VaultService_DecryptScores_FullMethodName   = "/rune.vault.v1.VaultService/DecryptScores"
+	VaultService_DecryptMetadata_FullMethodName = "/rune.vault.v1.VaultService/DecryptMetadata"
+)
+
+// VaultServiceClient is the client API for VaultService service.
+//
+// For semantics around ctx use and closing/ending streaming RPCs, please refer to https://pkg.go.dev/google.golang.org/grpc/?tab=doc#ClientConn.NewStream.
+//
+// Rune-Vault gRPC service.
+// Holds the FHE secret key and performs all decryption operations.
+type VaultServiceClient interface {
+	// Returns the public key bundle (EncKey, EvalKey, optional team index name).
+	GetPublicKey(ctx context.Context, in *GetPublicKeyRequest, opts ...grpc.CallOption) (*GetPublicKeyResponse, error)
+	// Decrypts FHE-encrypted similarity scores and applies Top-K filtering.
+	DecryptScores(ctx context.Context, in *DecryptScoresRequest, opts ...grpc.CallOption) (*DecryptScoresResponse, error)
+	// Decrypts a list of AES-encrypted metadata strings.
+	DecryptMetadata(ctx context.Context, in *DecryptMetadataRequest, opts ...grpc.CallOption) (*DecryptMetadataResponse, error)
+}
+
+type vaultServiceClient struct {
+	cc grpc.ClientConnInterface
+}
+
+func NewVaultServiceClient(cc grpc.ClientConnInterface) VaultServiceClient {
+	return &vaultServiceClient{cc}
+}
+
+func (c *vaultServiceClient) GetPublicKey(ctx context.Context, in *GetPublicKeyRequest, opts ...grpc.CallOption) (*GetPublicKeyResponse, error) {
+	cOpts := append([]grpc.CallOption{grpc.StaticMethod()}, opts...)
+	out := new(GetPublicKeyResponse)
+	err := c.cc.Invoke(ctx, VaultService_GetPublicKey_FullMethodName, in, out, cOpts...)
+	if err != nil {
+		return nil, err
+	}
+	return out, nil
+}
+
+func (c *vaultServiceClient) DecryptScores(ctx context.Context, in *DecryptScoresRequest, opts ...grpc.CallOption) (*DecryptScoresResponse, error) {
+	cOpts := append([]grpc.CallOption{grpc.StaticMethod()}, opts...)
+	out := new(DecryptScoresResponse)
+	err := c.cc.Invoke(ctx, VaultService_DecryptScores_FullMethodName, in, out, cOpts...)
+	if err != nil {
+		return nil, err
+	}
+	return out, nil
+}
+
+func (c *vaultServiceClient) DecryptMetadata(ctx context.Context, in *DecryptMetadataRequest, opts ...grpc.CallOption) (*DecryptMetadataResponse, error) {
+	cOpts := append([]grpc.CallOption{grpc.StaticMethod()}, opts...)
+	out := new(DecryptMetadataResponse)
+	err := c.cc.Invoke(ctx, VaultService_DecryptMetadata_FullMethodName, in, out, cOpts...)
+	if err != nil {
+		return nil, err
+	}
+	return out, nil
+}
+
+// VaultServiceServer is the server API for VaultService service.
+// All implementations must embed UnimplementedVaultServiceServer
+// for forward compatibility.
+//
+// Rune-Vault gRPC service.
+// Holds the FHE secret key and performs all decryption operations.
+type VaultServiceServer interface {
+	// Returns the public key bundle (EncKey, EvalKey, optional team index name).
+	GetPublicKey(context.Context, *GetPublicKeyRequest) (*GetPublicKeyResponse, error)
+	// Decrypts FHE-encrypted similarity scores and applies Top-K filtering.
+	DecryptScores(context.Context, *DecryptScoresRequest) (*DecryptScoresResponse, error)
+	// Decrypts a list of AES-encrypted metadata strings.
+	DecryptMetadata(context.Context, *DecryptMetadataRequest) (*DecryptMetadataResponse, error)
+	mustEmbedUnimplementedVaultServiceServer()
+}
+
+// UnimplementedVaultServiceServer must be embedded to have
+// forward compatible implementations.
+//
+// NOTE: this should be embedded by value instead of pointer to avoid a nil
+// pointer dereference when methods are called.
+type UnimplementedVaultServiceServer struct{}
+
+func (UnimplementedVaultServiceServer) GetPublicKey(context.Context, *GetPublicKeyRequest) (*GetPublicKeyResponse, error) {
+	return nil, status.Error(codes.Unimplemented, "method GetPublicKey not implemented")
+}
+func (UnimplementedVaultServiceServer) DecryptScores(context.Context, *DecryptScoresRequest) (*DecryptScoresResponse, error) {
+	return nil, status.Error(codes.Unimplemented, "method DecryptScores not implemented")
+}
+func (UnimplementedVaultServiceServer) DecryptMetadata(context.Context, *DecryptMetadataRequest) (*DecryptMetadataResponse, error) {
+	return nil, status.Error(codes.Unimplemented, "method DecryptMetadata not implemented")
+}
+func (UnimplementedVaultServiceServer) mustEmbedUnimplementedVaultServiceServer() {}
+func (UnimplementedVaultServiceServer) testEmbeddedByValue()                      {}
+
+// UnsafeVaultServiceServer may be embedded to opt out of forward compatibility for this service.
+// Use of this interface is not recommended, as added methods to VaultServiceServer will
+// result in compilation errors.
+type UnsafeVaultServiceServer interface {
+	mustEmbedUnimplementedVaultServiceServer()
+}
+
+func RegisterVaultServiceServer(s grpc.ServiceRegistrar, srv VaultServiceServer) {
+	// If the following call panics, it indicates UnimplementedVaultServiceServer was
+	// embedded by pointer and is nil.  This will cause panics if an
+	// unimplemented method is ever invoked, so we test this at initialization
+	// time to prevent it from happening at runtime later due to I/O.
+	if t, ok := srv.(interface{ testEmbeddedByValue() }); ok {
+		t.testEmbeddedByValue()
+	}
+	s.RegisterService(&VaultService_ServiceDesc, srv)
+}
+
+func _VaultService_GetPublicKey_Handler(srv interface{}, ctx context.Context, dec func(interface{}) error, interceptor grpc.UnaryServerInterceptor) (interface{}, error) {
+	in := new(GetPublicKeyRequest)
+	if err := dec(in); err != nil {
+		return nil, err
+	}
+	if interceptor == nil {
+		return srv.(VaultServiceServer).GetPublicKey(ctx, in)
+	}
+	info := &grpc.UnaryServerInfo{
+		Server:     srv,
+		FullMethod: VaultService_GetPublicKey_FullMethodName,
+	}
+	handler := func(ctx context.Context, req interface{}) (interface{}, error) {
+		return srv.(VaultServiceServer).GetPublicKey(ctx, req.(*GetPublicKeyRequest))
+	}
+	return interceptor(ctx, in, info, handler)
+}
+
+func _VaultService_DecryptScores_Handler(srv interface{}, ctx context.Context, dec func(interface{}) error, interceptor grpc.UnaryServerInterceptor) (interface{}, error) {
+	in := new(DecryptScoresRequest)
+	if err := dec(in); err != nil {
+		return nil, err
+	}
+	if interceptor == nil {
+		return srv.(VaultServiceServer).DecryptScores(ctx, in)
+	}
+	info := &grpc.UnaryServerInfo{
+		Server:     srv,
+		FullMethod: VaultService_DecryptScores_FullMethodName,
+	}
+	handler := func(ctx context.Context, req interface{}) (interface{}, error) {
+		return srv.(VaultServiceServer).DecryptScores(ctx, req.(*DecryptScoresRequest))
+	}
+	return interceptor(ctx, in, info, handler)
+}
+
+func _VaultService_DecryptMetadata_Handler(srv interface{}, ctx context.Context, dec func(interface{}) error, interceptor grpc.UnaryServerInterceptor) (interface{}, error) {
+	in := new(DecryptMetadataRequest)
+	if err := dec(in); err != nil {
+		return nil, err
+	}
+	if interceptor == nil {
+		return srv.(VaultServiceServer).DecryptMetadata(ctx, in)
+	}
+	info := &grpc.UnaryServerInfo{
+		Server:     srv,
+		FullMethod: VaultService_DecryptMetadata_FullMethodName,
+	}
+	handler := func(ctx context.Context, req interface{}) (interface{}, error) {
+		return srv.(VaultServiceServer).DecryptMetadata(ctx, req.(*DecryptMetadataRequest))
+	}
+	return interceptor(ctx, in, info, handler)
+}
+
+// VaultService_ServiceDesc is the grpc.ServiceDesc for VaultService service.
+// It's only intended for direct use with grpc.RegisterService,
+// and not to be introspected or modified (even as a copy)
+var VaultService_ServiceDesc = grpc.ServiceDesc{
+	ServiceName: "rune.vault.v1.VaultService",
+	HandlerType: (*VaultServiceServer)(nil),
+	Methods: []grpc.MethodDesc{
+		{
+			MethodName: "GetPublicKey",
+			Handler:    _VaultService_GetPublicKey_Handler,
+		},
+		{
+			MethodName: "DecryptScores",
+			Handler:    _VaultService_DecryptScores_Handler,
+		},
+		{
+			MethodName: "DecryptMetadata",
+			Handler:    _VaultService_DecryptMetadata_Handler,
+		},
+	},
+	Streams:  []grpc.StreamDesc{},
+	Metadata: "vault_service.proto",
+}
diff --git a/vault/proto/__init__.py b/vault/proto/__init__.py
deleted file mode 100644
index e69de29..0000000
diff --git a/vault/request_validator.py b/vault/request_validator.py
deleted file mode 100644
index 61f5d17..0000000
--- a/vault/request_validator.py
+++ /dev/null
@@ -1,96 +0,0 @@
-"""
-gRPC request input validation for Rune-Vault.
-
-Two layers of validation:
-  1. Proto-level: protovalidate enforces constraints declared in .proto
-     annotations (field length, int range, repeated item rules).
-  2. Runtime: supplementary checks that cannot be expressed in proto
-     annotations (control characters, whitespace, path traversal).
-
-Both layers are executed by ValidationInterceptor before requests
-reach business logic.
-"""
-
-import re
-
-import protovalidate
-
-# ---------------------------------------------------------------------------
-# Shared constants & patterns
-# ---------------------------------------------------------------------------
-
-MAX_INDEX_NAME_LENGTH = 128
-INDEX_NAME_PATTERN = re.compile(r"^[a-zA-Z0-9_-]+$")
-
-_CONTROL_CHAR_RE = re.compile(r"[\x00-\x1f\x7f]")
-
-# Cached validator instance (compiles CEL rules once per descriptor).
-_validator = protovalidate.Validator()
-
-
-# ---------------------------------------------------------------------------
-# Proto-level validation (protovalidate)
-# ---------------------------------------------------------------------------
-
-
-def validate_proto(request) -> None:
-    """Run protovalidate against the request message.
-
-    Raises protovalidate.ValidationError with structured Violation list.
-    """
-    _validator.validate(request)
-
-
-# ---------------------------------------------------------------------------
-# Supplementary runtime checks
-# ---------------------------------------------------------------------------
-
-
-class RuntimeValidationError(Exception):
-    """Raised for checks that proto annotations cannot express."""
-
-
-def check_token_safety(token: str) -> None:
-    """Reject tokens with control characters or surrounding whitespace."""
-    if _CONTROL_CHAR_RE.search(token):
-        raise RuntimeValidationError("token: must not contain control characters")
-    if token != token.strip():
-        raise RuntimeValidationError("token: must not have leading or trailing whitespace")
-
-
-def validate_index_name(name: str) -> None:
-    """Validate an index name (for future use)."""
-    if not name:
-        raise RuntimeValidationError("index_name: must not be empty")
-    if len(name) > MAX_INDEX_NAME_LENGTH:
-        raise RuntimeValidationError(
-            f"index_name: length {len(name)} exceeds maximum {MAX_INDEX_NAME_LENGTH}"
-        )
-    if not INDEX_NAME_PATTERN.match(name):
-        raise RuntimeValidationError(
-            "index_name: must contain only alphanumeric characters, underscores, or hyphens"
-        )
-
-
-# ---------------------------------------------------------------------------
-# Vault-method supplementary checks (keyed by gRPC method path)
-# ---------------------------------------------------------------------------
-
-
-def _check_get_public_key(request) -> None:
-    check_token_safety(request.token)
-
-
-def _check_decrypt_scores(request) -> None:
-    check_token_safety(request.token)
-
-
-def _check_decrypt_metadata(request) -> None:
-    check_token_safety(request.token)
-
-
-RUNTIME_CHECKS = {
-    "/rune.vault.v1.VaultService/GetPublicKey": _check_get_public_key,
-    "/rune.vault.v1.VaultService/DecryptScores": _check_decrypt_scores,
-    "/rune.vault.v1.VaultService/DecryptMetadata": _check_decrypt_metadata,
-}
diff --git a/vault/requirements.txt b/vault/requirements.txt
deleted file mode 100644
index 35731bd..0000000
--- a/vault/requirements.txt
+++ /dev/null
@@ -1,20 +0,0 @@
-# Rune-Vault Dependencies
-
-# FHE Encryption
-pyenvector>=1.2.0
-numpy>=1.24.0
-
-# Token Management
-PyYAML>=6.0
-
-# Cryptography (HKDF key derivation)
-cryptography>=41.0.0
-
-# gRPC
-grpcio>=1.60.2,<=1.74.0
-grpcio-tools>=1.60.2,<=1.74.0
-grpcio-health-checking>=1.60.2,<=1.74.0
-grpcio-reflection>=1.60.2,<=1.74.0
-
-# gRPC input validation (protovalidate)
-protovalidate>=1.1.0
diff --git a/vault/scripts/proto-gen.sh b/vault/scripts/proto-gen.sh
deleted file mode 100755
index 084cc13..0000000
--- a/vault/scripts/proto-gen.sh
+++ /dev/null
@@ -1,52 +0,0 @@
-#!/usr/bin/env bash
-# Generate Python protobuf/gRPC stubs from .proto files.
-#
-# Prerequisites:
-#   brew install bufbuild/buf/buf   (or: https://buf.build/docs/installation)
-#   pip install grpcio-tools
-#
-# Usage:
-#   ./scripts/proto-gen.sh          (from vault/ directory)
-#   make proto-gen                  (via Makefile)
-set -euo pipefail
-cd "$(dirname "$0")/.."
-
-# ── 1. Resolve buf dependencies ──────────────────────────────────────
-echo "[proto-gen] Updating buf dependencies..."
-buf dep update
-
-# ── 2. Export protovalidate protos to temp dir ───────────────────────
-DEPS_DIR=$(mktemp -d)
-trap 'rm -rf "$DEPS_DIR"' EXIT
-
-echo "[proto-gen] Exporting protovalidate protos..."
-buf export buf.build/bufbuild/protovalidate -o "$DEPS_DIR"
-
-# ── 3. Locate google well-known protos bundled with grpcio-tools ────
-GRPC_PROTO=$(python3 -c "
-import grpc_tools, os
-print(os.path.join(os.path.dirname(grpc_tools.__file__), '_proto'))
-")
-
-# ── 4. Generate vault_service stubs ─────────────────────────────────
-echo "[proto-gen] Generating vault_service_pb2.py / vault_service_pb2_grpc.py..."
-python3 -m grpc_tools.protoc \
-  -Iproto \
-  -I"$DEPS_DIR" \
-  -I"$GRPC_PROTO" \
-  --python_out=proto \
-  --grpc_python_out=proto \
-  proto/vault_service.proto
-
-# ── 5. Generate protovalidate runtime stubs ──────────────────────────
-echo "[proto-gen] Generating buf/validate/validate_pb2.py..."
-python3 -m grpc_tools.protoc \
-  -I"$DEPS_DIR" \
-  -I"$GRPC_PROTO" \
-  --python_out=. \
-  "$DEPS_DIR/buf/validate/validate.proto"
-
-mkdir -p buf/validate
-touch buf/__init__.py buf/validate/__init__.py
-
-echo "[proto-gen] Done."
diff --git a/vault/token_store.py b/vault/token_store.py
deleted file mode 100644
index e3c4ba2..0000000
--- a/vault/token_store.py
+++ /dev/null
@@ -1,580 +0,0 @@
-"""
-Per-user token and role management with async YAML persistence.
-
-Memory-first architecture: changes take effect immediately in-memory,
-then async-persist to YAML files for startup recovery.
-"""
-
-import datetime
-import logging
-import os
-import secrets
-import tempfile
-import threading
-import time
-from collections import defaultdict
-from concurrent.futures import ThreadPoolExecutor
-from dataclasses import dataclass
-
-import yaml
-
-logger = logging.getLogger("vault.token_store")
-
-
-# =============================================================================
-# Data Classes
-# =============================================================================
-
-
-@dataclass
-class Role:
-    """Role definition with scope, top_k, and rate limit."""
-
-    name: str
-    scope: list[str]
-    top_k: int
-    rate_limit: str  # e.g. "30/60s"
-
-    @property
-    def rate_limit_parsed(self) -> tuple[int, int]:
-        """Parse rate_limit string into (max_requests, window_seconds)."""
-        parts = self.rate_limit.replace("s", "").split("/")
-        return int(parts[0]), int(parts[1])
-
-
-@dataclass
-class Token:
-    """Per-user token with role assignment and expiry."""
-
-    user: str
-    token: str
-    role: str
-    issued_at: str  # ISO date, e.g. "2026-03-20"
-    expires: str | None = None  # ISO date or None (never expires)
-
-    @property
-    def is_expired(self) -> bool:
-        if self.expires is None:
-            return False
-        return datetime.date.fromisoformat(self.expires) < datetime.date.today()
-
-
-# =============================================================================
-# Custom Exceptions (inherit ValueError for backward compat with gRPC handlers)
-# =============================================================================
-
-
-class TokenNotFoundError(ValueError):
-    """Token not found in store."""
-
-    def __init__(self):
-        super().__init__("Invalid authentication token")
-
-
-class TokenExpiredError(ValueError):
-    """Token has expired."""
-
-    def __init__(self, username: str):
-        self.username = username
-        super().__init__(f"Token expired for user '{username}'")
-
-
-class RateLimitError(ValueError):
-    """Rate limit exceeded."""
-
-    def __init__(self, retry_after: int):
-        self.retry_after = retry_after
-        super().__init__(f"Rate limit exceeded. Retry after {retry_after}s")
-
-
-class TopKExceededError(ValueError):
-    """Requested top_k exceeds role limit."""
-
-    def __init__(self, requested: int, max_top_k: int, role_name: str):
-        self.requested = requested
-        self.max_top_k = max_top_k
-        super().__init__(f"top_k {requested} exceeds limit {max_top_k} for role '{role_name}'")
-
-
-class ScopeError(ValueError):
-    """Method not permitted for role."""
-
-    def __init__(self, method: str, role_name: str):
-        self.method = method
-        super().__init__(f"Method '{method}' not permitted for role '{role_name}'")
-
-
-# =============================================================================
-# Rate Limiter (moved from vault_core.py)
-# =============================================================================
-
-
-class RateLimiter:
-    """Simple sliding window rate limiter."""
-
-    def __init__(self, max_requests: int = 30, window_seconds: int = 60):
-        self.max_requests = max_requests
-        self.window_seconds = window_seconds
-        self._requests: dict[str, list[float]] = defaultdict(list)
-        self._lock = threading.Lock()
-
-    def is_allowed(self, client_id: str) -> bool:
-        """Check if request is allowed and record it."""
-        now = time.time()
-        with self._lock:
-            self._requests[client_id] = [
-                t for t in self._requests[client_id] if now - t < self.window_seconds
-            ]
-            if len(self._requests[client_id]) >= self.max_requests:
-                return False
-            self._requests[client_id].append(now)
-            return True
-
-    def get_retry_after(self, client_id: str) -> int:
-        """Returns seconds until next request is allowed."""
-        with self._lock:
-            if not self._requests[client_id]:
-                return 0
-            oldest = min(self._requests[client_id])
-            return max(0, int(self.window_seconds - (time.time() - oldest)))
-
-    def remove(self, client_id: str):
-        """Remove a client's rate limit tracking."""
-        with self._lock:
-            self._requests.pop(client_id, None)
-
-
-# =============================================================================
-# Default Roles
-# =============================================================================
-
-DEFAULT_ROLES = {
-    "admin": Role(
-        "admin",
-        ["get_public_key", "decrypt_scores", "decrypt_metadata", "manage_tokens"],
-        50,
-        "150/60s",
-    ),
-    "member": Role(
-        "member",
-        ["get_public_key", "decrypt_scores", "decrypt_metadata"],
-        10,
-        "30/60s",
-    ),
-}
-
-DEFAULT_ROLE_NAMES = frozenset(DEFAULT_ROLES.keys())
-
-DEMO_TOKEN = "evt_0000000000000000000000000000demo"
-
-
-# =============================================================================
-# Token Store
-# =============================================================================
-
-
-class TokenStore:
-    """Thread-safe in-memory store for tokens and roles with async YAML persistence."""
-
-    def __init__(self):
-        self._lock = threading.RLock()
-        self._tokens: dict[str, Token] = {}  # keyed by token string
-        self._tokens_by_user: dict[str, Token] = {}  # keyed by username
-        self._roles: dict[str, Role] = {}
-        self._rate_limiters: dict[str, RateLimiter] = {}  # keyed by username
-        self._roles_path: str | None = None
-        self._tokens_path: str | None = None
-        self._persist_executor = ThreadPoolExecutor(max_workers=1)
-
-    # ── Loaders ──────────────────────────────────────────────────────────
-
-    def load_from_files(self, roles_path: str, tokens_path: str):
-        """Load roles and tokens from YAML config files at startup."""
-        with self._lock:
-            self._roles_path = roles_path
-            self._tokens_path = tokens_path
-
-            # Load roles
-            if os.path.exists(roles_path):
-                with open(roles_path) as f:
-                    data = yaml.safe_load(f) or {}
-                for name, cfg in data.get("roles", {}).items():
-                    self._roles[name] = Role(
-                        name=name,
-                        scope=cfg.get("scope", []),
-                        top_k=cfg.get("top_k", 5),
-                        rate_limit=cfg.get("rate_limit", "30/60s"),
-                    )
-                logger.info("Loaded %d roles from %s", len(self._roles), roles_path)
-            else:
-                self._roles = dict(DEFAULT_ROLES)
-                logger.info("No roles file found, using defaults")
-
-            # Ensure default roles always exist
-            for name, role in DEFAULT_ROLES.items():
-                if name not in self._roles:
-                    self._roles[name] = role
-
-            # Load tokens
-            if os.path.exists(tokens_path):
-                with open(tokens_path) as f:
-                    data = yaml.safe_load(f) or {}
-                for entry in data.get("tokens", []):
-                    tok = Token(
-                        user=entry["user"],
-                        token=entry["token"],
-                        role=entry["role"],
-                        issued_at=entry.get("issued_at") or entry.get("created", ""),
-                        expires=entry.get("expires"),
-                    )
-                    self._tokens[tok.token] = tok
-                    self._tokens_by_user[tok.user] = tok
-                logger.info("Loaded %d tokens from %s", len(self._tokens), tokens_path)
-
-        # Auto-generate default config files if they don't exist
-        if not os.path.exists(roles_path) or not os.path.exists(tokens_path):
-            self._schedule_persist()
-
-    def load_legacy_env(self, env_tokens: str):
-        """Backward compat: load comma-separated VAULT_TOKENS as legacy tokens."""
-        with self._lock:
-            self._roles = dict(DEFAULT_ROLES)
-            tokens = [t.strip() for t in env_tokens.split(",") if t.strip()]
-            for i, token_str in enumerate(tokens):
-                user = f"legacy_{i}"
-                tok = Token(
-                    user=user,
-                    token=token_str,
-                    role="admin",
-                    issued_at=datetime.date.today().isoformat(),
-                    expires=None,
-                )
-                self._tokens[tok.token] = tok
-                self._tokens_by_user[tok.user] = tok
-            logger.info("Loaded %d legacy tokens from env var", len(tokens))
-
-    def load_defaults_with_demo_token(self):
-        """Demo mode: load default roles and demo token."""
-        with self._lock:
-            self._roles = dict(DEFAULT_ROLES)
-            tok = Token(
-                user="demo",
-                token=DEMO_TOKEN,
-                role="admin",
-                issued_at=datetime.date.today().isoformat(),
-                expires=None,
-            )
-            self._tokens[tok.token] = tok
-            self._tokens_by_user[tok.user] = tok
-            logger.warning("Demo mode active with demo token")
-
-    # ── Validation ───────────────────────────────────────────────────────
-
-    def validate(self, token_str: str) -> tuple[str, Role]:
-        """
-        Validate a token string.
-
-        Returns (username, Role) on success.
-        Raises TokenNotFoundError, TokenExpiredError, or RateLimitError on failure.
-        """
-        with self._lock:
-            tok = self._tokens.get(token_str)
-            if tok is None:
-                raise TokenNotFoundError()
-
-            if tok.is_expired:
-                raise TokenExpiredError(tok.user)
-
-            role = self._roles.get(tok.role)
-            if role is None:
-                raise TokenNotFoundError()
-
-            # Per-user rate limiting with role-specific limits
-            limiter = self._get_or_create_limiter(tok.user, role)
-
-        # Rate limit check outside the main lock (limiter has its own lock)
-        if not limiter.is_allowed(tok.user):
-            retry_after = limiter.get_retry_after(tok.user)
-            raise RateLimitError(retry_after)
-
-        return tok.user, role
-
-    def get_username(self, token_str: str) -> str | None:
-        """Look up username for a token without side effects."""
-        with self._lock:
-            tok = self._tokens.get(token_str)
-            return tok.user if tok else None
-
-    def check_scope(self, role: Role, method_name: str):
-        """Check if a method is permitted for the given role."""
-        if method_name not in role.scope:
-            raise ScopeError(method_name, role.name)
-
-    def _get_or_create_limiter(self, username: str, role: Role) -> RateLimiter:
-        """Get or lazily create a rate limiter for a user with role-specific limits."""
-        # Must be called under self._lock
-        limiter = self._rate_limiters.get(username)
-        if limiter is None:
-            max_req, window = role.rate_limit_parsed
-            limiter = RateLimiter(max_requests=max_req, window_seconds=window)
-            self._rate_limiters[username] = limiter
-        return limiter
-
-    # ── Token CRUD ───────────────────────────────────────────────────────
-
-    def add_token(self, user: str, role: str, expires_days: int | None = None) -> Token:
-        """Issue a new token for a user."""
-        with self._lock:
-            if role not in self._roles:
-                raise ValueError(f"Role '{role}' does not exist")
-            if user in self._tokens_by_user:
-                raise ValueError(f"Token already exists for user '{user}'")
-
-            token_str = f"evt_{secrets.token_hex(16)}"
-            today = datetime.date.today()
-            expires = None
-            if expires_days is not None:
-                expires = (today + datetime.timedelta(days=expires_days)).isoformat()
-
-            tok = Token(
-                user=user,
-                token=token_str,
-                role=role,
-                issued_at=today.isoformat(),
-                expires=expires,
-            )
-            self._tokens[tok.token] = tok
-            self._tokens_by_user[tok.user] = tok
-
-        self._schedule_persist()
-        return tok
-
-    def revoke_token(self, user: str) -> bool:
-        """Revoke a user's token. Returns True if token was found and revoked."""
-        with self._lock:
-            tok = self._tokens_by_user.pop(user, None)
-            if tok is None:
-                return False
-            self._tokens.pop(tok.token, None)
-            # Clean up rate limiter
-            limiter = self._rate_limiters.pop(user, None)
-            if limiter:
-                limiter.remove(user)
-
-        self._schedule_persist()
-        return True
-
-    def rotate_token(self, user: str) -> Token:
-        """Atomically revoke old token and issue a new one for the same user/role."""
-        with self._lock:
-            old_tok = self._tokens_by_user.get(user)
-            if old_tok is None:
-                raise ValueError(f"No token found for user '{user}'")
-
-            old_role = old_tok.role
-            # Preserve original expiry duration
-            expires_days = None
-            if old_tok.expires:
-                issued_date = datetime.date.fromisoformat(old_tok.issued_at)
-                expires_date = datetime.date.fromisoformat(old_tok.expires)
-                expires_days = (expires_date - issued_date).days
-
-            # Revoke old (inline, within same lock)
-            self._tokens.pop(old_tok.token, None)
-            del self._tokens_by_user[user]
-            limiter = self._rate_limiters.pop(user, None)
-            if limiter:
-                limiter.remove(user)
-
-            # Issue new
-            token_str = f"evt_{secrets.token_hex(16)}"
-            today = datetime.date.today()
-            expires = None
-            if expires_days is not None:
-                expires = (today + datetime.timedelta(days=expires_days)).isoformat()
-
-            new_tok = Token(
-                user=user,
-                token=token_str,
-                role=old_role,
-                issued_at=today.isoformat(),
-                expires=expires,
-            )
-            self._tokens[new_tok.token] = new_tok
-            self._tokens_by_user[user] = new_tok
-
-        self._schedule_persist()
-        logger.info("Rotated token for user '%s'", user)
-        return new_tok
-
-    def rotate_all_tokens(self) -> list[Token]:
-        """Rotate all tokens. Each rotation is individually atomic."""
-        with self._lock:
-            users = list(self._tokens_by_user.keys())
-        results = []
-        for user in users:
-            results.append(self.rotate_token(user))
-        return results
-
-    def list_tokens(self) -> list[dict]:
-        """List all tokens (token values truncated for security)."""
-        with self._lock:
-            result = []
-            for tok in self._tokens_by_user.values():
-                role = self._roles.get(tok.role)
-                result.append(
-                    {
-                        "user": tok.user,
-                        "role": tok.role,
-                        "top_k": role.top_k if role else "?",
-                        "rate_limit": role.rate_limit if role else "?",
-                        "expires": tok.expires or "never",
-                    }
-                )
-            return result
-
-    # ── Role CRUD ────────────────────────────────────────────────────────
-
-    @staticmethod
-    def _validate_rate_limit(rate_limit: str):
-        """Validate rate_limit format (e.g. '30/60s')."""
-        import re
-
-        if not re.fullmatch(r"\d+/\d+s", rate_limit):
-            raise ValueError(
-                f"Invalid rate_limit format '{rate_limit}'."
-                " Expected '<max>/<window>s' (e.g. '30/60s')"
-            )
-
-    def add_role(self, name: str, scope: list[str], top_k: int, rate_limit: str) -> Role:
-        """Create a new role."""
-        self._validate_rate_limit(rate_limit)
-        with self._lock:
-            if name in self._roles:
-                raise ValueError(f"Role '{name}' already exists")
-            role = Role(name=name, scope=scope, top_k=top_k, rate_limit=rate_limit)
-            self._roles[name] = role
-
-        self._schedule_persist()
-        return role
-
-    def update_role(self, name: str, **kwargs) -> Role:
-        """Update an existing role. Accepts scope, top_k, rate_limit kwargs."""
-        if "rate_limit" in kwargs:
-            self._validate_rate_limit(kwargs["rate_limit"])
-        with self._lock:
-            role = self._roles.get(name)
-            if role is None:
-                raise ValueError(f"Role '{name}' does not exist")
-
-            if "scope" in kwargs:
-                role.scope = kwargs["scope"]
-            if "top_k" in kwargs:
-                role.top_k = kwargs["top_k"]
-            if "rate_limit" in kwargs:
-                role.rate_limit = kwargs["rate_limit"]
-                # Clear rate limiters for affected users so they pick up new limits
-                for tok in self._tokens_by_user.values():
-                    if tok.role == name and tok.user in self._rate_limiters:
-                        del self._rate_limiters[tok.user]
-
-        self._schedule_persist()
-        return role
-
-    def delete_role(self, name: str):
-        """Delete a role. Rejects deletion of default roles."""
-        with self._lock:
-            if name in DEFAULT_ROLE_NAMES:
-                raise ValueError(f"Cannot delete default role '{name}'")
-            if name not in self._roles:
-                raise ValueError(f"Role '{name}' does not exist")
-
-            # Check if any tokens reference this role
-            for tok in self._tokens_by_user.values():
-                if tok.role == name:
-                    raise ValueError(
-                        f"Cannot delete role '{name}': "
-                        f"token for user '{tok.user}' is assigned to it"
-                    )
-
-            del self._roles[name]
-
-        self._schedule_persist()
-
-    def list_roles(self) -> list[dict]:
-        """List all roles."""
-        with self._lock:
-            return [
-                {
-                    "name": r.name,
-                    "scope": r.scope,
-                    "top_k": r.top_k,
-                    "rate_limit": r.rate_limit,
-                }
-                for r in self._roles.values()
-            ]
-
-    # ── Persistence ──────────────────────────────────────────────────────
-
-    def _schedule_persist(self):
-        """Schedule async persistence to YAML files."""
-        if self._roles_path is None or self._tokens_path is None:
-            return  # No file paths configured (legacy/demo mode)
-        self._persist_executor.submit(self._do_persist)
-
-    def _do_persist(self):
-        """Atomically write current state to YAML files."""
-        try:
-            time.sleep(0.1)  # Debounce rapid changes
-
-            with self._lock:
-                roles_data = {
-                    "roles": {
-                        r.name: {
-                            "scope": r.scope,
-                            "top_k": r.top_k,
-                            "rate_limit": r.rate_limit,
-                        }
-                        for r in self._roles.values()
-                    }
-                }
-                tokens_data = {
-                    "tokens": [
-                        {
-                            "user": t.user,
-                            "token": t.token,
-                            "role": t.role,
-                            "issued_at": t.issued_at,
-                            **({"expires": t.expires} if t.expires else {}),
-                        }
-                        for t in self._tokens_by_user.values()
-                    ]
-                }
-
-            # Atomic writes: temp file + os.replace
-            if self._roles_path:
-                self._atomic_write(self._roles_path, roles_data)
-            if self._tokens_path:
-                self._atomic_write(self._tokens_path, tokens_data)
-
-            logger.debug("Persisted token/role state to YAML")
-        except Exception:
-            logger.exception("Failed to persist token/role state")
-
-    @staticmethod
-    def _atomic_write(path: str, data: dict):
-        """Write data to a file atomically via temp file + os.replace."""
-        dir_name = os.path.dirname(path) or "."
-        os.makedirs(dir_name, exist_ok=True)
-        fd, tmp_path = tempfile.mkstemp(dir=dir_name, suffix=".tmp")
-        try:
-            with os.fdopen(fd, "w") as f:
-                yaml.safe_dump(data, f, default_flow_style=False, sort_keys=False)
-            os.replace(tmp_path, path)
-        except Exception:
-            os.unlink(tmp_path)
-            raise
-
-
-# Module-level singleton
-token_store = TokenStore()
diff --git a/vault/validation_interceptor.py b/vault/validation_interceptor.py
deleted file mode 100644
index 4ed6ddf..0000000
--- a/vault/validation_interceptor.py
+++ /dev/null
@@ -1,65 +0,0 @@
-"""
-gRPC server interceptor that validates request fields before processing.
-
-Runs two validation layers:
-  1. protovalidate — enforces .proto annotation constraints
-  2. Runtime checks — control chars, whitespace (not expressible in proto)
-
-Rejects malformed requests with INVALID_ARGUMENT before they reach
-VaultServiceServicer methods. Non-vault methods (health, reflection)
-pass through untouched.
-"""
-
-import logging
-
-import grpc
-import protovalidate
-from request_validator import (
-    RUNTIME_CHECKS,
-    RuntimeValidationError,
-    validate_proto,
-)
-
-logger = logging.getLogger("rune.vault.validation")
-
-
-class ValidationInterceptor(grpc.ServerInterceptor):
-    """Intercepts unary-unary gRPC calls to validate request fields."""
-
-    def intercept_service(self, continuation, handler_call_details):
-        method = handler_call_details.method
-        next_handler = continuation(handler_call_details)
-
-        if next_handler is None:
-            return None
-
-        runtime_check = RUNTIME_CHECKS.get(method)
-        if runtime_check is None:
-            return next_handler
-
-        original_handler = next_handler.unary_unary
-        if original_handler is None:
-            return next_handler
-
-        def validating_handler(request, context):
-            try:
-                # Layer 1: proto annotation constraints
-                validate_proto(request)
-                # Layer 2: supplementary runtime checks
-                runtime_check(request)
-            except protovalidate.ValidationError as exc:
-                msg = "; ".join(f"{v.proto.field}: {v.proto.message}" for v in exc.violations)
-                logger.warning("Validation rejected %s: %s", method, msg)
-                context.abort(grpc.StatusCode.INVALID_ARGUMENT, msg)
-                return None
-            except RuntimeValidationError as exc:
-                logger.warning("Validation rejected %s: %s", method, exc)
-                context.abort(grpc.StatusCode.INVALID_ARGUMENT, str(exc))
-                return None
-            return original_handler(request, context)
-
-        return grpc.unary_unary_rpc_method_handler(
-            validating_handler,
-            request_deserializer=next_handler.request_deserializer,
-            response_serializer=next_handler.response_serializer,
-        )
diff --git a/vault/vault_admin_cli.py b/vault/vault_admin_cli.py
deleted file mode 100644
index 5f206af..0000000
--- a/vault/vault_admin_cli.py
+++ /dev/null
@@ -1,250 +0,0 @@
-#!/usr/bin/env python3
-"""
-Vault Admin CLI — manages per-user tokens and roles.
-
-Usage (via docker exec or runevault alias):
-    runevault token issue --user alice --role member --expires 90d
-    runevault token revoke --user alice
-    runevault token list
-    runevault role list
-    runevault role create --name researcher \\
-        --scope get_public_key,decrypt_scores --top-k 3 --rate-limit 10/60s
-    runevault role update --name member --top-k 8
-    runevault role delete --name researcher
-"""
-
-import argparse
-import http.client
-import json
-import re
-import sys
-
-ADMIN_HOST = "127.0.0.1"
-ADMIN_PORT = 8081
-
-
-def _request(method: str, path: str, body: dict | None = None) -> dict:
-    """Send an HTTP request to the admin server and return parsed JSON."""
-    conn = http.client.HTTPConnection(ADMIN_HOST, ADMIN_PORT)
-    headers = {"Content-Type": "application/json"} if body else {}
-    data = json.dumps(body).encode() if body else None
-    try:
-        conn.request(method, path, body=data, headers=headers)
-        resp = conn.getresponse()
-        result = json.loads(resp.read().decode())
-        if resp.status >= 400:
-            print(f"Error: {result.get('error', 'Unknown error')}", file=sys.stderr)
-            sys.exit(1)
-        return result
-    except ConnectionRefusedError:
-        print("Error: Cannot connect to admin server. Is Vault running?", file=sys.stderr)
-        sys.exit(1)
-    finally:
-        conn.close()
-
-
-# ── Token commands ───────────────────────────────────────────────────────
-
-
-def _parse_duration(value: str) -> int:
-    """Parse duration string like '90d', '12w', '6m' into days."""
-    m = re.fullmatch(r"(\d+)([dwm])", value)
-    if not m:
-        print(
-            f"Error: Invalid duration '{value}'. Use <number><d|w|m> (e.g. 90d, 12w, 6m)",
-            file=sys.stderr,
-        )
-        sys.exit(1)
-    n, unit = int(m.group(1)), m.group(2)
-    if unit == "d":
-        return n
-    if unit == "w":
-        return n * 7
-    return n * 30  # 'm' approximation
-
-
-def cmd_token_issue(args):
-    body = {"user": args.user, "role": args.role}
-    if args.expires is not None:
-        body["expires_days"] = _parse_duration(args.expires)
-    result = _request("POST", "/tokens", body)
-    print(f"\nToken issued for '{result['user']}':")
-    print(f"  Role:    {result['role']}")
-    print(f"  Expires: {result['expires']}")
-    print(f"\n  Token: {result['token']}")
-    print("\n  WARNING: This token will NOT be shown again. Share it securely.")
-
-
-def cmd_token_revoke(args):
-    result = _request("DELETE", f"/tokens/{args.user}")
-    print(result["message"])
-
-
-def cmd_token_rotate(args):
-    if args.rotate_all:
-        result = _request("POST", "/tokens/_rotate_all", {})
-        count = result["rotated"]
-        if count == 0:
-            print("No tokens to rotate.")
-            return
-        print(f"Rotated {count} token(s):\n")
-        for t in result["tokens"]:
-            print(f"  {t['user']}: {t['token']}")
-        print("\n  WARNING: These tokens will NOT be shown again. Share them securely.")
-    else:
-        result = _request("POST", f"/tokens/{args.user}/rotate", {})
-        print(f"\nToken rotated for '{result['user']}':")
-        print(f"  Role:    {result['role']}")
-        print(f"  Expires: {result['expires']}")
-        print(f"\n  Token: {result['token']}")
-        print("\n  WARNING: This token will NOT be shown again. Share it securely.")
-
-
-def cmd_token_list(args):
-    result = _request("GET", "/tokens")
-    tokens = result.get("tokens", [])
-    if not tokens:
-        print("No tokens issued.")
-        return
-    # Table header
-    fmt = "{:<16} {:<10} {:>6} {:>10}  {:<12}"
-    print(fmt.format("USER", "ROLE", "TOP_K", "RATE", "EXPIRES"))
-    for t in tokens:
-        print(
-            fmt.format(
-                t["user"],
-                t["role"],
-                str(t["top_k"]),
-                str(t["rate_limit"]),
-                t["expires"],
-            )
-        )
-
-
-# ── Role commands ────────────────────────────────────────────────────────
-
-
-def cmd_role_list(args):
-    result = _request("GET", "/roles")
-    roles = result.get("roles", [])
-    if not roles:
-        print("No roles defined.")
-        return
-    fmt = "{:<12} {:<50} {:>6} {:>10}"
-    print(fmt.format("ROLE", "SCOPE", "TOP_K", "RATE"))
-    for r in roles:
-        scope_str = ",".join(r["scope"])
-        print(fmt.format(r["name"], scope_str, str(r["top_k"]), r["rate_limit"]))
-
-
-def cmd_role_create(args):
-    scope = [s.strip() for s in args.scope.split(",")]
-    body = {
-        "name": args.name,
-        "scope": scope,
-        "top_k": args.top_k,
-        "rate_limit": args.rate_limit,
-    }
-    _request("POST", "/roles", body)
-    print(f"Role '{args.name}' created.")
-
-
-def cmd_role_update(args):
-    body = {}
-    if args.scope is not None:
-        body["scope"] = [s.strip() for s in args.scope.split(",")]
-    if args.top_k is not None:
-        body["top_k"] = args.top_k
-    if args.rate_limit is not None:
-        body["rate_limit"] = args.rate_limit
-    if not body:
-        print("Error: No fields to update.", file=sys.stderr)
-        sys.exit(1)
-    _request("PUT", f"/roles/{args.name}", body)
-    print(
-        f"Role '{args.name}' updated."
-        " Changes take effect immediately for all tokens with this role."
-    )
-
-
-def cmd_role_delete(args):
-    _request("DELETE", f"/roles/{args.name}")
-    print(f"Role '{args.name}' deleted.")
-
-
-# ── Argument parsing ─────────────────────────────────────────────────────
-
-
-def build_parser() -> argparse.ArgumentParser:
-    parser = argparse.ArgumentParser(
-        prog="runevault",
-        description="Rune-Vault Admin CLI",
-    )
-    sub = parser.add_subparsers(dest="resource", required=True)
-
-    # ── token ──
-    token_parser = sub.add_parser("token", help="Manage per-user tokens")
-    token_sub = token_parser.add_subparsers(dest="action", required=True)
-
-    issue_p = token_sub.add_parser("issue", help="Issue a new token")
-    issue_p.add_argument("--user", required=True, help="Username")
-    issue_p.add_argument("--role", required=True, help="Role name")
-    issue_p.add_argument(
-        "--expires", default=None, help="Duration until expiry (e.g. 90d, 12w, 6m)"
-    )
-    issue_p.set_defaults(func=cmd_token_issue)
-
-    revoke_p = token_sub.add_parser("revoke", help="Revoke a user's token")
-    revoke_p.add_argument("--user", required=True, help="Username")
-    revoke_p.set_defaults(func=cmd_token_revoke)
-
-    rotate_p = token_sub.add_parser("rotate", help="Rotate a token (revoke + reissue)")
-    rotate_group = rotate_p.add_mutually_exclusive_group(required=True)
-    rotate_group.add_argument("--user", help="Username to rotate")
-    rotate_group.add_argument(
-        "--all", action="store_true", dest="rotate_all", help="Rotate all tokens"
-    )
-    rotate_p.set_defaults(func=cmd_token_rotate)
-
-    list_p = token_sub.add_parser("list", help="List all tokens")
-    list_p.set_defaults(func=cmd_token_list)
-
-    # ── role ──
-    role_parser = sub.add_parser("role", help="Manage roles")
-    role_sub = role_parser.add_subparsers(dest="action", required=True)
-
-    rlist_p = role_sub.add_parser("list", help="List all roles")
-    rlist_p.set_defaults(func=cmd_role_list)
-
-    create_p = role_sub.add_parser("create", help="Create a new role")
-    create_p.add_argument("--name", required=True, help="Role name")
-    create_p.add_argument("--scope", required=True, help="Comma-separated scope list")
-    create_p.add_argument("--top-k", type=int, required=True, help="Max top_k")
-    create_p.add_argument("--rate-limit", required=True, help="Rate limit (e.g. 30/60s)")
-    create_p.set_defaults(func=cmd_role_create)
-
-    update_p = role_sub.add_parser("update", help="Update a role")
-    update_p.add_argument("--name", required=True, help="Role name")
-    update_p.add_argument("--scope", default=None, help="Comma-separated scope list")
-    update_p.add_argument("--top-k", type=int, default=None, help="Max top_k")
-    update_p.add_argument("--rate-limit", default=None, help="Rate limit (e.g. 30/60s)")
-    update_p.set_defaults(func=cmd_role_update)
-
-    delete_p = role_sub.add_parser("delete", help="Delete a role")
-    delete_p.add_argument("--name", required=True, help="Role name")
-    delete_p.set_defaults(func=cmd_role_delete)
-
-    return parser
-
-
-def main():
-    parser = build_parser()
-    args = parser.parse_args()
-    if hasattr(args, "func"):
-        args.func(args)
-    else:
-        parser.print_help()
-
-
-if __name__ == "__main__":
-    main()
diff --git a/vault/vault_core.py b/vault/vault_core.py
deleted file mode 100644
index 3556abc..0000000
--- a/vault/vault_core.py
+++ /dev/null
@@ -1,326 +0,0 @@
-"""
-Rune-Vault Core Business Logic
-
-Pure business logic for FHE key management, authentication, and decryption.
-No transport layer (MCP, gRPC) — consumed by vault_grpc_server.py.
-"""
-
-import base64
-import hashlib
-import heapq
-import json
-import logging
-import os
-
-from cryptography.hazmat.primitives import hashes
-from cryptography.hazmat.primitives.kdf.hkdf import HKDF
-from pyenvector.crypto import Cipher, KeyGenerator
-from pyenvector.crypto.block import CipherBlock
-from pyenvector.utils.aes import decrypt_metadata as aes_decrypt_metadata
-
-try:
-    from pyenvector.proto_gen.v2.common.type_pb2 import CiphertextScore
-except ModuleNotFoundError:
-    from pyenvector.proto_gen.type_pb2 import CiphertextScore
-
-logger = logging.getLogger("rune.vault")
-
-# Configuration
-KEY_DIR = "vault_keys"
-KEY_ID = "vault-key"
-DIM = 1024  # FHE cipher supports up to 2^12, using 1024 for production
-
-# ev.init() resolves key files as {KEY_DIR}/{KEY_ID}/EncKey.json
-KEY_SUBDIR = os.path.join(KEY_DIR, KEY_ID)
-
-# enVector Cloud configuration
-ENVECTOR_ENDPOINT = os.getenv("ENVECTOR_ENDPOINT", "").strip() or None
-ENVECTOR_API_KEY = os.getenv("ENVECTOR_API_KEY", "").strip() or None
-EMBEDDING_DIM = int(os.getenv("EMBEDDING_DIM", "1024"))
-
-# Team index name (set by admin, distributed to all team members via get_public_key)
-VAULT_INDEX_NAME = os.getenv("VAULT_INDEX_NAME", "").strip() or None
-
-
-def ensure_vault():
-    """
-    One-shot startup:
-    1. Generate local FHE keys if not present (KeyGenerator)
-    2. Connect to enVector Cloud with auto_key_setup=True
-       (SDK handles key registration → loading)
-    3. Create the team index if it doesn't exist
-    """
-    import pyenvector as ev
-
-    # Phase 1: local key generation
-    enc_key = os.path.join(KEY_SUBDIR, "EncKey.json")
-    if not os.path.exists(enc_key):
-        logger.info(f"Generating keys in {KEY_SUBDIR}...")
-        os.makedirs(KEY_SUBDIR, exist_ok=True)
-        keygen = KeyGenerator(
-            key_path=KEY_SUBDIR, key_id=KEY_ID, dim_list=[DIM], metadata_encryption=False
-        )
-        keygen.generate_keys()
-    else:
-        logger.info(f"Keys found in {KEY_SUBDIR}")
-
-    # Phase 2: connect to enVector Cloud and register key
-    if not ENVECTOR_ENDPOINT or not ENVECTOR_API_KEY:
-        logger.warning("ENVECTOR_ENDPOINT/ENVECTOR_API_KEY not set — offline mode, no team index.")
-        return
-
-    logger.info(f"Connecting to enVector Cloud ({ENVECTOR_ENDPOINT})...")
-    try:
-        ev.init(
-            address=ENVECTOR_ENDPOINT,
-            key_path=KEY_DIR,
-            key_id=KEY_ID,
-            dim=EMBEDDING_DIM,
-            eval_mode="rmp",
-            auto_key_setup=True,
-            access_token=ENVECTOR_API_KEY,
-            query_encryption="plain",
-        )
-        logger.info("Key registered on enVector Cloud (auto_key_setup).")
-    except Exception as e:
-        logger.warning(f"auto_key_setup failed (key may already be registered): {e}")
-        logger.info("Retrying with auto_key_setup=False...")
-        ev.init(
-            address=ENVECTOR_ENDPOINT,
-            key_path=KEY_DIR,
-            key_id=KEY_ID,
-            dim=EMBEDDING_DIM,
-            eval_mode="rmp",
-            auto_key_setup=False,
-            access_token=ENVECTOR_API_KEY,
-            query_encryption="plain",
-        )
-        logger.info("Connected to enVector Cloud (auto_key_setup=False).")
-
-    # Phase 3: ensure team index
-    if not VAULT_INDEX_NAME:
-        return
-
-    try:
-        existing = ev.get_index_list()
-        existing_names = []
-        if hasattr(existing, "indexes"):
-            existing_names = [idx.index_name for idx in existing.indexes]
-        elif isinstance(existing, (list, tuple)):
-            existing_names = [str(idx) for idx in existing]
-
-        if VAULT_INDEX_NAME in existing_names:
-            logger.info(f"Team index '{VAULT_INDEX_NAME}' already exists.")
-        else:
-            ev.create_index(
-                index_name=VAULT_INDEX_NAME,
-                dim=EMBEDDING_DIM,
-                index_params={"index_type": "FLAT"},
-                query_encryption="plain",
-                metadata_encryption=False,
-                # workaround: skip deepcopy metadata_key property access (pyenvector#247)
-                metadata_key=b"",
-            )
-            logger.info(f"Created team index '{VAULT_INDEX_NAME}' (dim={EMBEDDING_DIM}).")
-    except Exception as e:
-        logger.error(f"Failed to ensure team index: {e}", exc_info=True)
-
-
-ensure_vault()
-enc_key_path = os.path.join(KEY_SUBDIR, "EncKey.json")
-sec_key_path = os.path.join(KEY_SUBDIR, "SecKey.json")
-
-# Initialize shared Cipher instance
-cipher = Cipher(enc_key_path=enc_key_path, dim=DIM)
-
-
-# =============================================================================
-# Per-Agent Metadata Key Derivation (HKDF-SHA256)
-# =============================================================================
-def derive_agent_key(team_secret: str, agent_id: str) -> bytes:
-    """Derive a 32-byte AES-256 DEK for a specific agent via HKDF-SHA256.
-
-    Args:
-        team_secret: Team-wide master secret (VAULT_TEAM_SECRET).
-        agent_id: Per-user agent identifier derived from token.
-
-    Returns:
-        32-byte AES-256 key.
-    """
-    hkdf = HKDF(
-        algorithm=hashes.SHA256(),
-        length=32,
-        salt=None,
-        info=agent_id.encode("utf-8"),
-    )
-    return hkdf.derive(team_secret.encode("utf-8"))
-
-
-# =============================================================================
-# Authorization (per-user token auth via TokenStore)
-# =============================================================================
-from token_store import (  # noqa: E402 — must import after ensure_vault()
-    TopKExceededError,
-    token_store,
-)
-
-# Team secret for DEK derivation (shared across all users)
-VAULT_TEAM_SECRET = (
-    os.getenv("VAULT_TEAM_SECRET", "").strip() or os.getenv("VAULT_TOKENS", "").strip()
-)
-
-# Load token/role configuration (priority: files > env var > demo)
-_roles_path = os.getenv("VAULT_ROLES_FILE", "/app/config/vault-roles.yml")
-_tokens_path = os.getenv("VAULT_TOKENS_FILE", "/app/config/vault-tokens.yml")
-
-if os.path.exists(_roles_path) or os.path.exists(_tokens_path):
-    token_store.load_from_files(_roles_path, _tokens_path)
-    logger.info("Per-user token auth loaded from config files")
-elif VAULT_TEAM_SECRET:
-    token_store.load_legacy_env(VAULT_TEAM_SECRET)
-    logger.warning("Legacy single-token mode. Migrate to per-user tokens via runevault CLI.")
-else:
-    token_store.load_defaults_with_demo_token()
-    logger.warning("Demo mode. Set VAULT_TEAM_SECRET for production.")
-
-
-def validate_token(token: str) -> tuple[str, object]:
-    """Validate per-user token. Returns (username, Role)."""
-    return token_store.validate(token)
-
-
-# =============================================================================
-# Core Business Logic
-# =============================================================================
-def _get_public_key_impl(token: str) -> str:
-    """
-    Core implementation: Returns the public key bundle.
-
-    Args:
-        token: Authentication token issued by Vault Admin.
-
-    Returns:
-        JSON string containing EncKey, EvalKey.
-    """
-    username, role = validate_token(token)
-    token_store.check_scope(role, "get_public_key")
-
-    bundle = {}
-    for filename in ["EncKey.json", "EvalKey.json"]:
-        path = os.path.join(KEY_SUBDIR, filename)
-        if os.path.exists(path):
-            with open(path, "r") as f:
-                bundle[filename] = f.read()
-        else:
-            # Should not happen if ensure_vault ran
-            pass
-
-    # Include team index name and key_id so clients discover them dynamically
-    if VAULT_INDEX_NAME:
-        bundle["index_name"] = VAULT_INDEX_NAME
-    bundle["key_id"] = KEY_ID
-
-    # Per-user metadata DEK: derived from VAULT_TEAM_SECRET + token-based agent_id
-    agent_id = hashlib.sha256(token.encode("utf-8")).hexdigest()[:32]
-    agent_dek = derive_agent_key(VAULT_TEAM_SECRET, agent_id)
-    bundle["agent_id"] = agent_id
-    bundle["agent_dek"] = base64.b64encode(agent_dek).decode("ascii")
-
-    # enVector Cloud credentials — agents receive these from Vault instead of user input
-    bundle["envector_endpoint"] = ENVECTOR_ENDPOINT
-    bundle["envector_api_key"] = ENVECTOR_API_KEY
-
-    return json.dumps(bundle)
-
-
-def _decrypt_scores_impl(token: str, encrypted_blob_b64: str, top_k: int = 5) -> str:
-    """
-    Core implementation: Decrypts CiphertextScore and applies Top-K filtering.
-
-    The blob is a protobuf-serialized CiphertextScore produced by Index.scoring().
-    cipher.decrypt_score() returns {"score": [[s0, s1, ...], ...], "shard_idx": [...]},
-    where each inner list corresponds to a shard (IVF) or a single chunk (FLAT).
-
-    Args:
-        token: Authentication token issued by Vault Admin.
-        encrypted_blob_b64: Base64 string of the serialized CiphertextScore protobuf.
-        top_k: Number of top results to return (max 10 allowed).
-
-    Returns:
-        JSON string containing the list of {shard_idx, row_idx, score}.
-    """
-    username, role = validate_token(token)
-    token_store.check_scope(role, "decrypt_scores")
-
-    # Per-role top_k enforcement
-    if top_k > role.top_k:
-        raise TopKExceededError(top_k, role.top_k, role.name)
-
-    try:
-        # 1. Deserialize CiphertextScore protobuf
-        blob_bytes = base64.b64decode(encrypted_blob_b64)
-
-        try:
-            score_proto = CiphertextScore()
-            score_proto.ParseFromString(blob_bytes)
-            encrypted_result = CipherBlock(data=score_proto)
-        except Exception as e:
-            return json.dumps({"error": f"Deserialization failed: {str(e)}"})
-
-        # 2. Decrypt with cipher.decrypt_score (NOT cipher.decrypt)
-        decrypted = cipher.decrypt_score(encrypted_result, sec_key_path=sec_key_path)
-        # decrypted: {"score": [[chunk0_scores], [chunk1_scores], ...], "shard_idx": [s0, s1, ...]}
-        score_2d = decrypted["score"]
-        shard_indices = decrypted.get("shard_idx", list(range(len(score_2d))))
-
-        # 3. Top-K across all shards (handles both FLAT and IVF_FLAT)
-        # Flatten 2D scores into (shard_idx, row_idx, score) tuples
-        all_scores = (
-            (shard_indices[i], j, float(v))
-            for i, row in enumerate(score_2d)
-            for j, v in enumerate(row)
-        )
-        topk_results = heapq.nlargest(top_k, all_scores, key=lambda x: x[2])
-
-        params = [{"shard_idx": s, "row_idx": r, "score": sc} for s, r, sc in topk_results]
-
-        return json.dumps(params)
-
-    except Exception as e:
-        return json.dumps({"error": str(e)})
-
-
-def _decrypt_metadata_impl(token: str, encrypted_metadata_list: list[str]) -> str:
-    """
-    Core implementation: Decrypts a list of per-agent AES-encrypted metadata.
-
-    Each item is a JSON string: {"a": "<agent_id>", "c": "<base64_ciphertext>"}.
-    Vault derives the agent's DEK from VAULT_TEAM_SECRET + agent_id via HKDF.
-
-    Args:
-        token: Authentication token issued by Vault Admin.
-        encrypted_metadata_list: List of JSON-encoded per-agent encrypted blobs.
-
-    Returns:
-        JSON string containing the list of decrypted metadata objects.
-    """
-    username, role = validate_token(token)
-    token_store.check_scope(role, "decrypt_metadata")
-
-    if not VAULT_TEAM_SECRET:
-        return json.dumps({"error": "VAULT_TEAM_SECRET not configured"})
-
-    try:
-        results = []
-        for blob_str in encrypted_metadata_list:
-            blob = json.loads(blob_str)
-            agent_id = blob["a"]
-            ct_b64 = blob["c"]
-            agent_dek = derive_agent_key(VAULT_TEAM_SECRET, agent_id)
-            decrypted = aes_decrypt_metadata(ct_b64, agent_dek)
-            if isinstance(decrypted, bytes):
-                decrypted = decrypted.decode("utf-8")
-            results.append(decrypted)
-        return json.dumps(results)
-    except Exception as e:
-        return json.dumps({"error": f"Metadata decryption failed: {str(e)}"})
diff --git a/vault/vault_grpc_server.py b/vault/vault_grpc_server.py
deleted file mode 100644
index eb7df7b..0000000
--- a/vault/vault_grpc_server.py
+++ /dev/null
@@ -1,375 +0,0 @@
-"""
-gRPC server for Rune-Vault.
-
-Sole entry point for the Vault service.
-Delegates to _*_impl() pure functions in vault_core.py.
-"""
-
-import json
-import logging
-import os
-import signal
-import time
-from concurrent import futures
-from datetime import datetime, timezone
-
-import grpc
-from admin_server import start_admin_server
-from grpc_health.v1 import health_pb2, health_pb2_grpc
-from grpc_health.v1.health import HealthServicer
-from grpc_reflection.v1alpha import reflection
-from proto import vault_service_pb2 as pb2
-from proto import vault_service_pb2_grpc as pb2_grpc
-from token_store import (
-    RateLimitError,
-    ScopeError,
-    TokenExpiredError,
-    TokenNotFoundError,
-    TopKExceededError,
-)
-from validation_interceptor import ValidationInterceptor
-from vault_core import (
-    _decrypt_metadata_impl,
-    _decrypt_scores_impl,
-    _get_public_key_impl,
-    token_store,
-)
-
-try:
-    from audit import audit_logger, extract_source_ip
-
-    AUDIT_AVAILABLE = True
-except ImportError:
-    AUDIT_AVAILABLE = False
-
-logger = logging.getLogger("rune.vault.grpc")
-
-MAX_MESSAGE_LENGTH = 256 * 1024 * 1024  # 256 MB (EvalKey can be tens of MB)
-
-
-def _emit_audit(method, user, top_k, result_count, status, error_detail, duration, context):
-    """Emit audit log entry."""
-    if not (AUDIT_AVAILABLE and audit_logger.enabled):
-        return
-    audit_logger.log(
-        timestamp=datetime.now(timezone.utc).isoformat(),
-        user_id=user,
-        method=method,
-        top_k=top_k,
-        result_count=result_count,
-        status=status,
-        source_ip=extract_source_ip(context),
-        latency_ms=duration * 1000,
-        error=error_detail,
-    )
-
-
-class VaultServiceServicer(pb2_grpc.VaultServiceServicer):
-    """gRPC implementation that delegates to vault_core._*_impl() functions."""
-
-    def GetPublicKey(self, request, context):
-        start_time = time.time()
-        status = "success"
-        user = "unknown"
-        result_count = 0
-        error_detail = None
-        try:
-            user = token_store.get_username(request.token) or "unknown"
-            result_json = _get_public_key_impl(request.token)
-            parsed = json.loads(result_json)
-            if isinstance(parsed, dict) and "error" in parsed:
-                status = "error"
-                error_detail = parsed["error"]
-                return pb2.GetPublicKeyResponse(error=parsed["error"])
-            result_count = 1
-            return pb2.GetPublicKeyResponse(key_bundle_json=result_json)
-        except (TokenNotFoundError, TokenExpiredError) as e:
-            status = "denied"
-            error_detail = str(e)
-            context.set_code(grpc.StatusCode.UNAUTHENTICATED)
-            context.set_details(str(e))
-            return pb2.GetPublicKeyResponse(error=str(e))
-        except RateLimitError as e:
-            status = "denied"
-            error_detail = str(e)
-            context.set_code(grpc.StatusCode.RESOURCE_EXHAUSTED)
-            context.set_details(str(e))
-            return pb2.GetPublicKeyResponse(error=str(e))
-        except ScopeError as e:
-            status = "denied"
-            error_detail = str(e)
-            context.set_code(grpc.StatusCode.PERMISSION_DENIED)
-            context.set_details(str(e))
-            return pb2.GetPublicKeyResponse(error=str(e))
-        except ValueError as e:
-            status = "denied"
-            error_detail = str(e)
-            context.set_code(grpc.StatusCode.UNAUTHENTICATED)
-            context.set_details(str(e))
-            return pb2.GetPublicKeyResponse(error=str(e))
-        except Exception as e:
-            status = "error"
-            error_detail = str(e)
-            context.set_code(grpc.StatusCode.INTERNAL)
-            context.set_details(str(e))
-            return pb2.GetPublicKeyResponse(error=str(e))
-        finally:
-            duration = time.time() - start_time
-            _emit_audit(
-                "get_public_key", user, None, result_count, status, error_detail, duration, context
-            )
-
-    def DecryptScores(self, request, context):
-        start_time = time.time()
-        status = "success"
-        user = "unknown"
-        result_count = 0
-        error_detail = None
-        try:
-            user = token_store.get_username(request.token) or "unknown"
-            result_json = _decrypt_scores_impl(
-                request.token,
-                request.encrypted_blob_b64,
-                request.top_k,
-            )
-            parsed = json.loads(result_json)
-            if isinstance(parsed, dict) and "error" in parsed:
-                status = "error"
-                error_detail = parsed["error"]
-                return pb2.DecryptScoresResponse(error=parsed["error"])
-
-            entries = [
-                pb2.ScoreEntry(
-                    shard_idx=item["shard_idx"],
-                    row_idx=item["row_idx"],
-                    score=item["score"],
-                )
-                for item in parsed
-            ]
-            result_count = len(entries)
-            return pb2.DecryptScoresResponse(results=entries)
-        except TopKExceededError as e:
-            status = "denied"
-            error_detail = str(e)
-            context.set_code(grpc.StatusCode.INVALID_ARGUMENT)
-            context.set_details(str(e))
-            return pb2.DecryptScoresResponse(error=str(e))
-        except (TokenNotFoundError, TokenExpiredError) as e:
-            status = "denied"
-            error_detail = str(e)
-            context.set_code(grpc.StatusCode.UNAUTHENTICATED)
-            context.set_details(str(e))
-            return pb2.DecryptScoresResponse(error=str(e))
-        except RateLimitError as e:
-            status = "denied"
-            error_detail = str(e)
-            context.set_code(grpc.StatusCode.RESOURCE_EXHAUSTED)
-            context.set_details(str(e))
-            return pb2.DecryptScoresResponse(error=str(e))
-        except ScopeError as e:
-            status = "denied"
-            error_detail = str(e)
-            context.set_code(grpc.StatusCode.PERMISSION_DENIED)
-            context.set_details(str(e))
-            return pb2.DecryptScoresResponse(error=str(e))
-        except ValueError as e:
-            status = "denied"
-            error_detail = str(e)
-            context.set_code(grpc.StatusCode.UNAUTHENTICATED)
-            context.set_details(str(e))
-            return pb2.DecryptScoresResponse(error=str(e))
-        except Exception as e:
-            status = "error"
-            error_detail = str(e)
-            context.set_code(grpc.StatusCode.INTERNAL)
-            context.set_details(str(e))
-            return pb2.DecryptScoresResponse(error=str(e))
-        finally:
-            duration = time.time() - start_time
-            _emit_audit(
-                "decrypt_scores",
-                user,
-                request.top_k,
-                result_count,
-                status,
-                error_detail,
-                duration,
-                context,
-            )
-
-    def DecryptMetadata(self, request, context):
-        start_time = time.time()
-        status = "success"
-        user = "unknown"
-        result_count = 0
-        error_detail = None
-        try:
-            user = token_store.get_username(request.token) or "unknown"
-            result_json = _decrypt_metadata_impl(
-                request.token,
-                list(request.encrypted_metadata_list),
-            )
-            parsed = json.loads(result_json)
-            if isinstance(parsed, dict) and "error" in parsed:
-                status = "error"
-                error_detail = parsed["error"]
-                return pb2.DecryptMetadataResponse(error=parsed["error"])
-
-            # Each element is a decrypted metadata object.
-            # Serialize non-string items back to JSON string for the proto field.
-            decrypted_strings = [
-                json.dumps(item) if not isinstance(item, str) else item for item in parsed
-            ]
-            result_count = len(decrypted_strings)
-            return pb2.DecryptMetadataResponse(decrypted_metadata=decrypted_strings)
-        except (TokenNotFoundError, TokenExpiredError) as e:
-            status = "denied"
-            error_detail = str(e)
-            context.set_code(grpc.StatusCode.UNAUTHENTICATED)
-            context.set_details(str(e))
-            return pb2.DecryptMetadataResponse(error=str(e))
-        except RateLimitError as e:
-            status = "denied"
-            error_detail = str(e)
-            context.set_code(grpc.StatusCode.RESOURCE_EXHAUSTED)
-            context.set_details(str(e))
-            return pb2.DecryptMetadataResponse(error=str(e))
-        except ScopeError as e:
-            status = "denied"
-            error_detail = str(e)
-            context.set_code(grpc.StatusCode.PERMISSION_DENIED)
-            context.set_details(str(e))
-            return pb2.DecryptMetadataResponse(error=str(e))
-        except ValueError as e:
-            status = "denied"
-            error_detail = str(e)
-            context.set_code(grpc.StatusCode.UNAUTHENTICATED)
-            context.set_details(str(e))
-            return pb2.DecryptMetadataResponse(error=str(e))
-        except Exception as e:
-            status = "error"
-            error_detail = str(e)
-            context.set_code(grpc.StatusCode.INTERNAL)
-            context.set_details(str(e))
-            return pb2.DecryptMetadataResponse(error=str(e))
-        finally:
-            duration = time.time() - start_time
-            _emit_audit(
-                "decrypt_metadata",
-                user,
-                None,
-                result_count,
-                status,
-                error_detail,
-                duration,
-                context,
-            )
-
-
-def _load_tls_credentials():
-    """
-    Load TLS credentials from environment variables.
-
-    Returns grpc.ServerCredentials or None (if TLS disabled).
-    Raises SystemExit if TLS is required but cert/key not provided.
-    """
-    if os.environ.get("VAULT_TLS_DISABLE", "").lower() == "true":
-        logger.warning("TLS DISABLED — gRPC traffic is unencrypted. Do not use in production.")
-        return None
-
-    cert_path = os.environ.get("VAULT_TLS_CERT")
-    key_path = os.environ.get("VAULT_TLS_KEY")
-
-    if not cert_path or not key_path:
-        logger.error(
-            "TLS certificate not configured. "
-            "Set VAULT_TLS_CERT and VAULT_TLS_KEY, "
-            "or set VAULT_TLS_DISABLE=true for insecure mode."
-        )
-        raise SystemExit(1)
-
-    with open(cert_path, "rb") as f:
-        cert_pem = f.read()
-    with open(key_path, "rb") as f:
-        key_pem = f.read()
-
-    logger.info("TLS configured — cert=%s", cert_path)
-    return grpc.ssl_server_credentials([(key_pem, cert_pem)])
-
-
-def serve_grpc(host: str = "0.0.0.0", port: int = 50051) -> grpc.Server:
-    """
-    Start the gRPC server. Non-blocking — returns the server object.
-    Call server.stop(grace=N) for graceful shutdown.
-    """
-    server = grpc.server(
-        futures.ThreadPoolExecutor(max_workers=4),
-        options=[
-            ("grpc.max_send_message_length", MAX_MESSAGE_LENGTH),
-            ("grpc.max_receive_message_length", MAX_MESSAGE_LENGTH),
-        ],
-        interceptors=[ValidationInterceptor()],
-    )
-
-    # Register VaultService
-    pb2_grpc.add_VaultServiceServicer_to_server(VaultServiceServicer(), server)
-
-    # Enable gRPC server reflection (for grpcurl, etc.)
-    SERVICE_NAMES = (
-        pb2.DESCRIPTOR.services_by_name["VaultService"].full_name,
-        reflection.SERVICE_NAME,
-    )
-    reflection.enable_server_reflection(SERVICE_NAMES, server)
-
-    # Register gRPC health checking (standard grpc.health.v1 protocol)
-    health_servicer = HealthServicer()
-    health_pb2_grpc.add_HealthServicer_to_server(health_servicer, server)
-    health_servicer.set(
-        "rune.vault.v1.VaultService",
-        health_pb2.HealthCheckResponse.SERVING,
-    )
-    health_servicer.set("", health_pb2.HealthCheckResponse.SERVING)
-
-    addr = f"{host}:{port}"
-    credentials = _load_tls_credentials()
-    if credentials:
-        server.add_secure_port(addr, credentials)
-        logger.info("gRPC server started on %s (TLS)", addr)
-    else:
-        server.add_insecure_port(addr)
-        logger.info("gRPC server started on %s (insecure)", addr)
-
-    server.start()
-    return server, health_servicer
-
-
-if __name__ == "__main__":
-    import argparse
-
-    logging.basicConfig(
-        level=logging.INFO,
-        format="%(asctime)s %(name)s %(levelname)s %(message)s",
-    )
-
-    parser = argparse.ArgumentParser(description="Run the Rune-Vault gRPC server.")
-    parser.add_argument("--host", default="0.0.0.0", help="Host to bind")
-    parser.add_argument("--grpc-port", type=int, default=50051, help="gRPC port")
-    args = parser.parse_args()
-
-    # Start gRPC server (non-blocking)
-    grpc_server, health_servicer = serve_grpc(host=args.host, port=args.grpc_port)
-
-    # Start admin HTTP server (internal HTTP, not exposed via Docker)
-    admin_srv = start_admin_server(token_store, health_servicer=health_servicer)
-
-    # Graceful shutdown on SIGTERM / SIGINT
-    def _shutdown(signum, frame):
-        logger.info("Received shutdown signal, stopping...")
-        admin_srv.shutdown()
-        grpc_server.stop(grace=5)
-
-    signal.signal(signal.SIGTERM, _shutdown)
-    signal.signal(signal.SIGINT, _shutdown)
-
-    logger.info("Rune-Vault is ready.")
-    grpc_server.wait_for_termination()
diff --git a/vault/verify_crypto_flow.py b/vault/verify_crypto_flow.py
deleted file mode 100644
index f51693c..0000000
--- a/vault/verify_crypto_flow.py
+++ /dev/null
@@ -1,93 +0,0 @@
-import os
-import shutil
-
-import numpy as np
-from pyenvector.crypto import Cipher, KeyGenerator
-
-KEY_DIR = "vault_keys_test"
-KEY_ID = "test-key"
-
-
-def verify_flow():
-    # 0. Clean up
-    if os.path.exists(KEY_DIR):
-        shutil.rmtree(KEY_DIR)
-
-    print("1. Generating Keys...")
-    # Using dimension 1024 for production
-    dim = 1024
-    keygen = KeyGenerator(key_path=KEY_DIR, key_id=KEY_ID, dim_list=[dim])
-    keygen.generate_keys()
-
-    # Keys found directly in KEY_DIR in this version/usage?
-    # Or maybe KeyGenerator uses key_path as the output dir directly if provided?
-    # Adjusting to observed behavior.
-    enc_path = os.path.join(KEY_DIR, "EncKey.json")
-    sec_path = os.path.join(KEY_DIR, "SecKey.json")
-
-    if not os.path.exists(enc_path):
-        raise FileNotFoundError(f"Key not found: {enc_path}")
-
-    # 2. Init Cipher
-    print(f"Initializing Cipher with dim={dim} and key={enc_path}")
-    cipher = Cipher(enc_key_path=enc_path, dim=dim)
-
-    # 3. Simulate Server: "Encrypting Scores"
-    # Create scores for dim=1024. Most can be 0.
-    mock_scores = np.zeros(dim, dtype=np.float32)
-    mock_scores[:4] = [0.9, 0.1, 0.8, 0.2]
-    print(f"Original Mock Scores (first 4): {mock_scores[:4]}")
-
-    # Encrypt explicitly. Cipher.encrypt expects a vector (numpy array)
-    # It returns a list of bytes usually (if multiple input) or single bytes?
-    # Let's try encrypting as "item" or "query"?
-    # Actually we just want to encrypt a generic vector.
-    # 'encrypt' method usually takes (data, type). Type might be 'item', 'query'.
-    # For simulation, we just want to produce a ciphertext.
-    # Let's try type="item".
-    try:
-        # Encrypt results
-        encrypted_result = cipher.encrypt(mock_scores, "item")
-        print(f"Encrypted result type: {type(encrypted_result)}")
-
-        # 4. Simulate Vault: "Decrypting Scores"
-        print("Decrypting using standard decrypt (simulating score decryption)...")
-        # Use standard decrypt, which should work for encrypted vectors.
-        decrypted_vector = cipher.decrypt(encrypted_result, sec_key_path=sec_path)
-
-        # decrypted_vector is likely a numpy array or list of arrays
-        print(f"Decrypted Vector type: {type(decrypted_vector)}")
-        if isinstance(decrypted_vector, list) and len(decrypted_vector) > 0:
-            print(f"Item 0 type: {type(decrypted_vector[0])}")
-            print(f"Decrypted Vector (full): {decrypted_vector}")
-
-        # Check similarity
-        final_result = decrypted_vector
-        # Only unwrap if it looks like a list of lists/arrays
-        if (
-            isinstance(final_result, list)
-            and len(final_result) > 0
-            and (isinstance(final_result[0], list) or isinstance(final_result[0], np.ndarray))
-        ):
-            final_result = final_result[0]
-
-        print(f"Decrypted: {final_result[:4]}")
-
-        dec_arr = np.array(final_result)
-        diff = np.abs(mock_scores - dec_arr[: len(mock_scores)])
-        print(f"Max Diff: {np.max(diff)}")
-
-        if np.max(diff) < 1e-4:
-            print("SUCCESS: Crypto compatibility verified (via standard decrypt).")
-        else:
-            print("FAILURE: Decrypted values do not match.")
-
-    except Exception as e:
-        print(f"ERROR: {e}")
-        import traceback
-
-        traceback.print_exc()
-
-
-if __name__ == "__main__":
-    verify_flow()

From bf171956529972e89b3e626bbd543630e161fe95 Mon Sep 17 00:00:00 2001
From: Jeonghwan Lee <jhlee@cryptolab.co.kr>
Date: Mon, 27 Apr 2026 12:02:15 +0900
Subject: [PATCH 02/27] ci: add release binary pipeline with multi-platform
 build and checksum verification

---
 .github/workflows/ci.yml             |  47 +++-----
 .github/workflows/docker-publish.yml |  56 ---------
 .github/workflows/release.yaml       | 165 +++++++++++++++++++++++++++
 3 files changed, 178 insertions(+), 90 deletions(-)
 delete mode 100644 .github/workflows/docker-publish.yml
 create mode 100644 .github/workflows/release.yaml

diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml
index 1ac2a91..2aa6692 100644
--- a/.github/workflows/ci.yml
+++ b/.github/workflows/ci.yml
@@ -7,18 +7,18 @@ on:
       - "docs/**"
       - "*.md"
       - "deployment/**"
-      - ".github/workflows/docker-publish.yml"
       - "LICENSE"
       - ".githooks/**"
+      - ".github/workflows/**"
   push:
     branches: [main]
     paths-ignore:
       - "docs/**"
       - "*.md"
       - "deployment/**"
-      - ".github/workflows/docker-publish.yml"
       - "LICENSE"
       - ".githooks/**"
+      - ".github/workflows/**"
 
 concurrency:
   group: ci-${{ github.event.pull_request.number || github.sha }}
@@ -26,12 +26,12 @@ concurrency:
 
 jobs:
   check:
-    runs-on: [self-hosted, vault-ci]
+    runs-on: ubuntu-latest
+    env:
+      MISE_ENV: ci
     steps:
       - uses: actions/checkout@v4
       - uses: jdx/mise-action@v2
-        env:
-          MISE_ENV: ci
       - run: mise run setup
       - name: Clean previous fixtures
         run: rm -rf tests/fixtures/
@@ -39,35 +39,14 @@ jobs:
         env:
           FIXTURES_GPG_PASSPHRASE: ${{ secrets.FIXTURES_GPG_PASSPHRASE_ALT }}
         run: mise run fixtures:decrypt
-      - name: Format check
-        run: mise run format:check
-      - name: Lint
-        run: mise run lint
-      - name: Test (unit + integration)
-        run: mise run test
-      - name: Clean up fixtures
-        if: always()
-        run: rm -rf tests/fixtures/
-
-  build-image:
-    if: github.event_name == 'push'
-    needs: check
-    runs-on: [self-hosted, vault-ci]
-    steps:
-      - uses: actions/checkout@v4
+      - name: Check (gofmt + vet + unit tests)
+        run: mise run check
       - name: Build
         run: |
-          docker build -t rune-vault:ci-${{ github.sha }} vault/
-      - name: Smoke test
-        run: |
-          docker run -d --name vault-ci-${{ github.run_id }} \
-            -e VAULT_TLS_DISABLE=true \
-            rune-vault:ci-${{ github.sha }}
-          timeout 60 bash -c 'until docker exec vault-ci-${{ github.run_id }} \
-            curl -sf http://localhost:8081/health 2>/dev/null; do sleep 2; done'
-      - name: Teardown
+          VERSION=$(git describe --tags --always 2>/dev/null || echo "dev")
+          VERSION=$VERSION mise run go:build
+      - name: E2E tests
+        run: mise run go:test:e2e
+      - name: Clean up fixtures
         if: always()
-        run: |
-          docker rm -f vault-ci-${{ github.run_id }} || true
-          docker rmi rune-vault:ci-${{ github.sha }} || true
-          docker system prune -f
+        run: rm -rf tests/fixtures/
diff --git a/.github/workflows/docker-publish.yml b/.github/workflows/docker-publish.yml
deleted file mode 100644
index d4921e8..0000000
--- a/.github/workflows/docker-publish.yml
+++ /dev/null
@@ -1,56 +0,0 @@
-name: Build and Push Docker Image
-
-on:
-  release:
-    types: [published]
-
-env:
-  REGISTRY: ghcr.io
-  IMAGE_NAME: cryptolabinc/rune-vault
-
-jobs:
-  build-and-push:
-    runs-on: [self-hosted, vault-ci]
-
-    permissions:
-      contents: read
-      packages: write
-
-    steps:
-      - name: Checkout repository
-        uses: actions/checkout@v4
-
-      - name: Set up QEMU
-        uses: docker/setup-qemu-action@v3
-
-      - name: Set up Docker Buildx
-        uses: docker/setup-buildx-action@v3
-
-      - name: Log in to GHCR
-        uses: docker/login-action@v3
-        with:
-          registry: ${{ env.REGISTRY }}
-          username: ${{ github.actor }}
-          password: ${{ secrets.GITHUB_TOKEN }}
-
-      - name: Extract metadata (tags, labels)
-        id: meta
-        uses: docker/metadata-action@v5
-        with:
-          images: ${{ env.REGISTRY }}/${{ env.IMAGE_NAME }}
-          tags: |
-            type=semver,pattern={{version}}
-            type=semver,pattern=v{{version}}
-            type=semver,pattern={{major}}.{{minor}}
-            type=raw,value=latest,enable={{is_default_branch}}
-
-      - name: Build and push Docker image
-        uses: docker/build-push-action@v6
-        with:
-          context: vault/
-          platforms: linux/amd64,linux/arm64
-          push: true
-          tags: ${{ steps.meta.outputs.tags }}
-          labels: ${{ steps.meta.outputs.labels }}
-          cache-from: type=gha
-          cache-to: type=gha,mode=max
diff --git a/.github/workflows/release.yaml b/.github/workflows/release.yaml
new file mode 100644
index 0000000..7a9c452
--- /dev/null
+++ b/.github/workflows/release.yaml
@@ -0,0 +1,165 @@
+name: Release Binaries
+
+on:
+  release:
+    types: [prereleased]
+  workflow_dispatch:
+    inputs:
+      dry_run:
+        description: 'Dry run — skip GitHub Release upload'
+        required: false
+        default: 'true'
+        type: boolean
+
+concurrency:
+  group: release-binaries-${{ github.ref }}
+  cancel-in-progress: false
+
+jobs:
+  build:
+    name: Build ${{ matrix.os }}/${{ matrix.arch }}
+    runs-on: ${{ matrix.runner }}
+    strategy:
+      fail-fast: false
+      matrix:
+        include:
+          - { runner: ubuntu-latest,    os: linux,  arch: amd64 }
+          - { runner: ubuntu-24.04-arm, os: linux,  arch: arm64 }
+          - { runner: macos-14,         os: darwin, arch: arm64 }
+          - { runner: macos-14,         os: darwin, arch: amd64 }
+
+    steps:
+      - uses: actions/checkout@v4
+
+      - uses: jdx/mise-action@v2
+
+      - name: Bootstrap (modules + proto stubs)
+        run: mise run setup
+
+      - name: Install OpenSSL (Linux)
+        if: matrix.os == 'linux'
+        run: sudo apt-get install -y libssl-dev
+
+      - name: Install OpenSSL arm64 (macOS)
+        if: matrix.os == 'darwin'
+        run: brew install openssl@3
+
+      - name: Install Intel Homebrew + OpenSSL x86_64 (macOS amd64 cross)
+        if: matrix.os == 'darwin' && matrix.arch == 'amd64'
+        run: |
+          if ! [ -x /usr/local/bin/brew ]; then
+            NONINTERACTIVE=1 arch -x86_64 /bin/bash -c \
+              "$(curl -fsSL https://raw.githubusercontent.com/Homebrew/install/HEAD/install.sh)"
+          fi
+          arch -x86_64 /usr/local/bin/brew install openssl@3
+
+      - name: Check (gofmt + go vet + unit tests)
+        run: mise run check
+
+      - name: Resolve version
+        id: meta
+        run: |
+          if [ "${{ github.event_name }}" = "release" ]; then
+            VERSION="${{ github.event.release.tag_name }}"
+          else
+            VERSION=$(git describe --tags --always 2>/dev/null || echo "dev")
+          fi
+          echo "version=${VERSION}" >> "$GITHUB_OUTPUT"
+          echo "archive=runevault_${VERSION}_${{ matrix.os }}_${{ matrix.arch }}.tar.gz" >> "$GITHUB_OUTPUT"
+
+      - name: Build binary
+        env:
+          GOOS: ${{ matrix.os }}
+          GOARCH: ${{ matrix.arch }}
+          VERSION: ${{ steps.meta.outputs.version }}
+        run: |
+          PKG="github.com/CryptoLabInc/rune-admin/vault/internal/commands"
+          COMMIT=$(git rev-parse --short HEAD)
+          DATE=$(date -u +%Y-%m-%dT%H:%M:%SZ)
+          if [ "${{ matrix.os }}" = "darwin" ] && [ "${{ matrix.arch }}" = "amd64" ]; then
+            SDKROOT=$(xcrun -sdk macosx --show-sdk-path)
+            export CC="clang -arch x86_64 -isysroot ${SDKROOT}"
+            export CGO_CFLAGS="-arch x86_64 -I/usr/local/opt/openssl@3/include"
+            export CGO_LDFLAGS="-arch x86_64 -L/usr/local/opt/openssl@3/lib"
+          fi
+          cd vault && go build \
+            -trimpath \
+            -ldflags "-s -w -X '${PKG}.buildVersion=${VERSION}' -X '${PKG}.buildCommit=${COMMIT}' -X '${PKG}.buildDate=${DATE}'" \
+            -o bin/runevault \
+            ./cmd
+
+      - name: Smoke test
+        run: |
+          if [ "${{ matrix.os }}" = "darwin" ] && [ "${{ matrix.arch }}" = "amd64" ]; then
+            arch -x86_64 ./vault/bin/runevault version
+          else
+            ./vault/bin/runevault version
+          fi
+
+      - name: Package
+        run: |
+          mkdir -p _dist
+          cp vault/bin/runevault _dist/
+          cp LICENSE _dist/
+          tar -czf "${{ steps.meta.outputs.archive }}" -C _dist .
+
+      - uses: actions/upload-artifact@v4
+        with:
+          name: ${{ steps.meta.outputs.archive }}
+          path: ${{ steps.meta.outputs.archive }}
+          retention-days: 7
+
+  publish:
+    name: Sign and publish
+    runs-on: ubuntu-latest
+    needs: build
+    permissions:
+      contents: write
+      id-token: write
+
+    steps:
+      - uses: actions/checkout@v4
+
+      - name: Download build artifacts
+        uses: actions/download-artifact@v4
+        with:
+          path: dist/
+          merge-multiple: true
+
+      - name: Install cosign
+        uses: sigstore/cosign-installer@v3
+
+      - name: Resolve version
+        id: meta
+        run: |
+          if [ "${{ github.event_name }}" = "release" ]; then
+            echo "version=${{ github.event.release.tag_name }}" >> "$GITHUB_OUTPUT"
+          else
+            echo "version=$(git describe --tags --always 2>/dev/null || echo dev)" >> "$GITHUB_OUTPUT"
+          fi
+
+      - name: Generate SHA256SUMS
+        working-directory: dist/
+        run: sha256sum *.tar.gz > SHA256SUMS
+
+      - name: Sign SHA256SUMS
+        working-directory: dist/
+        run: |
+          cosign sign-blob \
+            --yes \
+            --output-signature SHA256SUMS.sig \
+            --output-certificate SHA256SUMS.pem \
+            SHA256SUMS
+
+      - name: Upload to GitHub Release
+        if: github.event_name == 'release'
+        working-directory: dist/
+        env:
+          GH_TOKEN: ${{ github.token }}
+        run: |
+          gh release upload "${{ github.event.release.tag_name }}" \
+            *.tar.gz \
+            SHA256SUMS \
+            SHA256SUMS.sig \
+            SHA256SUMS.pem \
+            --repo "${{ github.repository }}"

From eee3ac5150c49ef0dd877e0e17ef9206dd81885b Mon Sep 17 00:00:00 2001
From: Jeonghwan Lee <jhlee@cryptolab.co.kr>
Date: Mon, 27 Apr 2026 12:02:15 +0900
Subject: [PATCH 03/27] docs: add security check section on README

---
 README.md | 64 +++++++++++++++++++++++++++++++++++++++++++------------
 1 file changed, 50 insertions(+), 14 deletions(-)

diff --git a/README.md b/README.md
index 72b5829..a125008 100644
--- a/README.md
+++ b/README.md
@@ -38,22 +38,34 @@ Team members install [Rune](https://github.com/CryptoLabInc/rune) from Claude Ma
 
 ## Quick Start
 
-### 1. Deploy Rune-Vault
+### 1. Build and run Rune-Vault
+
+Phase 1 of the Go runtime migration ships the daemon as a single binary
+`runevault`. The cloud installer (binary distribution + Terraform) lands
+in Phase 3 (issue #64); until then, build from source:
 
 ```bash
-curl -fsSL https://raw.githubusercontent.com/CryptoLabInc/rune-admin/main/install.sh -o install.sh && sudo bash install.sh
+git clone https://github.com/CryptoLabInc/rune-admin.git
+cd rune-admin/vault
+go build -o /usr/local/bin/runevault ./cmd/runevault
 ```
 
-The installer will interactively guide you through:
-- Cloud provider selection (AWS / GCP / OCI)
-- enVector Cloud credentials
-- TLS certificate generation
-- Terraform-based VM provisioning
+Render `runevault.conf` from the template (paths, TLS cert/key, envector
+credentials, team secret) and place it at
+`/opt/rune-vault/configs/runevault.conf`:
 
-**Output**:
+```bash
+# Template
+cat vault/internal/server/testdata/runevault.conf.example
+# (then write your filled-in copy)
+sudo install -m 0600 -o "$(id -un)" runevault.conf /opt/rune-vault/configs/runevault.conf
 ```
-vault_endpoint = "vault-yourteam.oci.envector.io:50051"
-ca.pem downloaded for TLS verification
+
+Generate self-signed TLS certs (or supply your own) and start the daemon:
+
+```bash
+mise run certs                       # writes certs/server.{pem,key}
+runevault daemon start               # foreground; Ctrl+C or `runevault daemon stop` to exit
 ```
 
 ### 2. Verify Deployment
@@ -113,13 +125,37 @@ Vault communications MUST use TLS. The installer automatically configures TLS ce
 - **EncKey/EvalKey**: Safe to distribute (public keys)
 - Per-agent metadata encryption uses HKDF-derived DEKs (no separate key file)
 
+### Release Signature Verification
+
+Every GitHub release ships `SHA256SUMS`, `SHA256SUMS.sig`, and `SHA256SUMS.pem`.
+The checksum file is signed keylessly via [Sigstore](https://sigstore.dev) from the
+`release.yaml` workflow. Verify before installing:
+
+```bash
+cosign verify-blob \
+  --signature SHA256SUMS.sig \
+  --certificate SHA256SUMS.pem \
+  --certificate-oidc-issuer https://token.actions.githubusercontent.com \
+  --certificate-identity-regexp "^https://github.com/CryptoLabInc/rune-admin/.github/workflows/release.yaml@" \
+  SHA256SUMS
+
+sha256sum --check --ignore-missing SHA256SUMS
+```
+
+The `--certificate-oidc-issuer` and `--certificate-identity-regexp` flags are
+required to pin the signature to this repository's workflow — without them,
+any Fulcio-issued certificate (including one from a different repository) would
+pass verification.
+
 ## Deployment Targets
 
-All cloud deployments are handled by the [interactive installer](#quick-start).
+Cloud deployment automation (Terraform modules under `deployment/`) is
+on hold during the Phase 1 → Phase 3 transition. Deploy the binary
+directly to your VM of choice for now.
 
-- **OCI** (Oracle Cloud Infrastructure): `deployment/oci/`
-- **AWS** (Amazon Web Services): `deployment/aws/`
-- **GCP** (Google Cloud Platform): `deployment/gcp/`
+- **OCI** (Oracle Cloud Infrastructure): `deployment/oci/` (Phase 3)
+- **AWS** (Amazon Web Services): `deployment/aws/` (Phase 3)
+- **GCP** (Google Cloud Platform): `deployment/gcp/` (Phase 3)
 
 ## Development
 

From e49ac3d2c2caa9abdb42de3f8469fe02deddcf11 Mon Sep 17 00:00:00 2001
From: Jeonghwan Lee <jhlee@cryptolab.co.kr>
Date: Mon, 27 Apr 2026 12:02:15 +0900
Subject: [PATCH 04/27] =?UTF-8?q?feat:=20add=20EnsureVault=20to=20server?=
 =?UTF-8?q?=20startup=20=E2=80=94=20activate=20keys=20and=20ensure=20index?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---
 vault/internal/server/ensure_vault.go | 76 +++++++++++++++++++++++++++
 1 file changed, 76 insertions(+)
 create mode 100644 vault/internal/server/ensure_vault.go

diff --git a/vault/internal/server/ensure_vault.go b/vault/internal/server/ensure_vault.go
new file mode 100644
index 0000000..2fb2233
--- /dev/null
+++ b/vault/internal/server/ensure_vault.go
@@ -0,0 +1,76 @@
+package server
+
+import (
+	"context"
+	"fmt"
+	"log/slog"
+	"path/filepath"
+
+	envector "github.com/CryptoLabInc/envector-go-sdk"
+)
+
+// EnsureVault connects to enVector Cloud and idempotently performs the two
+// cloud-side setup steps that the Python vault_core.ensure_vault() ran at
+// startup before the gRPC server began accepting requests:
+//
+//  1. ActivateKeys — registers the EvalKey bundle if absent, unloads any
+//     other resident key, then loads the target key (4-RPC sequence in the
+//     SDK, already idempotent).
+//  2. Index — creates the team index if it does not yet exist; no-op when
+//     the index is already present.
+//
+// Returns nil immediately (offline mode) when envector.endpoint or
+// envector.api_key is unset, matching the Python "warn and skip" behaviour.
+func EnsureVault(ctx context.Context, cfg *Config) error {
+	if cfg.Envector.Endpoint == "" || cfg.Envector.APIKey == "" {
+		slog.Warn("vault: envector.endpoint / envector.api_key not set — skipping cloud key registration and index setup (offline mode)")
+		return nil
+	}
+	if cfg.Keys.IndexName == "" {
+		slog.Warn("vault: keys.index_name not set — skipping index creation")
+		return nil
+	}
+
+	slog.Info("vault: connecting to enVector Cloud", "endpoint", cfg.Envector.Endpoint)
+
+	client, err := envector.NewClient(
+		envector.WithAddress(cfg.Envector.Endpoint),
+		envector.WithAccessToken(cfg.Envector.APIKey),
+	)
+	if err != nil {
+		return fmt.Errorf("ensure vault: dial enVector: %w", err)
+	}
+	defer client.Close()
+
+	// Only EvalKey is needed: ActivateKeys uploads it to the cloud, and
+	// Index/createIndex uses Dim() and ID() which are set from options
+	// regardless of which key parts are loaded.
+	keyDir := filepath.Join(cfg.Keys.Path, defaultKeyID(cfg))
+	keys, err := envector.OpenKeysFromFile(
+		envector.WithKeyPath(keyDir),
+		envector.WithKeyID(defaultKeyID(cfg)),
+		envector.WithKeyDim(cfg.Keys.EmbeddingDim),
+		envector.WithKeyParts(envector.KeyPartEval),
+	)
+	if err != nil {
+		return fmt.Errorf("ensure vault: open eval key: %w", err)
+	}
+	defer keys.Close()
+
+	slog.Info("vault: activating FHE keys on enVector Cloud", "key_id", defaultKeyID(cfg))
+	if err := client.ActivateKeys(ctx, keys); err != nil {
+		return fmt.Errorf("ensure vault: activate keys: %w", err)
+	}
+	slog.Info("vault: FHE keys activated")
+
+	slog.Info("vault: ensuring team index", "index", cfg.Keys.IndexName)
+	if _, err := client.Index(ctx,
+		envector.WithIndexName(cfg.Keys.IndexName),
+		envector.WithIndexKeys(keys),
+	); err != nil {
+		return fmt.Errorf("ensure vault: ensure index: %w", err)
+	}
+	slog.Info("vault: team index ready", "index", cfg.Keys.IndexName)
+
+	return nil
+}

From 475b14fcda74b34f25470e3f25c750b276528999 Mon Sep 17 00:00:00 2001
From: Jeonghwan Lee <jhlee@cryptolab.co.kr>
Date: Mon, 27 Apr 2026 12:02:15 +0900
Subject: [PATCH 05/27] feat: add production installer with systemd/launchd
 service registration

---
 .../launchd/com.cryptolabinc.runevault.plist  |   45 +
 deployment/systemd/runevault.service          |   38 +
 install.sh                                    | 1617 +++++++++--------
 scripts/install-dev.sh                        |  892 +--------
 4 files changed, 934 insertions(+), 1658 deletions(-)
 create mode 100644 deployment/launchd/com.cryptolabinc.runevault.plist
 create mode 100644 deployment/systemd/runevault.service

diff --git a/deployment/launchd/com.cryptolabinc.runevault.plist b/deployment/launchd/com.cryptolabinc.runevault.plist
new file mode 100644
index 0000000..7b1bfb3
--- /dev/null
+++ b/deployment/launchd/com.cryptolabinc.runevault.plist
@@ -0,0 +1,45 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE plist PUBLIC "-//Apple//DTD PLIST 1.0//EN"
+  "http://www.apple.com/DTDs/PropertyList-1.0.dtd">
+<plist version="1.0">
+<dict>
+  <key>Label</key>
+  <string>com.cryptolabinc.runevault</string>
+
+  <key>ProgramArguments</key>
+  <array>
+    <string>/usr/local/bin/runevault</string>
+    <string>daemon</string>
+    <string>start</string>
+    <string>--config</string>
+    <string>/opt/runevault/configs/runevault.conf</string>
+  </array>
+
+  <key>UserName</key>
+  <string>runevault</string>
+
+  <key>RunAtLoad</key>
+  <true/>
+
+  <key>KeepAlive</key>
+  <true/>
+
+  <key>ThrottleInterval</key>
+  <integer>10</integer>
+
+  <key>StandardOutPath</key>
+  <string>/opt/runevault/logs/runevault.stdout.log</string>
+
+  <key>StandardErrorPath</key>
+  <string>/opt/runevault/logs/runevault.stderr.log</string>
+
+  <key>EnvironmentVariables</key>
+  <dict>
+    <key>PATH</key>
+    <string>/usr/local/bin:/usr/bin:/bin:/usr/sbin:/sbin</string>
+  </dict>
+
+  <key>ProcessType</key>
+  <string>Background</string>
+</dict>
+</plist>
diff --git a/deployment/systemd/runevault.service b/deployment/systemd/runevault.service
new file mode 100644
index 0000000..72dfe74
--- /dev/null
+++ b/deployment/systemd/runevault.service
@@ -0,0 +1,38 @@
+[Unit]
+Description=Rune-Vault FHE gRPC Server
+Documentation=https://github.com/CryptoLabInc/rune-admin
+After=network-online.target
+Wants=network-online.target
+
+[Service]
+Type=simple
+User=runevault
+Group=runevault
+ExecStart=/usr/local/bin/runevault daemon start --config /opt/runevault/configs/runevault.conf
+Restart=on-failure
+RestartSec=5s
+TimeoutStopSec=30s
+StandardOutput=journal
+StandardError=journal
+SyslogIdentifier=runevault
+
+# Security hardening
+NoNewPrivileges=true
+PrivateTmp=true
+ProtectSystem=strict
+ProtectHome=true
+ReadWritePaths=/opt/runevault
+ProtectKernelTunables=true
+ProtectKernelModules=true
+ProtectControlGroups=true
+RestrictAddressFamilies=AF_INET AF_INET6 AF_UNIX
+RestrictNamespaces=true
+LockPersonality=true
+MemoryDenyWriteExecute=false
+RestrictRealtime=true
+RestrictSUIDSGID=true
+RemoveIPC=true
+LimitNOFILE=65536
+
+[Install]
+WantedBy=multi-user.target
diff --git a/install.sh b/install.sh
index 15c8879..8f6288b 100755
--- a/install.sh
+++ b/install.sh
@@ -1,860 +1,869 @@
-#!/bin/bash
-# Rune-Vault Interactive Server Setup
-# Usage: curl -fsSL https://raw.githubusercontent.com/CryptoLabInc/rune-admin/main/install.sh -o install.sh && sudo bash install.sh
+#!/usr/bin/env bash
+#
+# Rune-Vault installer.
+#
+# Downloads, verifies, and installs the runevault daemon with systemd (Linux)
+# or launchd (macOS) service registration.
+#
+# Usage:
+#   sudo bash install.sh [options]
+#
+# Options:
+#   --version <tag>      Install a specific release tag (default: latest)
+#   --force              Overwrite existing config and TLS certificates
+#   --non-interactive    Skip all prompts; supply secrets via env vars
+#   --uninstall          Stop the service, remove files, optionally delete data
+#
+# Non-interactive env vars:
+#   RUNEVAULT_TEAM_NAME              keys.index_name (required)
+#   RUNEVAULT_ENVECTOR_ENDPOINT      envector.endpoint (required)
+#   RUNEVAULT_ENVECTOR_API_KEY       envector.api_key
+#   RUNEVAULT_ENVECTOR_API_KEY_FILE  envector.api_key_file (alternative)
+#   RUNEVAULT_TEAM_SECRET            tokens.team_secret (auto-generated if unset)
+#   RUNEVAULT_TLS_CERT_PATH          Path to existing TLS cert (skips auto-gen)
+#   RUNEVAULT_TLS_KEY_PATH           Path to existing TLS key  (skips auto-gen)
+#
+# Dev/testing env vars (set by scripts/install-dev.sh):
+#   RUNEVAULT_LOCAL_BINARY    Path to local binary; skips download + verification
+#   RUNEVAULT_SKIP_VERIFY     Set to 1 to skip cosign verification
+#   RUNEVAULT_INSTALL_PREFIX  Override /opt/runevault (default)
+#   RUNEVAULT_BINARY_PATH     Override /usr/local/bin/runevault (default)
+#   RUNEVAULT_SKIP_SERVICE    Set to 1 to skip systemd/launchd installation
 
 set -euo pipefail
 
-# ─── Root privilege check ─────────────────────────────────────────────────────
-
-if [ "$(id -u)" -ne 0 ]; then
-    echo "Error: This script must be run as root. Use: sudo bash install.sh"
-    exit 1
+# ── Constants ──────────────────────────────────────────────────────────────────
+REPO=CryptoLabInc/rune-admin
+OIDC_ISSUER=https://token.actions.githubusercontent.com
+CERT_REGEXP="^https://github.com/CryptoLabInc/rune-admin/.github/workflows/release.yaml@"
+SERVICE_USER=runevault
+GRPC_PORT=50051
+
+# Overridable by env (used by scripts/install-dev.sh)
+INSTALL_PREFIX="${RUNEVAULT_INSTALL_PREFIX:-/opt/runevault}"
+BINARY_DEST="${RUNEVAULT_BINARY_PATH:-/usr/local/bin/runevault}"
+SKIP_VERIFY="${RUNEVAULT_SKIP_VERIFY:-0}"
+LOCAL_BINARY="${RUNEVAULT_LOCAL_BINARY:-}"
+SKIP_SERVICE="${RUNEVAULT_SKIP_SERVICE:-0}"
+
+# ── Color helpers ──────────────────────────────────────────────────────────────
+if [[ -t 1 ]]; then
+  _RED='\033[0;31m' _GRN='\033[0;32m' _BLU='\033[0;34m' _YLW='\033[0;33m' _RST='\033[0m'
+else
+  _RED='' _GRN='' _BLU='' _YLW='' _RST=''
 fi
-
-# ─── Parse flags ──────────────────────────────────────────────────────────────
-
-VERSION_OVERRIDE=""
-while [ $# -gt 0 ]; do
-    case "$1" in
-        --version) VERSION_OVERRIDE="$2"; shift 2 ;;
-        --version=*) VERSION_OVERRIDE="${1#*=}"; shift ;;
-        *) shift ;;
-    esac
+die()     { printf "${_RED}ERROR:${_RST} %s\n" "$*" >&2; exit 1; }
+info()    { printf "${_BLU}==>${_RST} %s\n" "$*"; }
+success() { printf "${_GRN}✓${_RST} %s\n" "$*"; }
+warn()    { printf "${_YLW}WARNING:${_RST} %s\n" "$*" >&2; }
+
+# ── Argument parsing ───────────────────────────────────────────────────────────
+UNINSTALL=0
+FORCE=0
+VERSION=""
+NON_INTERACTIVE=0
+
+while [[ $# -gt 0 ]]; do
+  case $1 in
+    --version)         VERSION="$2"; shift 2 ;;
+    --uninstall)       UNINSTALL=1; shift ;;
+    --force)           FORCE=1; shift ;;
+    --non-interactive) NON_INTERACTIVE=1; shift ;;
+    *) die "Unknown flag: $1" ;;
+  esac
 done
 
-# ─── Constants ────────────────────────────────────────────────────────────────
-
-REPO="CryptoLabInc/rune-admin"
-DOCKER_IMAGE="ghcr.io/cryptolabinc/rune-vault"
-_user_home="${SUDO_USER:+$(eval echo ~"$SUDO_USER")}"
-DEFAULT_INSTALL_DIR="${_user_home:-$HOME}/rune-vault"
-VAULT_PUBLIC_IP=""
-CSP_CA_CERT_LOCAL=""
-
-# ─── Colors & output helpers ─────────────────────────────────────────────────
-
-RED='\033[0;31m'
-GREEN='\033[0;32m'
-YELLOW='\033[1;33m'
-BLUE='\033[0;34m'
-BOLD='\033[1m'
-NC='\033[0m'
-
-print_header() {
-    echo -e "\n${BLUE}================================================${NC}"
-    echo -e "${BLUE}  $1${NC}"
-    echo -e "${BLUE}================================================${NC}\n"
+# Auto-set non-interactive when stdin is not a TTY (e.g. curl | bash)
+[[ -t 0 ]] || NON_INTERACTIVE=1
+
+# ── Platform detection ─────────────────────────────────────────────────────────
+case "$(uname -s)" in
+  Linux)  OS_SLUG=linux ;;
+  Darwin) OS_SLUG=darwin ;;
+  *)      die "Unsupported OS: $(uname -s). Only Linux and macOS are supported." ;;
+esac
+case "$(uname -m)" in
+  x86_64|amd64)  ARCH_SLUG=amd64 ;;
+  arm64|aarch64) ARCH_SLUG=arm64 ;;
+  *)             die "Unsupported architecture: $(uname -m)." ;;
+esac
+
+# ── Uninstall flow ─────────────────────────────────────────────────────────────
+run_uninstall() {
+  info "Uninstalling Rune-Vault..."
+  [[ "$(id -u)" -eq 0 ]] || die "Uninstall must be run as root (use sudo)."
+
+  if [[ "$OS_SLUG" = linux ]]; then
+    if systemctl is-active --quiet runevault.service 2>/dev/null; then
+      info "Stopping runevault.service..."
+      systemctl stop runevault.service
+    fi
+    systemctl disable runevault.service 2>/dev/null || true
+    rm -f /etc/systemd/system/runevault.service
+    systemctl daemon-reload
+    success "systemd service removed."
+  else
+    local plist=/Library/LaunchDaemons/com.cryptolabinc.runevault.plist
+    if [[ -f "$plist" ]]; then
+      launchctl bootout system/com.cryptolabinc.runevault 2>/dev/null || true
+      rm -f "$plist"
+      success "launchd service removed."
+    fi
+  fi
+
+  rm -f "$BINARY_DEST"
+  success "Binary removed: ${BINARY_DEST}"
+
+  printf '\n'
+  warn "The following directory contains Rune-Vault Keys and configuration:"
+  warn "  ${INSTALL_PREFIX}/"
+  warn "This data CANNOT be recovered if deleted."
+  printf '\n'
+
+  local answer=n
+  if [[ "$NON_INTERACTIVE" -eq 1 ]]; then
+    warn "Non-interactive mode: data preserved. Remove manually: rm -rf ${INSTALL_PREFIX}"
+  else
+    read -r -p "Delete all vault data including Rune-Vault Keys? [y/N] " answer
+  fi
+
+  case "$answer" in
+    [Yy]*)
+      rm -rf "${INSTALL_PREFIX}"
+      success "Vault data deleted."
+      ;;
+    *)
+      info "Data preserved at ${INSTALL_PREFIX}"
+      ;;
+  esac
+
+  if [[ "$OS_SLUG" = linux ]]; then
+    if id "$SERVICE_USER" >/dev/null 2>&1; then
+      userdel "$SERVICE_USER" 2>/dev/null || true
+      success "System user '${SERVICE_USER}' removed."
+    fi
+    if getent group "$SERVICE_USER" >/dev/null 2>&1; then
+      groupdel "$SERVICE_USER" 2>/dev/null || true
+      success "System group '${SERVICE_USER}' removed."
+    fi
+  else
+    if id "$SERVICE_USER" >/dev/null 2>&1; then
+      dscl . -delete /Users/"$SERVICE_USER" 2>/dev/null || true
+      success "System user '${SERVICE_USER}' removed."
+    fi
+    if dscl . -read /Groups/"$SERVICE_USER" >/dev/null 2>&1; then
+      dscl . -delete /Groups/"$SERVICE_USER" 2>/dev/null || true
+      success "System group '${SERVICE_USER}' removed."
+    fi
+  fi
+
+  success "Rune-Vault uninstalled."
 }
 
-print_info()  { echo -e "${GREEN}✓${NC} $1"; }
-print_warn()  { echo -e "${YELLOW}⚠${NC} $1"; }
-print_error() { echo -e "${RED}✗${NC} $1"; }
-print_step()  { echo -e "\n${BOLD}▸ $1${NC}\n"; }
-
-# ─── Cleanup trap ─────────────────────────────────────────────────────────────
-
-CLEANUP_DIR=""
-cleanup() {
-    printf '\033[?25h' >&2 2>/dev/null || true
-    if [ -n "$CLEANUP_DIR" ] && [ -d "$CLEANUP_DIR" ]; then
-        rm -rf "$CLEANUP_DIR"
-    fi
+# ── Tool auto-install ──────────────────────────────────────────────────────────
+
+# Run brew as the original (non-root) user when invoked via sudo on macOS.
+_brew() { sudo -u "${SUDO_USER:-$(id -un)}" brew "$@"; }
+
+_pkg_install() {
+  if command -v apt-get >/dev/null 2>&1; then
+    apt-get install -y "$@"
+  elif command -v dnf >/dev/null 2>&1; then
+    dnf install -y "$@"
+  elif command -v yum >/dev/null 2>&1; then
+    yum install -y "$@"
+  else
+    die "No supported package manager found (apt/dnf/yum). Install manually: $*"
+  fi
 }
-trap cleanup EXIT
-
-# ─── Prompt helper ────────────────────────────────────────────────────────────
 
-prompt() {
-    local varname="$1" message="$2" default="${3:-}"
-    if [ -n "$default" ]; then
-        printf "${BOLD}%s${NC} [%s]: " "$message" "$default" >&2
-    else
-        printf "${BOLD}%s${NC}: " "$message" >&2
-    fi
-    local value
-    read -r value
-    value="${value:-$default}"
-    eval "$varname=\"\$value\""
+_install_tool() {
+  local tool=$1
+  info "Installing ${tool}..."
+  case "$OS_SLUG:$tool" in
+    linux:cosign)
+      # Download pre-built binary from sigstore releases (no apt repo needed)
+      local arch_suffix=amd64
+      [[ "$ARCH_SLUG" = arm64 ]] && arch_suffix=arm64
+      curl -fsSL \
+        "https://github.com/sigstore/cosign/releases/latest/download/cosign-linux-${arch_suffix}" \
+        -o /usr/local/bin/cosign
+      chmod 0755 /usr/local/bin/cosign
+      ;;
+    linux:openssl)  _pkg_install openssl ;;
+    linux:sha256sum) _pkg_install coreutils ;;
+    darwin:cosign)  _brew install cosign ;;
+    darwin:openssl) _brew install openssl ;;
+    darwin:shasum)
+      die "shasum is pre-installed on macOS. Something is very wrong." ;;
+    *:systemctl)
+      die "systemctl not found. This installer requires a systemd-based Linux." ;;
+    *)
+      die "Don't know how to install '${tool}' on ${OS_SLUG}. Install it manually." ;;
+  esac
+  command -v "$tool" >/dev/null 2>&1 \
+    || die "Installation of '${tool}' appeared to succeed but binary not found in PATH."
+  success "${tool} installed."
 }
 
-prompt_yn() {
-    local message="$1" default="${2:-y}"
-    local value
-    if [ "$default" = "y" ]; then
-        printf "${BOLD}%s${NC} [Y/n]: " "$message" >&2
+# ── Phase 1: Preflight ─────────────────────────────────────────────────────────
+preflight() {
+  info "Running preflight checks..."
+
+  [[ "$(id -u)" -eq 0 ]] || die "This installer must be run as root (use sudo)."
+
+  local tools=(curl)
+  [[ "$SKIP_VERIFY" -eq 0 && -z "$LOCAL_BINARY" ]] && tools+=(cosign)
+  if [[ "$OS_SLUG" = linux ]]; then
+    tools+=(sha256sum systemctl)
+  else
+    tools+=(shasum)
+  fi
+  # openssl only needed when auto-generating TLS certs
+  if [[ -z "${RUNEVAULT_TLS_CERT_PATH:-}" || -z "${RUNEVAULT_TLS_KEY_PATH:-}" ]]; then
+    tools+=(openssl)
+  fi
+
+  # Collect missing tools (systemctl is never auto-installable — fail immediately)
+  local missing=()
+  for tool in "${tools[@]}"; do
+    command -v "$tool" >/dev/null 2>&1 && continue
+    [[ "$tool" = systemctl ]] \
+      && die "systemctl not found. This installer requires a systemd-based Linux."
+    missing+=("$tool")
+  done
+
+  if [[ ${#missing[@]} -gt 0 ]]; then
+    printf '\n'
+    warn "The following required tools are not installed:"
+    for tool in "${missing[@]}"; do printf '  - %s\n' "$tool"; done
+    printf '\n'
+
+    local answer=n
+    if [[ "$NON_INTERACTIVE" -eq 0 ]]; then
+      read -r -p "Install missing tools automatically? [y/N] " answer
     else
-        printf "${BOLD}%s${NC} [y/N]: " "$message" >&2
-    fi
-    read -r value
-    value="${value:-$default}"
-    case "$value" in
-        [Yy]*) return 0 ;;
-        *) return 1 ;;
-    esac
-}
-
-# ─── Arrow-key menu selector ────────────────────────────────────────────────
-
-select_menu() {
-    local options=("$@")
-    local count=${#options[@]}
-    local _sel=0
-
-    # Fallback: plain number input when terminal is dumb or unset
-    if [ -z "${TERM:-}" ] || [ "$TERM" = "dumb" ]; then
-        local i
-        for i in "${!options[@]}"; do
-            printf "  %d) %s\n" "$((i + 1))" "${options[$i]}" >&2
-        done
-        echo "" >&2
-        local choice
-        printf "${BOLD}Select${NC} [1]: " >&2
-        read -r choice
-        choice="${choice:-1}"
-        if [ "$choice" -ge 1 ] 2>/dev/null && [ "$choice" -le "$count" ] 2>/dev/null; then
-            echo "$((choice - 1))"
-        else
-            print_error "Invalid selection."; exit 1
-        fi
-        return
+      warn "Non-interactive mode: cannot auto-install missing tools."
     fi
 
-    # ── Draw the menu ──
-    _draw_menu() {
-        local i
-        for i in "${!options[@]}"; do
-            if [ "$i" -eq "$_sel" ]; then
-                printf "  ${GREEN}${BOLD}> %s${NC}\n" "${options[$i]}" >&2
-            else
-                printf "    %s\n" "${options[$i]}" >&2
-            fi
+    case "$answer" in
+      [Yy]*)
+        for tool in "${missing[@]}"; do
+          _install_tool "$tool"
         done
-    }
-
-    # ── Move cursor up to redraw ──
-    _erase_menu() {
-        local i
-        for (( i = 0; i < count; i++ )); do
-            printf '\033[1A\033[2K' >&2
+        ;;
+      *)
+        printf 'Install them manually and re-run the installer:\n' >&2
+        for tool in "${missing[@]}"; do
+          case "$OS_SLUG:$tool" in
+            linux:cosign)   printf '  cosign:    https://docs.sigstore.dev/cosign/system_config/installation/\n' >&2 ;;
+            linux:openssl)  printf '  openssl:   apt install openssl\n' >&2 ;;
+            linux:sha256sum) printf '  sha256sum: apt install coreutils\n' >&2 ;;
+            darwin:cosign)  printf '  cosign:    brew install cosign\n' >&2 ;;
+            darwin:openssl) printf '  openssl:   brew install openssl\n' >&2 ;;
+          esac
         done
-    }
-
-    printf '\033[?25l' >&2          # hide cursor
-    printf "  ${BOLD}↑↓ move  Enter confirm${NC}\n" >&2
-    _draw_menu
-
-    while true; do
-        local key=""
-        IFS= read -rsn1 key
-        if [ "$key" = $'\x1b' ]; then
-            local seq=""
-            IFS= read -rsn2 -t 1 seq || true
-            case "$seq" in
-                '[A') # Up arrow
-                    if [ "$_sel" -gt 0 ]; then
-                        _sel=$((_sel - 1))
-                    else
-                        _sel=$((count - 1))
-                    fi
-                    ;;
-                '[B') # Down arrow
-                    if [ "$_sel" -lt $((count - 1)) ]; then
-                        _sel=$((_sel + 1))
-                    else
-                        _sel=0
-                    fi
-                    ;;
-            esac
-            _erase_menu
-            _draw_menu
-        elif [ "$key" = "" ]; then
-            # Enter key
-            break
-        elif [ "$key" -ge 1 ] 2>/dev/null && [ "$key" -le "$count" ] 2>/dev/null; then
-            # Number key direct jump
-            _sel=$((key - 1))
-            _erase_menu
-            _draw_menu
-        fi
-    done
-
-    printf '\033[?25h' >&2          # show cursor
-
-    echo "$_sel"
+        exit 1
+        ;;
+    esac
+  fi
+
+  # Port availability (best-effort — skip gracefully if tools unavailable)
+  local port_occupied=0
+  if [[ "$OS_SLUG" = linux ]] && command -v ss >/dev/null 2>&1; then
+    ss -tlnp 2>/dev/null | grep -q ":${GRPC_PORT}" && port_occupied=1 || true
+  elif command -v lsof >/dev/null 2>&1; then
+    lsof -iTCP:"${GRPC_PORT}" -sTCP:LISTEN -P -n 2>/dev/null \
+      | grep -q ":${GRPC_PORT}" && port_occupied=1 || true
+  fi
+  if [[ "$port_occupied" -eq 1 ]]; then
+    if [[ "$OS_SLUG" = linux ]]; then
+      die "Port ${GRPC_PORT} is already in use. Stop the existing daemon first:
+       sudo systemctl stop runevault"
+    else
+      die "Port ${GRPC_PORT} is already in use. Stop the existing daemon first:
+       sudo launchctl bootout system/com.cryptolabinc.runevault"
+    fi
+  fi
+
+  # Version resolution (skip if using a local binary)
+  if [[ -z "$LOCAL_BINARY" && -z "$VERSION" ]]; then
+    info "Resolving latest release version..."
+    VERSION=$(curl -fsSL \
+      "https://api.github.com/repos/${REPO}/releases/latest" \
+      | grep '"tag_name"' \
+      | head -1 \
+      | sed 's/.*"tag_name": *"\([^"]*\)".*/\1/')
+    [[ -n "$VERSION" ]] || die "Failed to resolve latest version from GitHub API."
+    info "Latest version: ${VERSION}"
+  fi
+
+  # Already-installed version check (skip if --force or using a local binary)
+  if [[ "$FORCE" -eq 0 && -z "$LOCAL_BINARY" && -x "$BINARY_DEST" ]]; then
+    local installed_ver
+    installed_ver=$("$BINARY_DEST" version 2>/dev/null | grep -oE 'v[0-9]+\.[0-9]+\.[0-9]+[^ ]*' | head -1 || true)
+    if [[ -n "$installed_ver" && "$installed_ver" = "$VERSION" ]]; then
+      warn "runevault ${VERSION} is already installed. Use --force to reinstall."
+      exit 0
+    fi
+  fi
+
+  success "Preflight checks passed."
 }
 
-# ─── Resolve latest release version ──────────────────────────────────────────
-
-resolve_version() {
-    if [ -n "$VERSION_OVERRIDE" ]; then
-        print_step "Using version override: ${VERSION_OVERRIDE}"
-        VERSION="$VERSION_OVERRIDE"
-        DOCKER_TAG="$VERSION_OVERRIDE"
-        GITHUB_RAW_BASE="https://raw.githubusercontent.com/${REPO}/${VERSION}"
-        return
-    fi
-
-    print_step "Resolving latest release version..."
-    local api_response
-    api_response=$(curl -fsSL "https://api.github.com/repos/${REPO}/releases/latest" 2>/dev/null) || true
-    VERSION=$(echo "$api_response" | grep '"tag_name"' | sed -E 's/.*"([^"]+)".*/\1/') || true
+# ── Phase 2 & 3: Download and verify ──────────────────────────────────────────
+SCRATCH=""
+
+_curl_retry() {
+  local url=$1 dest=$2 i
+  for i in 1 2 3; do
+    curl -fsSL --connect-timeout 15 -o "$dest" "$url" && return 0
+    warn "Download attempt ${i} failed for $(basename "$url"). Retrying in 5s..."
+    sleep 5
+  done
+  die "Failed to download: ${url}"
+}
 
-    if [ -z "${VERSION:-}" ]; then
-        print_warn "No release found. Falling back to 'main' branch."
-        VERSION="main"
-        DOCKER_TAG="latest"
+_checksum_verify() {
+  local sums_file=$1 archive=$2 archive_name line
+  archive_name=$(basename "$archive")
+  line=$(grep -F "$archive_name" "$sums_file") \
+    || die "Archive '${archive_name}' not found in SHA256SUMS."
+  (
+    cd "$(dirname "$archive")"
+    if [[ "$OS_SLUG" = linux ]]; then
+      printf '%s\n' "$line" | sha256sum --check --quiet
     else
-        print_info "Latest release: ${VERSION}"
-        DOCKER_TAG="${VERSION}"
+      printf '%s\n' "$line" | shasum -a 256 --check --quiet
     fi
-
-    GITHUB_RAW_BASE="https://raw.githubusercontent.com/${REPO}/${VERSION}"
+  ) || die "Checksum verification failed for ${archive_name}."
 }
 
-# ─── Prerequisite checks ─────────────────────────────────────────────────────
+download_and_verify() {
+  SCRATCH=$(mktemp -d)
+  trap 'rm -rf "$SCRATCH"' EXIT
 
-check_command() {
-    local cmd="$1" install_hint="$2"
-    if ! command -v "$cmd" &>/dev/null; then
-        print_error "'$cmd' is not installed."
-        echo "  Install: $install_hint"
-        return 1
-    fi
-    print_info "$cmd found"
+  if [[ -n "$LOCAL_BINARY" ]]; then
+    info "Using local binary: ${LOCAL_BINARY}"
+    [[ -x "$LOCAL_BINARY" ]] || die "Local binary not executable: ${LOCAL_BINARY}"
+    cp "$LOCAL_BINARY" "$SCRATCH/runevault"
     return 0
+  fi
+
+  local archive="runevault_${VERSION}_${OS_SLUG}_${ARCH_SLUG}.tar.gz"
+  local base_url="https://github.com/${REPO}/releases/download/${VERSION}"
+
+  info "Downloading ${archive}..."
+  _curl_retry "${base_url}/${archive}"         "$SCRATCH/${archive}"
+  _curl_retry "${base_url}/SHA256SUMS"         "$SCRATCH/SHA256SUMS"
+  _curl_retry "${base_url}/SHA256SUMS.sig"     "$SCRATCH/SHA256SUMS.sig"
+  _curl_retry "${base_url}/SHA256SUMS.pem"     "$SCRATCH/SHA256SUMS.pem"
+
+  if [[ "$SKIP_VERIFY" -eq 1 ]]; then
+    warn "SKIP_VERIFY=1: skipping cosign verification (development only)."
+  else
+    info "Verifying release signature..."
+    local cosign_err
+    cosign_err=$(mktemp)
+    cosign verify-blob \
+      --signature   "$SCRATCH/SHA256SUMS.sig" \
+      --certificate "$SCRATCH/SHA256SUMS.pem" \
+      --certificate-oidc-issuer "$OIDC_ISSUER" \
+      --certificate-identity-regexp "$CERT_REGEXP" \
+      "$SCRATCH/SHA256SUMS" 2>"$cosign_err" \
+      || { cat "$cosign_err" >&2
+           die "Signature verification failed — aborting before any installation."; }
+    success "Signature verified."
+  fi
+
+  info "Verifying checksum..."
+  _checksum_verify "$SCRATCH/SHA256SUMS" "$SCRATCH/${archive}"
+  success "Checksum verified."
+
+  info "Extracting binary..."
+  tar -xzf "$SCRATCH/${archive}" -C "$SCRATCH" ./runevault
+  "$SCRATCH/runevault" version >/dev/null 2>&1 \
+    || die "Extracted binary failed smoke test."
 }
 
-check_prerequisites_local() {
-    print_step "Checking prerequisites..."
-    local missing=0
-    check_command docker "https://docs.docker.com/get-docker/" || missing=1
-    check_command openssl "apt install openssl / brew install openssl" || missing=1
-    check_command curl "apt install curl / brew install curl" || missing=1
-
-    # docker compose (v2 plugin)
-    if ! docker compose version &>/dev/null 2>&1; then
-        print_error "'docker compose' (v2 plugin) is not available."
-        echo "  Install: https://docs.docker.com/compose/install/"
-        missing=1
+# ── Phase 4: System setup ──────────────────────────────────────────────────────
+_create_system_group() {
+  if [[ "$OS_SLUG" = linux ]]; then
+    if ! getent group "$SERVICE_USER" >/dev/null 2>&1; then
+      groupadd --system "$SERVICE_USER"
+      success "System group '${SERVICE_USER}' created."
     else
-        print_info "docker compose found"
-    fi
-
-    if [ "$missing" -eq 1 ]; then
-        echo ""
-        print_error "Please install the missing prerequisites and re-run."
-        exit 1
-    fi
-
-    # Check Docker daemon
-    if ! docker info &>/dev/null 2>&1; then
-        print_error "Cannot connect to Docker daemon. Is Docker running?"
-        echo "  Fix: systemctl start docker"
-        exit 1
+      info "System group '${SERVICE_USER}' already exists."
+    fi
+  else
+    if ! dscl . -read /Groups/"$SERVICE_USER" >/dev/null 2>&1; then
+      local gid=490
+      while dscl . -list /Groups PrimaryGroupID 2>/dev/null \
+            | awk '{print $2}' | grep -qx "$gid"; do
+        gid=$((gid - 1))
+      done
+      dscl . -create /Groups/"$SERVICE_USER"
+      dscl . -create /Groups/"$SERVICE_USER" PrimaryGroupID "$gid"
+      dscl . -create /Groups/"$SERVICE_USER" RealName "Rune Vault Admin Group"
+      success "System group '${SERVICE_USER}' created (GID=${gid})."
+    else
+      info "System group '${SERVICE_USER}' already exists."
     fi
+  fi
 }
 
-check_prerequisites_csp() {
-    local provider="$1"
-    print_step "Checking prerequisites..."
-
-    local missing=0
-    check_command terraform "https://developer.hashicorp.com/terraform/install" || missing=1
-    check_command curl "apt install curl / brew install curl" || missing=1
-    check_command openssl "apt install openssl / brew install openssl" || missing=1
-
-    case "$provider" in
-        aws) check_command aws "https://aws.amazon.com/cli/" || missing=1 ;;
-        gcp) check_command gcloud "https://cloud.google.com/sdk/docs/install" || missing=1 ;;
-        oci) check_command oci "https://docs.oracle.com/en-us/iaas/Content/API/SDKDocs/cliinstall.htm" || missing=1 ;;
-    esac
-
-    if [ "$missing" -eq 1 ]; then
-        echo ""
-        print_error "Please install the missing prerequisites and re-run."
-        exit 1
+_create_system_user() {
+  if [[ "$OS_SLUG" = linux ]]; then
+    if ! id "$SERVICE_USER" >/dev/null 2>&1; then
+      useradd --system --no-create-home --shell /usr/sbin/nologin \
+        -g "$SERVICE_USER" --no-user-group "$SERVICE_USER"
+      success "System user '${SERVICE_USER}' created."
+    else
+      info "System user '${SERVICE_USER}' already exists."
+    fi
+  else
+    if ! id "$SERVICE_USER" >/dev/null 2>&1; then
+      local uid=490
+      while dscl . -list /Users UniqueID 2>/dev/null \
+            | awk '{print $2}' | grep -qx "$uid"; do
+        uid=$((uid - 1))
+      done
+      local gid
+      gid=$(dscl . -read /Groups/"$SERVICE_USER" PrimaryGroupID 2>/dev/null \
+            | awk '{print $2}')
+      dscl . -create /Users/"$SERVICE_USER"
+      dscl . -create /Users/"$SERVICE_USER" UserShell        /usr/bin/false
+      dscl . -create /Users/"$SERVICE_USER" RealName         "Rune Vault Service"
+      dscl . -create /Users/"$SERVICE_USER" UniqueID         "$uid"
+      dscl . -create /Users/"$SERVICE_USER" PrimaryGroupID   "$gid"
+      dscl . -create /Users/"$SERVICE_USER" NFSHomeDirectory /var/empty
+      dscl . -create /Users/"$SERVICE_USER" IsHidden         1
+      success "System user '${SERVICE_USER}' created (UID=${uid})."
+    else
+      info "System user '${SERVICE_USER}' already exists."
     fi
+  fi
 }
 
-# ─── Interactive prompts ─────────────────────────────────────────────────────
-
-choose_deploy_target() {
-    print_step "Select deployment target"
-    local options=("Local (This machine)" "AWS" "GCP" "OCI")
-    local targets=("local" "aws" "gcp" "oci")
-    local selected
-    selected=$(select_menu "${options[@]}")
-    DEPLOY_TARGET="${targets[$selected]}"
-    print_info "Deployment target: ${DEPLOY_TARGET}"
+_add_invoking_user_to_group() {
+  local invoking_user="${SUDO_USER:-}"
+  [[ -z "$invoking_user" ]] && return 0
+  if [[ "$OS_SLUG" = linux ]]; then
+    usermod -aG "$SERVICE_USER" "$invoking_user"
+  else
+    dscl . -append /Groups/"$SERVICE_USER" GroupMembership "$invoking_user" 2>/dev/null || true
+  fi
+  success "Added '${invoking_user}' to group '${SERVICE_USER}'."
 }
 
-prompt_install_dir() {
-    print_step "Installation directory"
-    local default_dir="$DEFAULT_INSTALL_DIR"
-    if [ "$DEPLOY_TARGET" != "local" ]; then
-        default_dir="$HOME/rune-vault-${DEPLOY_TARGET}"
-        echo "  Terraform files, state, and SSH keys are stored here."
-        echo "  Keep this directory to manage (update/destroy) your deployment."
-        echo ""
-    fi
-    prompt INSTALL_DIR "Directory" "$default_dir"
+setup_system() {
+  info "Setting up system..."
+
+  if [[ "$SKIP_SERVICE" -eq 0 ]]; then
+    _create_system_group
+    _create_system_user
+  fi
+
+  # /opt may not exist on fresh macOS
+  [[ "$OS_SLUG" = darwin ]] && mkdir -p /opt
+
+  local dir
+  for dir in \
+    "${INSTALL_PREFIX}" \
+    "${INSTALL_PREFIX}/configs" \
+    "${INSTALL_PREFIX}/certs" \
+    "${INSTALL_PREFIX}/logs"
+  do
+    mkdir -p "$dir"
+    chmod 0750 "$dir"
+    [[ "$SKIP_SERVICE" -eq 0 ]] && chown "${SERVICE_USER}:${SERVICE_USER}" "$dir"
+  done
+  # vault-keys stays 0700: secret FHE key material must never be group-readable.
+  mkdir -p "${INSTALL_PREFIX}/vault-keys"
+  chmod 0700 "${INSTALL_PREFIX}/vault-keys"
+  [[ "$SKIP_SERVICE" -eq 0 ]] && chown "${SERVICE_USER}:${SERVICE_USER}" "${INSTALL_PREFIX}/vault-keys"
+
+  success "Directories created under ${INSTALL_PREFIX}/"
+
+  install -m 0755 "$SCRATCH/runevault" "$BINARY_DEST"
+  success "Binary installed: ${BINARY_DEST}"
+
+  [[ "$SKIP_SERVICE" -eq 0 ]] && _add_invoking_user_to_group
 }
 
-prompt_tls_mode() {
-    print_step "TLS configuration"
-    local options=("Generate self-signed certificate" "No TLS (not recommended)")
-    local modes=("self-signed" "none")
-    local selected
-    selected=$(select_menu "${options[@]}")
-    TLS_MODE="${modes[$selected]}"
-
-    if [ "$TLS_MODE" = "self-signed" ]; then
-        echo ""
-        prompt TLS_HOSTNAME "Domain name for the certificate (leave empty if none)" ""
-    fi
-
-    if [ "$TLS_MODE" = "none" ]; then
-        print_warn "Running without TLS. gRPC traffic will be unencrypted."
-        print_warn "This is NOT recommended for production."
-    fi
+# ── Phase 5: TLS certificates ──────────────────────────────────────────────────
+generate_tls_certs() {
+  local cert_dir="${INSTALL_PREFIX}/certs"
+
+  # BYO cert: copy provided files and skip generation
+  if [[ -n "${RUNEVAULT_TLS_CERT_PATH:-}" && -n "${RUNEVAULT_TLS_KEY_PATH:-}" ]]; then
+    cp "${RUNEVAULT_TLS_CERT_PATH}" "${cert_dir}/server.pem"
+    cp "${RUNEVAULT_TLS_KEY_PATH}"  "${cert_dir}/server.key"
+    chmod 0644 "${cert_dir}/server.pem"
+    chmod 0600 "${cert_dir}/server.key"
+    [[ "$SKIP_SERVICE" -eq 0 ]] \
+      && chown "$SERVICE_USER" "${cert_dir}/server.pem" "${cert_dir}/server.key"
+    info "Using provided TLS certificates."
+    return 0
+  fi
 
-    print_info "TLS mode: ${TLS_MODE}"
+  if [[ -f "${cert_dir}/server.pem" && "$FORCE" -eq 0 ]]; then
+    info "TLS certificates already exist (use --force to regenerate)."
+    return 0
+  fi
+
+  info "Generating self-signed TLS certificates..."
+
+  local public_ip=""
+  public_ip=$(curl -4 -sf --connect-timeout 5 ifconfig.me 2>/dev/null || true)
+  [[ -n "$public_ip" ]] && info "Public IP detected: ${public_ip}"
+
+  # Write openssl config via printf (avoids heredoc issues in piped execution)
+  local tmpconf
+  tmpconf=$(mktemp)
+  printf '[req]\ndistinguished_name = req_dn\nreq_extensions = v3_req\nprompt = no\n\n' \
+    > "$tmpconf"
+  printf '[req_dn]\nCN = runevault\n\n'              >> "$tmpconf"
+  printf '[v3_req]\nsubjectAltName = @alt_names\n\n' >> "$tmpconf"
+  printf '[alt_names]\n'                             >> "$tmpconf"
+  printf 'DNS.1 = localhost\n'                       >> "$tmpconf"
+  printf 'DNS.2 = vault\n'                           >> "$tmpconf"
+  printf 'DNS.3 = runevault\n'                       >> "$tmpconf"
+  printf 'IP.1  = 127.0.0.1\n'                       >> "$tmpconf"
+  [[ -n "$public_ip" ]] && printf 'IP.2  = %s\n' "$public_ip" >> "$tmpconf"
+
+  openssl genrsa -out "${cert_dir}/ca.key" 4096 2>/dev/null
+  openssl req -new -x509 \
+    -key "${cert_dir}/ca.key" \
+    -out "${cert_dir}/ca.pem" \
+    -days 3650 -subj "/CN=Rune-Vault CA" -sha256 2>/dev/null
+
+  openssl genrsa -out "${cert_dir}/server.key" 2048 2>/dev/null
+  local csr="${cert_dir}/server.csr"
+  openssl req -new \
+    -key "${cert_dir}/server.key" -out "$csr" -config "$tmpconf" 2>/dev/null
+  openssl x509 -req \
+    -in "$csr" \
+    -CA "${cert_dir}/ca.pem" -CAkey "${cert_dir}/ca.key" -CAcreateserial \
+    -out "${cert_dir}/server.pem" \
+    -days 825 -sha256 -extfile "$tmpconf" -extensions v3_req 2>/dev/null
+
+  rm -f "$tmpconf" "$csr" "${cert_dir}/ca.srl"
+
+  chmod 0600 "${cert_dir}/ca.key" "${cert_dir}/server.key"
+  chmod 0644 "${cert_dir}/ca.pem" "${cert_dir}/server.pem"
+  if [[ "$SKIP_SERVICE" -eq 0 ]]; then
+    chown "${SERVICE_USER}:${SERVICE_USER}" \
+      "${cert_dir}/ca.key" "${cert_dir}/ca.pem" \
+      "${cert_dir}/server.key" "${cert_dir}/server.pem"
+  fi
+
+  success "TLS certificates generated."
 }
 
-prompt_envector_config() {
-    print_step "enVector Cloud configuration"
-    echo "  Create your enVector cluster at https://envector.io before proceeding."
-    echo "  You will need the endpoint URL and API key from the dashboard."
-    echo "  Index name is used to store and retrieve your team's organizational memory."
-    echo ""
-    prompt ENVECTOR_ENDPOINT "enVector endpoint (e.g. cluster-id.clusters.envector.io)"
-    prompt ENVECTOR_API_KEY "enVector API key (e.g. aBcDE_12345_xxxxx)"
-    prompt VAULT_INDEX_NAME "Index name" "runecontext"
-
-    if [ -z "$ENVECTOR_ENDPOINT" ] || [ -z "$ENVECTOR_API_KEY" ]; then
-        print_error "enVector endpoint and API key are required."
-        exit 1
-    fi
-    if [ -z "$VAULT_INDEX_NAME" ]; then
-        print_error "Index name is required."
+# ── Phase 6: Configuration ─────────────────────────────────────────────────────
+collect_and_write_config() {
+  local conf_file="${INSTALL_PREFIX}/configs/runevault.conf"
+
+  if [[ -f "$conf_file" && "$FORCE" -eq 0 ]]; then
+    info "Config already exists (use --force to overwrite): ${conf_file}"
+  else
+    local team_name="${RUNEVAULT_TEAM_NAME:-}"
+    local envector_endpoint="${RUNEVAULT_ENVECTOR_ENDPOINT:-}"
+    local envector_api_key="${RUNEVAULT_ENVECTOR_API_KEY:-}"
+    local envector_api_key_file="${RUNEVAULT_ENVECTOR_API_KEY_FILE:-}"
+    local team_secret="${RUNEVAULT_TEAM_SECRET:-}"
+
+    if [[ "$NON_INTERACTIVE" -eq 0 ]]; then
+      printf '\n'
+      printf '══════════════════════════════════════════════════════════\n'
+      printf '  Vault configuration\n'
+      printf '══════════════════════════════════════════════════════════\n'
+      printf '\n'
+      [[ -z "$team_name" ]] \
+        && read -r -p "Team name (vault index identifier): " team_name
+      [[ -z "$envector_endpoint" ]] \
+        && read -r -p "enVector endpoint URL: " envector_endpoint
+      if [[ -z "$envector_api_key" && -z "$envector_api_key_file" ]]; then
+        read -r -p "enVector API key: " envector_api_key
+      fi
+      printf '\n'
+    else
+      local missing=()
+      [[ -z "$team_name" ]]         && missing+=("RUNEVAULT_TEAM_NAME")
+      [[ -z "$envector_endpoint" ]] && missing+=("RUNEVAULT_ENVECTOR_ENDPOINT")
+      [[ -z "$envector_api_key" && -z "$envector_api_key_file" ]] \
+        && missing+=("RUNEVAULT_ENVECTOR_API_KEY or RUNEVAULT_ENVECTOR_API_KEY_FILE")
+      if [[ ${#missing[@]} -gt 0 ]]; then
+        printf 'ERROR: Missing required env vars for non-interactive install:\n' >&2
+        for v in "${missing[@]}"; do printf '  %s\n' "$v" >&2; done
         exit 1
-    fi
-    print_info "enVector endpoint: ${ENVECTOR_ENDPOINT}"
-}
-
-prompt_csp_config() {
-    prompt TEAM_NAME "Team name (used for resource naming)" "default"
-
-    case "$DEPLOY_TARGET" in
-        aws)
-            prompt CSP_REGION "AWS region" "us-east-1"
-            ;;
-        gcp)
-            prompt CSP_REGION "GCP region" "us-central1"
-            prompt GCP_PROJECT_ID "GCP project ID"
-            if [ -z "$GCP_PROJECT_ID" ]; then
-                print_error "GCP project ID is required."; exit 1
-            fi
-            ;;
-        oci)
-            prompt CSP_REGION "OCI region" "us-ashburn-1"
-            prompt OCI_COMPARTMENT_ID "OCI compartment OCID"
-            if [ -z "$OCI_COMPARTMENT_ID" ]; then
-                print_error "OCI compartment OCID is required."; exit 1
-            fi
-            ;;
-    esac
-}
-
-generate_team_secret() {
-    VAULT_TEAM_SECRET_VALUE="evt_$(openssl rand -hex 32)"
-    print_info "Team secret generated."
-}
-
-generate_config_files() {
-    local dir="$1"
-
-    cat > "$dir/vault-roles.yml" <<'ROLESEOF'
-roles:
-  admin:
-    scope: [get_public_key, decrypt_scores, decrypt_metadata, manage_tokens]
-    top_k: 50
-    rate_limit: 150/60s
-  member:
-    scope: [get_public_key, decrypt_scores, decrypt_metadata]
-    top_k: 10
-    rate_limit: 30/60s
-ROLESEOF
-
-    cat > "$dir/vault-tokens.yml" <<'TOKENSEOF'
-tokens: []
-TOKENSEOF
-
-    chmod 600 "$dir/vault-roles.yml" "$dir/vault-tokens.yml"
-    print_info "Token/role config files created."
-}
-
-setup_runevault_alias() {
-    if [ -z "${SUDO_USER:-}" ]; then
-        return
-    fi
-
-    # Add user to docker group
-    if command -v usermod >/dev/null 2>&1; then
-        usermod -aG docker "$SUDO_USER" 2>/dev/null || true
-    fi
-
-    # Detect shell config
-    local user_home
-    user_home="$(eval echo ~"$SUDO_USER")"
-    local shell_rc=""
-    if [ -f "$user_home/.zshrc" ]; then
-        shell_rc="$user_home/.zshrc"
-    elif [ -f "$user_home/.bashrc" ]; then
-        shell_rc="$user_home/.bashrc"
+      fi
     fi
 
-    if [ -n "$shell_rc" ]; then
-        if ! grep -q 'alias runevault=' "$shell_rc" 2>/dev/null; then
-            echo '' >> "$shell_rc"
-            echo '# Rune-Vault admin CLI' >> "$shell_rc"
-            echo 'alias runevault="docker exec -it rune-vault python3 /app/vault_admin_cli.py"' >> "$shell_rc"
-            print_info "runevault alias added to ${shell_rc}"
-            print_warn "Run 'exec \$SHELL' to reload your shell and enable the runevault command."
-        fi
+    if [[ -z "$team_secret" ]]; then
+      team_secret=$(LC_ALL=C tr -dc 'a-f0-9' < /dev/urandom | head -c 64; true)
     fi
-}
-
-# ─── Confirmation summary ────────────────────────────────────────────────────
-
-show_confirmation() {
-    print_header "Configuration Summary"
-    echo "  Deployment target : ${DEPLOY_TARGET}"
-    echo "  Install directory : ${INSTALL_DIR}"
-    echo "  TLS mode          : ${TLS_MODE}"
-    [ -n "${TLS_HOSTNAME:-}" ] && echo "  TLS domain        : ${TLS_HOSTNAME}"
-    echo "  Team secret       : (auto-generated in .env)"
-    echo "  enVector endpoint : ${ENVECTOR_ENDPOINT}"
-    echo "  Index name        : ${VAULT_INDEX_NAME}"
-    if [ "$DEPLOY_TARGET" != "local" ]; then
-        echo "  Team name         : ${TEAM_NAME}"
-        echo "  Region            : ${CSP_REGION}"
-        [ "${DEPLOY_TARGET}" = "gcp" ] && echo "  GCP project       : ${GCP_PROJECT_ID}"
-        [ "${DEPLOY_TARGET}" = "oci" ] && echo "  OCI compartment   : ${OCI_COMPARTMENT_ID}"
-    fi
-    echo ""
-
-    if ! prompt_yn "Proceed with deployment?"; then
-        print_warn "Aborted."
-        exit 0
-    fi
-}
-
-# ─── File download helper ────────────────────────────────────────────────────
-
-download_file() {
-    local url="$1" dest="$2"
-    local attempt max_attempts=3
-    for attempt in $(seq 1 $max_attempts); do
-        if curl -fsSL "$url" -o "$dest"; then
-            return 0
-        fi
-        [ "$attempt" -lt "$max_attempts" ] && sleep 1
-    done
-    print_error "Failed to download (after ${max_attempts} attempts): $url"
-    exit 1
-}
-
-# ─── TLS handling ─────────────────────────────────────────────────────────────
-
-setup_tls() {
-    local certs_dir="$INSTALL_DIR/certs"
-    mkdir -p "$certs_dir"
-
-    case "$TLS_MODE" in
-        self-signed)
-            print_step "Generating self-signed certificates..."
-            download_file "${GITHUB_RAW_BASE}/scripts/generate-certs.sh" "$certs_dir/generate-certs.sh"
-            chmod +x "$certs_dir/generate-certs.sh"
-            (cd "$certs_dir" && bash generate-certs.sh . "${TLS_HOSTNAME:-localhost}")
-            TLS_CERT_PATH="$certs_dir/server.pem"
-            TLS_KEY_PATH="$certs_dir/server.key"
-            TLS_CA_PATH="$certs_dir/ca.pem"
-            print_info "Self-signed certificates generated in ${certs_dir}/"
-            ;;
-        none)
-            print_warn "Skipping TLS setup."
-            TLS_CERT_PATH=""
-            TLS_KEY_PATH=""
-            TLS_CA_PATH=""
-            ;;
-    esac
-}
 
-# ─── Generate .env file ──────────────────────────────────────────────────────
+    [[ -n "$team_name" ]]         || die "team_name is required."
+    [[ -n "$envector_endpoint" ]] || die "envector_endpoint is required."
+    [[ -n "$envector_api_key" || -n "$envector_api_key_file" ]] \
+      || die "enVector API key or key file is required."
 
-generate_env_file() {
-    local env_file="$INSTALL_DIR/.env"
-
-    cat > "$env_file" <<ENVEOF
-# Rune-Vault configuration — generated by install.sh
-VAULT_TEAM_SECRET=${VAULT_TEAM_SECRET_VALUE}
-VAULT_INDEX_NAME=${VAULT_INDEX_NAME}
-ENVECTOR_ENDPOINT=${ENVECTOR_ENDPOINT}
-ENVECTOR_API_KEY=${ENVECTOR_API_KEY}
-EMBEDDING_DIM=1024
-RUNE_VAULT_TAG=${DOCKER_TAG}
-ENVEOF
-
-    if [ "$TLS_MODE" = "none" ]; then
-        echo "VAULT_TLS_DISABLE=true" >> "$env_file"
+    local api_key_line
+    if [[ -n "$envector_api_key_file" ]]; then
+      api_key_line="  api_key_file: ${envector_api_key_file}"
     else
-        cat >> "$env_file" <<TLSEOF
-VAULT_TLS_CERT=/app/certs/server.pem
-VAULT_TLS_KEY=/app/certs/server.key
-TLSEOF
-    fi
-
-    chmod 600 "$env_file"
-    print_info ".env file created (mode 600)."
+      api_key_line="  api_key: ${envector_api_key}"
+    fi
+
+    info "Writing ${conf_file}..."
+    printf '%s\n' \
+      "server:" \
+      "  grpc:" \
+      "    host: 0.0.0.0" \
+      "    port: ${GRPC_PORT}" \
+      "    tls:" \
+      "      cert: ${INSTALL_PREFIX}/certs/server.pem" \
+      "      key: ${INSTALL_PREFIX}/certs/server.key" \
+      "      disable: false" \
+      "  admin:" \
+      "    socket: ${INSTALL_PREFIX}/admin.sock" \
+      "" \
+      "keys:" \
+      "  path: ${INSTALL_PREFIX}/vault-keys" \
+      "  index_name: ${team_name}" \
+      "  embedding_dim: 1024" \
+      "" \
+      "envector:" \
+      "  endpoint: ${envector_endpoint}" \
+      "${api_key_line}" \
+      "" \
+      "tokens:" \
+      "  team_secret: ${team_secret}" \
+      "  roles_file: ${INSTALL_PREFIX}/configs/roles.yml" \
+      "  tokens_file: ${INSTALL_PREFIX}/configs/tokens.yml" \
+      "" \
+      "audit:" \
+      "  mode: file+stdout" \
+      "  path: ${INSTALL_PREFIX}/logs/audit.log" \
+      > "$conf_file"
+    chmod 0640 "$conf_file"
+    [[ "$SKIP_SERVICE" -eq 0 ]] && chown "${SERVICE_USER}:${SERVICE_USER}" "$conf_file"
+
+  fi
+
+  # roles.yml
+  local roles_file="${INSTALL_PREFIX}/configs/roles.yml"
+  if [[ ! -f "$roles_file" || "$FORCE" -eq 1 ]]; then
+    printf '%s\n' \
+      "roles:" \
+      "  admin:" \
+      "    scope:" \
+      "      - get_public_key" \
+      "      - decrypt_scores" \
+      "      - decrypt_metadata" \
+      "      - manage_tokens" \
+      "    top_k: 50" \
+      "    rate_limit: 150/60s" \
+      "  member:" \
+      "    scope:" \
+      "      - get_public_key" \
+      "      - decrypt_scores" \
+      "      - decrypt_metadata" \
+      "    top_k: 10" \
+      "    rate_limit: 30/60s" \
+      > "$roles_file"
+    chmod 0640 "$roles_file"
+    [[ "$SKIP_SERVICE" -eq 0 ]] && chown "${SERVICE_USER}:${SERVICE_USER}" "$roles_file"
+  fi
+
+  # tokens.yml
+  local tokens_file="${INSTALL_PREFIX}/configs/tokens.yml"
+  if [[ ! -f "$tokens_file" || "$FORCE" -eq 1 ]]; then
+    printf 'tokens: []\n' > "$tokens_file"
+    chmod 0640 "$tokens_file"
+    [[ "$SKIP_SERVICE" -eq 0 ]] && chown "${SERVICE_USER}:${SERVICE_USER}" "$tokens_file"
+  fi
+
+  success "Configuration written."
 }
 
-# ─── Local deployment ─────────────────────────────────────────────────────────
-
-deploy_local() {
-    print_header "Deploying Rune-Vault (Local)"
-
-    # Handle existing installation
-    if [ -d "$INSTALL_DIR" ]; then
-        print_warn "Existing installation found at ${INSTALL_DIR}"
-        if prompt_yn "Remove existing installation and reinstall?" "n"; then
-            print_step "Removing existing installation..."
-            (cd "$INSTALL_DIR" && docker compose down 2>/dev/null) || true
-            rm -rf "$INSTALL_DIR"
-            print_info "Previous installation removed."
-        else
-            print_warn "Aborted."
-            exit 0
-        fi
-    fi
-
-    # Create directory structure
-    mkdir -p "$INSTALL_DIR"/{certs,backups,logs}
-    print_info "Directory structure created: ${INSTALL_DIR}/"
-
-    # Download docker-compose.yml
-    print_step "Downloading docker-compose.yml..."
-    download_file "${GITHUB_RAW_BASE}/vault/docker-compose.yml" "$INSTALL_DIR/docker-compose.yml"
-    # Pin image to the resolved version
-    sed -i.bak "s|image:.*rune-vault:.*|image: ${DOCKER_IMAGE}:${DOCKER_TAG}|" "$INSTALL_DIR/docker-compose.yml"
-    rm -f "$INSTALL_DIR/docker-compose.yml.bak"
-    print_info "docker-compose.yml downloaded."
-
-    # TLS
-    setup_tls
-
-    # Generate .env and config files
-    generate_env_file
-    generate_config_files "$INSTALL_DIR"
-
-    # Restore ownership to the invoking user (files were created as root via sudo)
-    if [ -n "${SUDO_USER:-}" ]; then
-        chown -R "$SUDO_USER" "$INSTALL_DIR"
-    fi
-
-    # Pull image
-    print_step "Pulling Docker image..."
-    (cd "$INSTALL_DIR" && docker compose pull)
-    print_info "Docker image pulled."
-
-    # Start container
-    print_step "Starting Rune-Vault..."
-    (cd "$INSTALL_DIR" && docker compose up -d)
-    print_info "Container started."
-
-    # Health check
-    print_step "Waiting for Vault to become healthy..."
-    local elapsed=0
-    local timeout=60
-    while [ $elapsed -lt $timeout ]; do
-        if docker exec rune-vault curl -sf http://localhost:8081/health 2>/dev/null; then
-            print_info "Vault is healthy!"
-
-            # Set up runevault alias for admin CLI
-            setup_runevault_alias
-            return 0
-        fi
-        sleep 2
-        elapsed=$((elapsed + 2))
-        printf "."
-    done
-
-    echo ""
-    print_error "Vault did not become healthy within ${timeout}s."
-    print_warn "Container logs:"
-    docker logs rune-vault 2>&1 | tail -30
-    exit 1
-}
-
-# ─── CSP deployment ───────────────────────────────────────────────────────────
-
-deploy_csp() {
-    local provider="$DEPLOY_TARGET"
-    print_header "Deploying Rune-Vault (${provider})"
-
-    local tf_dir="$INSTALL_DIR/deployment"
-    mkdir -p "$tf_dir"
-    # Ensure the original user owns the deployment directory for terraform
-    if [ -n "${SUDO_USER:-}" ]; then
-        chown -R "$SUDO_USER" "$INSTALL_DIR"
-    fi
-
-    # Download Terraform files
-    print_step "Downloading Terraform configuration..."
-    download_file "${GITHUB_RAW_BASE}/deployment/${provider}/main.tf" "$tf_dir/main.tf"
-    if [ "$provider" = "aws" ]; then
-        download_file "${GITHUB_RAW_BASE}/deployment/${provider}/cloud-init.yaml" "$tf_dir/cloud-init.yaml"
-        sed -i.bak "s|image:.*rune-vault:.*|image: ${DOCKER_IMAGE}:${DOCKER_TAG}|" "$tf_dir/cloud-init.yaml"
-        rm -f "$tf_dir/cloud-init.yaml.bak"
-    else
-        download_file "${GITHUB_RAW_BASE}/deployment/${provider}/startup-script.sh" "$tf_dir/startup-script.sh"
-        sed -i.bak "s|image:.*rune-vault:.*|image: ${DOCKER_IMAGE}:${DOCKER_TAG}|" "$tf_dir/startup-script.sh"
-        rm -f "$tf_dir/startup-script.sh.bak"
-    fi
-    print_info "Terraform files downloaded."
-
-    # Generate SSH key pair for EC2 access
-    local ssh_key_path="$INSTALL_DIR/ssh_key"
-    if [ ! -f "$ssh_key_path" ]; then
-        print_step "Generating SSH key pair..."
-        ssh-keygen -t ed25519 -f "$ssh_key_path" -N "" -q
-        chmod 600 "$ssh_key_path"
-        chmod 644 "${ssh_key_path}.pub"
-        print_info "SSH key generated: ${ssh_key_path}"
-    fi
-    local public_key
-    public_key=$(cat "${ssh_key_path}.pub")
-
-    # Generate terraform.tfvars (use printf to avoid heredoc escaping issues)
-    print_step "Generating terraform.tfvars..."
-    escape_tf() { printf '%s' "$1" | sed 's/\\/\\\\/g; s/"/\\"/g'; }
-    {
-        printf 'team_secret        = "%s"\n' "$(escape_tf "$VAULT_TEAM_SECRET_VALUE")"
-        printf 'team_name          = "%s"\n' "$(escape_tf "$TEAM_NAME")"
-        printf 'region             = "%s"\n' "$(escape_tf "$CSP_REGION")"
-        printf 'tls_mode           = "%s"\n' "$(escape_tf "$TLS_MODE")"
-        printf 'tls_hostname       = "%s"\n' "$(escape_tf "${TLS_HOSTNAME:-}")"
-        printf 'envector_endpoint  = "%s"\n' "$(escape_tf "$ENVECTOR_ENDPOINT")"
-        printf 'envector_api_key   = "%s"\n' "$(escape_tf "$ENVECTOR_API_KEY")"
-        printf 'vault_index_name   = "%s"\n' "$(escape_tf "$VAULT_INDEX_NAME")"
-        printf 'public_key         = "%s"\n' "$(escape_tf "$public_key")"
-        case "$provider" in
-            gcp) printf 'project_id         = "%s"\n' "$(escape_tf "$GCP_PROJECT_ID")" ;;
-            oci) printf 'compartment_id     = "%s"\n' "$(escape_tf "$OCI_COMPARTMENT_ID")" ;;
-        esac
-    } > "$tf_dir/terraform.tfvars"
-
-    chmod 600 "$tf_dir/terraform.tfvars"
-    if [ -n "${SUDO_USER:-}" ]; then
-        chown -R "$SUDO_USER" "$INSTALL_DIR"
-    fi
-    print_info "terraform.tfvars created."
-
-    # Terraform init & apply (run as the original user to preserve CLI auth)
-    print_step "Running Terraform..."
-    local tf_run="terraform"
-    if [ -n "${SUDO_USER:-}" ]; then
-        tf_run="sudo -u $SUDO_USER terraform"
-    fi
-    (cd "$tf_dir" && $tf_run init)
-    (cd "$tf_dir" && $tf_run apply -auto-approve)
-
-    # Capture outputs
-    VAULT_PUBLIC_IP=$(cd "$tf_dir" && $tf_run output -raw vault_public_ip 2>/dev/null) || true
-    local vault_url
-    vault_url=$(cd "$tf_dir" && $tf_run output -raw vault_url 2>/dev/null) || true
-
-    print_info "Infrastructure provisioned."
-
-    # Health polling — wait for cloud-init to finish and Vault to start
-    if [ -n "$VAULT_PUBLIC_IP" ]; then
-        print_step "Waiting for Vault to become reachable (up to 10 min)..."
-        local elapsed=0
-        local timeout=600
-        while [ $elapsed -lt $timeout ]; do
-            if bash -c "echo >/dev/tcp/${VAULT_PUBLIC_IP}/50051" 2>/dev/null; then
-                print_info "Vault is reachable at ${VAULT_PUBLIC_IP}:50051!"
-
-                # Download ca.pem from remote server
-                if [ "$TLS_MODE" = "self-signed" ]; then
-                    mkdir -p "$INSTALL_DIR/certs"
-                    if [ -n "${SUDO_USER:-}" ]; then
-                        chown -R "$SUDO_USER" "$INSTALL_DIR/certs"
-                    fi
-                    local scp_opts="-i $ssh_key_path -o StrictHostKeyChecking=no -o ConnectTimeout=15 -o BatchMode=yes"
-                    local scp_prefix=""
-                    if [ -n "${SUDO_USER:-}" ]; then
-                        scp_prefix="sudo -u $SUDO_USER"
-                    fi
-                    # Retry SCP (SSH may not be ready immediately)
-                    local downloaded=0
-                    for attempt in 1 2 3; do
-                        sleep 10
-                        for ssh_user in ubuntu opc; do
-                            if $scp_prefix scp $scp_opts \
-                                "${ssh_user}@${VAULT_PUBLIC_IP}:/opt/rune/certs/ca.pem" \
-                                "$INSTALL_DIR/certs/ca.pem" 2>/dev/null; then
-                                downloaded=1; break 2
-                            fi
-                        done
-                    done
-                    if [ "$downloaded" -eq 1 ]; then
-                        CSP_CA_CERT_LOCAL="$INSTALL_DIR/certs/ca.pem"
-                        print_info "CA certificate downloaded to ${CSP_CA_CERT_LOCAL}"
-                    else
-                        print_warn "Could not download ca.pem via SSH. Retrieve manually:"
-                        echo "  scp -i ${ssh_key_path} ubuntu@${VAULT_PUBLIC_IP}:/opt/rune/certs/ca.pem ${INSTALL_DIR}/certs/"
-                    fi
-                fi
-
-                break
-            fi
-            sleep 10
-            elapsed=$((elapsed + 10))
-            printf "."
-        done
-        echo ""
-        if [ $elapsed -ge $timeout ]; then
-            print_error "Vault not reachable within ${timeout}s. Cloud-init may still be running."
-            echo ""
-            echo "  Debug via SSH:"
-            echo "  ssh -i ${ssh_key_path} ubuntu@${VAULT_PUBLIC_IP} 'cloud-init status --wait && docker ps'"
-            echo ""
-            echo "  Terraform directory: ${tf_dir}"
-            echo "  To destroy resources: cd ${tf_dir} && terraform destroy"
-            exit 1
-        fi
-    fi
+# ── Phase 7: Service installation ─────────────────────────────────────────────
+install_service() {
+  if [[ "$SKIP_SERVICE" -eq 1 ]]; then
+    info "Skipping service installation (RUNEVAULT_SKIP_SERVICE=1)."
+    return 0
+  fi
+
+  local config_path="${INSTALL_PREFIX}/configs/runevault.conf"
+
+  if [[ "$OS_SLUG" = linux ]]; then
+    if systemctl is-active --quiet runevault.service 2>/dev/null; then
+      info "Stopping running runevault service..."
+      systemctl stop runevault.service
+      info "Tip: manage the service with: sudo systemctl start|stop|restart runevault"
+    fi
+    info "Installing systemd service..."
+    local unit=/etc/systemd/system/runevault.service
+    printf '%s\n' \
+      "[Unit]" \
+      "Description=Rune-Vault FHE gRPC Server" \
+      "Documentation=https://github.com/${REPO}" \
+      "After=network-online.target" \
+      "Wants=network-online.target" \
+      "" \
+      "[Service]" \
+      "Type=simple" \
+      "User=${SERVICE_USER}" \
+      "Group=${SERVICE_USER}" \
+      "ExecStart=${BINARY_DEST} daemon start --config ${config_path}" \
+      "Restart=on-failure" \
+      "RestartSec=5s" \
+      "TimeoutStopSec=30s" \
+      "StandardOutput=journal" \
+      "StandardError=journal" \
+      "SyslogIdentifier=runevault" \
+      "NoNewPrivileges=true" \
+      "PrivateTmp=true" \
+      "ProtectSystem=strict" \
+      "ProtectHome=true" \
+      "ReadWritePaths=${INSTALL_PREFIX}" \
+      "ProtectKernelTunables=true" \
+      "ProtectKernelModules=true" \
+      "ProtectControlGroups=true" \
+      "RestrictAddressFamilies=AF_INET AF_INET6 AF_UNIX" \
+      "RestrictNamespaces=true" \
+      "LockPersonality=true" \
+      "MemoryDenyWriteExecute=false" \
+      "RestrictRealtime=true" \
+      "RestrictSUIDSGID=true" \
+      "RemoveIPC=true" \
+      "LimitNOFILE=65536" \
+      "" \
+      "[Install]" \
+      "WantedBy=multi-user.target" \
+      > "$unit"
+    chmod 0644 "$unit"
+    systemctl daemon-reload
+    systemctl enable runevault.service
+    systemctl start runevault.service
+    success "systemd service enabled and started."
+
+  else
+    info "Installing launchd service..."
+    local plist=/Library/LaunchDaemons/com.cryptolabinc.runevault.plist
+    printf '%s\n' \
+      '<?xml version="1.0" encoding="UTF-8"?>' \
+      '<!DOCTYPE plist PUBLIC "-//Apple//DTD PLIST 1.0//EN"' \
+      '  "http://www.apple.com/DTDs/PropertyList-1.0.dtd">' \
+      '<plist version="1.0">' \
+      '<dict>' \
+      '  <key>Label</key>' \
+      '  <string>com.cryptolabinc.runevault</string>' \
+      '' \
+      '  <key>ProgramArguments</key>' \
+      '  <array>' \
+      "    <string>${BINARY_DEST}</string>" \
+      '    <string>daemon</string>' \
+      '    <string>start</string>' \
+      '    <string>--config</string>' \
+      "    <string>${config_path}</string>" \
+      '  </array>' \
+      '' \
+      '  <key>UserName</key>' \
+      "  <string>${SERVICE_USER}</string>" \
+      '' \
+      '  <key>RunAtLoad</key>' \
+      '  <true/>' \
+      '' \
+      '  <key>KeepAlive</key>' \
+      '  <true/>' \
+      '' \
+      '  <key>ThrottleInterval</key>' \
+      '  <integer>10</integer>' \
+      '' \
+      '  <key>StandardOutPath</key>' \
+      "  <string>${INSTALL_PREFIX}/logs/runevault.stdout.log</string>" \
+      '' \
+      '  <key>StandardErrorPath</key>' \
+      "  <string>${INSTALL_PREFIX}/logs/runevault.stderr.log</string>" \
+      '' \
+      '  <key>EnvironmentVariables</key>' \
+      '  <dict>' \
+      '    <key>PATH</key>' \
+      '    <string>/usr/local/bin:/usr/bin:/bin:/usr/sbin:/sbin</string>' \
+      '  </dict>' \
+      '' \
+      '  <key>ProcessType</key>' \
+      '  <string>Background</string>' \
+      '</dict>' \
+      '</plist>' \
+      > "$plist"
+    chmod 0644 "$plist"
+    chown root "$plist"
+    launchctl bootout system/com.cryptolabinc.runevault 2>/dev/null || true
+    launchctl bootstrap system "$plist"
+    success "launchd service loaded."
+  fi
 }
 
-# ─── Summary ──────────────────────────────────────────────────────────────────
-
-show_summary() {
-    local endpoint
-    if [ "$DEPLOY_TARGET" = "local" ]; then
-        if [ "$TLS_MODE" = "none" ]; then
-            endpoint="localhost:50051"
-        else
-            endpoint="localhost:50051 (TLS)"
-        fi
-    else
-        local ip="${VAULT_PUBLIC_IP:-<public-ip>}"
-        endpoint="${ip}:50051"
-    fi
-
-    print_header "Deployment Complete"
-    echo "  Vault Endpoint  : ${endpoint}"
-    echo "  Team Secret     : (stored in ${INSTALL_DIR}/.env)"
-    echo "  TLS Mode        : ${TLS_MODE}"
-    if [ "$TLS_MODE" = "self-signed" ] && [ "$DEPLOY_TARGET" = "local" ]; then
-        echo "  CA Certificate  : ${INSTALL_DIR}/certs/ca.pem"
-    fi
-    echo ""
-    echo -e "${BOLD}Share with your team:${NC}"
-    echo ""
-    echo "  Team members will need the following credentials when installing the"
-    echo "  Rune plugin/extension. Share them securely (e.g. encrypted channel):"
-    echo ""
-    if [ -n "${TLS_HOSTNAME:-}" ]; then
-        echo "  Endpoint : ${TLS_HOSTNAME}:50051"
-    elif [ "$DEPLOY_TARGET" != "local" ] && [ -n "${VAULT_PUBLIC_IP:-}" ]; then
-        echo "  Endpoint : ${VAULT_PUBLIC_IP}:50051"
-    else
-        echo "  Endpoint : <public-ip>:50051"
-    fi
-    echo ""
-    echo "  Issue per-user tokens with:"
-    echo "    runevault token issue --user <name> --role member --expires 90d"
-    echo ""
-    if [ "$DEPLOY_TARGET" = "local" ]; then
-        echo "  Reload your shell before using the runevault command:"
-        echo "    exec \$SHELL"
-        echo ""
-    fi
-    echo "  Each team member uses their individual token for authentication."
-    echo "  Team Secret (above) is only needed for DEK derivation — keep it secure."
-    if [ "$TLS_MODE" = "self-signed" ]; then
-        echo ""
-        echo "  Your vault uses a self-signed CA. Team members also need the CA"
-        echo "  certificate file below. Share this file directly — they will be"
-        echo "  prompted to provide its path during plugin/extension setup."
-        echo ""
-        if [ -n "${CSP_CA_CERT_LOCAL}" ]; then
-            echo "  CA Cert  : ${CSP_CA_CERT_LOCAL}"
-        elif [ "$DEPLOY_TARGET" = "local" ]; then
-            echo "  CA Cert  : ${INSTALL_DIR}/certs/ca.pem"
-        else
-            echo "  CA Cert  : /opt/rune/certs/ca.pem (on the remote server)"
-        fi
-    fi
-    if [ "$DEPLOY_TARGET" != "local" ]; then
-        echo ""
-        echo -e "${BOLD}Next steps:${NC}"
-        echo "  1. Point your domain DNS to ${VAULT_PUBLIC_IP:-<public-ip>}"
-        echo "  2. To use custom TLS certificates, replace files in /opt/rune/certs/ on the server"
-        echo "     and restart: ssh -i ${INSTALL_DIR}/ssh_key ubuntu@${VAULT_PUBLIC_IP:-<public-ip>} 'cd /opt/rune && docker compose restart'"
-        echo ""
-        echo "  SSH access: ssh -i ${INSTALL_DIR}/ssh_key ubuntu@${VAULT_PUBLIC_IP:-<public-ip>}"
-    fi
-    echo ""
-    echo "Install directory: ${INSTALL_DIR}"
-    echo ""
+# ── Phase 8: Post-install summary ─────────────────────────────────────────────
+post_install() {
+  if [[ "$SKIP_SERVICE" -eq 0 ]]; then
+    info "Waiting for vault to start..."
+    local i
+    for i in $(seq 1 15); do
+      "$BINARY_DEST" status \
+        --config "${INSTALL_PREFIX}/configs/runevault.conf" \
+        >/dev/null 2>&1 && { success "Vault is up."; break; } || true
+      sleep 1
+    done
+  fi
+
+  local public_ip=""
+  public_ip=$(curl -4 -sf --connect-timeout 5 ifconfig.me 2>/dev/null || true)
+
+  printf '\n'
+  success "Rune-Vault ${VERSION:-local} installed successfully."
+  printf '\n'
+  printf '  Binary:   %s\n' "$BINARY_DEST"
+  printf '  Config:   %s\n' "${INSTALL_PREFIX}/configs/runevault.conf"
+  printf '  CA cert:  %s\n' "${INSTALL_PREFIX}/certs/ca.pem"
+  [[ -n "$public_ip" ]] && printf '  Endpoint: %s:%s\n' "$public_ip" "$GRPC_PORT"
+  printf '\n'
+  printf 'Next steps:\n'
+  printf '  Issue a token:  runevault token issue --user <name> --role member\n'
+  printf '  Check status:   runevault status\n'
+  if [[ "$OS_SLUG" = linux ]]; then
+    printf '  View logs:      journalctl -u runevault -f\n'
+    printf '  Manage daemon:  sudo systemctl start|stop|restart runevault\n'
+  else
+    printf '  View logs:      tail -f %s/logs/runevault.stderr.log\n' "${INSTALL_PREFIX}"
+    printf '  Manage daemon:  sudo launchctl bootout system/com.cryptolabinc.runevault\n'
+    printf '                  sudo launchctl bootstrap system /Library/LaunchDaemons/com.cryptolabinc.runevault.plist\n'
+  fi
+  if [[ -n "${SUDO_USER:-}" ]]; then
+    printf '\n'
+    printf "NOTE: '%s' was added to the '%s' group.\n" "${SUDO_USER}" "${SERVICE_USER}"
+    printf '      Re-login (or run: newgrp %s) to apply group membership.\n' "${SERVICE_USER}"
+  fi
+  printf '\n'
+  warn "BACKUP: Keep these safe — they cannot be recovered if lost:"
+  warn "  Rune-Vault Keys: ${INSTALL_PREFIX}/vault-keys/"
+  warn "  Config:          ${INSTALL_PREFIX}/configs/runevault.conf"
 }
 
-# ─── main() ──────────────────────────────────────────────────────────────────
-
-main() {
-    print_header "Rune-Vault Interactive Setup"
-    echo "One-command deployment for Rune organizational memory vault."
-    echo ""
-
-    resolve_version
-
-    # 1. Deployment target
-    choose_deploy_target
-
-    # 2. Prerequisites
-    if [ "$DEPLOY_TARGET" = "local" ]; then
-        check_prerequisites_local
-    else
-        check_prerequisites_csp "$DEPLOY_TARGET"
-    fi
-
-    # 3. Install directory
-    prompt_install_dir
-
-    # 4. Common settings
-    prompt_tls_mode
-    generate_team_secret
-    prompt_envector_config
-
-    # 5. CSP-specific settings
-    if [ "$DEPLOY_TARGET" != "local" ]; then
-        prompt_csp_config
-    fi
-
-    # 6. Confirm
-    show_confirmation
-
-    # 7. Deploy
-    if [ "$DEPLOY_TARGET" = "local" ]; then
-        deploy_local
-    else
-        deploy_csp
-    fi
-
-    # 8. Summary
-    show_summary
-}
+# ── Main ───────────────────────────────────────────────────────────────────────
+if [[ "$UNINSTALL" -eq 1 ]]; then
+  run_uninstall
+  exit 0
+fi
 
-main "$@"
+preflight
+download_and_verify
+setup_system
+generate_tls_certs
+collect_and_write_config
+install_service
+post_install
diff --git a/scripts/install-dev.sh b/scripts/install-dev.sh
index f5be62e..5dbbcdf 100755
--- a/scripts/install-dev.sh
+++ b/scripts/install-dev.sh
@@ -1,865 +1,49 @@
-#!/bin/bash
-# Rune-Vault Interactive Server Setup — Local Development Version
-# Uses files from the local working tree instead of downloading from GitHub.
-# Usage: sudo bash scripts/install-dev.sh
+#!/usr/bin/env bash
 #
-# Build the Docker image first:
-#   mise run build dev
+# Local testing wrapper for install.sh.
+#
+# Uses the locally built binary instead of downloading from GitHub.
+# Skips cosign verification. Useful for testing the installer flow without
+# a published release.
+#
+# Usage:
+#   mise run go:build                         # build the binary first
+#   sudo bash scripts/install-dev.sh          # full install to /opt/runevault
+#   bash scripts/install-dev.sh --prefix /tmp/vault-test  # rootless local test
 
 set -euo pipefail
 
-# ─── Root privilege check ─────────────────────────────────────────────────────
-
-if [ "$(id -u)" -ne 0 ]; then
-    echo "Error: This script must be run as root. Use: sudo bash scripts/install-dev.sh"
-    exit 1
-fi
-
-# ─── Resolve repo root ──────────────────────────────────────────────────────
-
-SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
-REPO_ROOT="$(cd "$SCRIPT_DIR/.." && pwd)"
-
-if [ ! -f "$REPO_ROOT/install.sh" ]; then
-    echo "Error: Cannot find repo root. Run from the repository directory:"
-    echo "  sudo bash scripts/install-dev.sh"
-    exit 1
-fi
-
-# ─── Resolve Docker tag from git state ───────────────────────────────────────
-
-DOCKER_IMAGE="ghcr.io/cryptolabinc/rune-vault"
-GIT_BRANCH="$(git -C "$REPO_ROOT" rev-parse --abbrev-ref HEAD | sed 's|/|-|g')"
-GIT_COMMIT="$(git -C "$REPO_ROOT" rev-parse --short HEAD)"
-DOCKER_TAG="${GIT_BRANCH}-${GIT_COMMIT}"
-_user_home="${SUDO_USER:+$(eval echo ~"$SUDO_USER")}"
-DEFAULT_INSTALL_DIR="${_user_home:-$HOME}/rune-vault-dev"
-VAULT_PUBLIC_IP=""
-CSP_CA_CERT_LOCAL=""
-
-# ─── Colors & output helpers ─────────────────────────────────────────────────
-
-RED='\033[0;31m'
-GREEN='\033[0;32m'
-YELLOW='\033[1;33m'
-BLUE='\033[0;34m'
-BOLD='\033[1m'
-NC='\033[0m'
-
-print_header() {
-    echo -e "\n${BLUE}================================================${NC}"
-    echo -e "${BLUE}  $1${NC}"
-    echo -e "${BLUE}================================================${NC}\n"
-}
-
-print_info()  { echo -e "${GREEN}✓${NC} $1"; }
-print_warn()  { echo -e "${YELLOW}⚠${NC} $1"; }
-print_error() { echo -e "${RED}✗${NC} $1"; }
-print_step()  { echo -e "\n${BOLD}▸ $1${NC}\n"; }
-
-# ─── Cleanup trap ─────────────────────────────────────────────────────────────
-
-CLEANUP_DIR=""
-cleanup() {
-    printf '\033[?25h' >&2 2>/dev/null || true
-    if [ -n "$CLEANUP_DIR" ] && [ -d "$CLEANUP_DIR" ]; then
-        rm -rf "$CLEANUP_DIR"
-    fi
-}
-trap cleanup EXIT
-
-# ─── Prompt helper ────────────────────────────────────────────────────────────
-
-prompt() {
-    local varname="$1" message="$2" default="${3:-}"
-    if [ -n "$default" ]; then
-        printf "${BOLD}%s${NC} [%s]: " "$message" "$default" >&2
-    else
-        printf "${BOLD}%s${NC}: " "$message" >&2
-    fi
-    local value
-    read -r value
-    value="${value:-$default}"
-    eval "$varname=\"\$value\""
-}
-
-prompt_yn() {
-    local message="$1" default="${2:-y}"
-    local value
-    if [ "$default" = "y" ]; then
-        printf "${BOLD}%s${NC} [Y/n]: " "$message" >&2
-    else
-        printf "${BOLD}%s${NC} [y/N]: " "$message" >&2
-    fi
-    read -r value
-    value="${value:-$default}"
-    case "$value" in
-        [Yy]*) return 0 ;;
-        *) return 1 ;;
-    esac
-}
-
-# ─── Arrow-key menu selector ────────────────────────────────────────────────
-
-select_menu() {
-    local options=("$@")
-    local count=${#options[@]}
-    local _sel=0
-
-    # Fallback: plain number input when terminal is dumb or unset
-    if [ -z "${TERM:-}" ] || [ "$TERM" = "dumb" ]; then
-        local i
-        for i in "${!options[@]}"; do
-            printf "  %d) %s\n" "$((i + 1))" "${options[$i]}" >&2
-        done
-        echo "" >&2
-        local choice
-        printf "${BOLD}Select${NC} [1]: " >&2
-        read -r choice
-        choice="${choice:-1}"
-        if [ "$choice" -ge 1 ] 2>/dev/null && [ "$choice" -le "$count" ] 2>/dev/null; then
-            echo "$((choice - 1))"
-        else
-            print_error "Invalid selection."; exit 1
-        fi
-        return
-    fi
-
-    # ── Draw the menu ──
-    _draw_menu() {
-        local i
-        for i in "${!options[@]}"; do
-            if [ "$i" -eq "$_sel" ]; then
-                printf "  ${GREEN}${BOLD}> %s${NC}\n" "${options[$i]}" >&2
-            else
-                printf "    %s\n" "${options[$i]}" >&2
-            fi
-        done
-    }
-
-    # ── Move cursor up to redraw ──
-    _erase_menu() {
-        local i
-        for (( i = 0; i < count; i++ )); do
-            printf '\033[1A\033[2K' >&2
-        done
-    }
-
-    printf '\033[?25l' >&2          # hide cursor
-    printf "  ${BOLD}↑↓ move  Enter confirm${NC}\n" >&2
-    _draw_menu
-
-    while true; do
-        local key=""
-        IFS= read -rsn1 key
-        if [ "$key" = $'\x1b' ]; then
-            local seq=""
-            IFS= read -rsn2 -t 1 seq || true
-            case "$seq" in
-                '[A') # Up arrow
-                    if [ "$_sel" -gt 0 ]; then
-                        _sel=$((_sel - 1))
-                    else
-                        _sel=$((count - 1))
-                    fi
-                    ;;
-                '[B') # Down arrow
-                    if [ "$_sel" -lt $((count - 1)) ]; then
-                        _sel=$((_sel + 1))
-                    else
-                        _sel=0
-                    fi
-                    ;;
-            esac
-            _erase_menu
-            _draw_menu
-        elif [ "$key" = "" ]; then
-            # Enter key
-            break
-        elif [ "$key" -ge 1 ] 2>/dev/null && [ "$key" -le "$count" ] 2>/dev/null; then
-            # Number key direct jump
-            _sel=$((key - 1))
-            _erase_menu
-            _draw_menu
-        fi
-    done
-
-    printf '\033[?25h' >&2          # show cursor
-
-    echo "$_sel"
-}
-
-# ─── Local file copy helper (replaces download_file) ────────────────────────
-
-copy_local_file() {
-    local src="$1" dest="$2"
-    if [ ! -f "$src" ]; then
-        print_error "Local file not found: $src"
-        exit 1
-    fi
-    cp "$src" "$dest"
-}
-
-# ─── Prerequisite checks ─────────────────────────────────────────────────────
-
-check_command() {
-    local cmd="$1" install_hint="$2"
-    if ! command -v "$cmd" &>/dev/null; then
-        print_error "'$cmd' is not installed."
-        echo "  Install: $install_hint"
-        return 1
-    fi
-    print_info "$cmd found"
-    return 0
-}
-
-check_prerequisites_local() {
-    print_step "Checking prerequisites..."
-    local missing=0
-    check_command mise "https://mise.jdx.dev" || missing=1
-    check_command docker "https://docs.docker.com/get-docker/" || missing=1
-    check_command openssl "apt install openssl / brew install openssl" || missing=1
-
-    # docker compose (v2 plugin)
-    if ! docker compose version &>/dev/null 2>&1; then
-        print_error "'docker compose' (v2 plugin) is not available."
-        echo "  Install: https://docs.docker.com/compose/install/"
-        missing=1
-    else
-        print_info "docker compose found"
-    fi
-
-    if [ "$missing" -eq 1 ]; then
-        echo ""
-        print_error "Please install the missing prerequisites and re-run."
-        exit 1
-    fi
-
-    # Check Docker daemon
-    if ! docker info &>/dev/null 2>&1; then
-        print_error "Cannot connect to Docker daemon. Is Docker running?"
-        echo "  Fix: systemctl start docker"
-        exit 1
-    fi
-
-    (cd "$REPO_ROOT" && mise trust)
-}
-
-check_prerequisites_csp() {
-    local provider="$1"
-    print_step "Checking prerequisites..."
-
-    local missing=0
-    check_command mise "https://mise.jdx.dev" || missing=1
-    check_command terraform "https://developer.hashicorp.com/terraform/install" || missing=1
-    check_command openssl "apt install openssl / brew install openssl" || missing=1
-    check_command gh "https://cli.github.com/" || missing=1
-    check_command docker "https://docs.docker.com/get-docker/" || missing=1
-
-    case "$provider" in
-        aws) check_command aws "https://aws.amazon.com/cli/" || missing=1 ;;
-        gcp) check_command gcloud "https://cloud.google.com/sdk/docs/install" || missing=1 ;;
-        oci) check_command oci "https://docs.oracle.com/en-us/iaas/Content/API/SDKDocs/cliinstall.htm" || missing=1 ;;
-    esac
-
-    if [ "$missing" -eq 1 ]; then
-        echo ""
-        print_error "Please install the missing prerequisites and re-run."
-        exit 1
-    fi
-
-    (cd "$REPO_ROOT" && mise trust)
-}
-
-# ─── Interactive prompts ─────────────────────────────────────────────────────
-
-choose_deploy_target() {
-    print_step "Select deployment target"
-    local options=("Local (This machine)" "AWS (requires GHCR access)" "GCP (requires GHCR access)" "OCI (requires GHCR access)")
-    local targets=("local" "aws" "gcp" "oci")
-    local selected
-    selected=$(select_menu "${options[@]}")
-    DEPLOY_TARGET="${targets[$selected]}"
-    print_info "Deployment target: ${DEPLOY_TARGET}"
-}
-
-prompt_install_dir() {
-    print_step "Installation directory"
-    local default_dir="$DEFAULT_INSTALL_DIR"
-    if [ "$DEPLOY_TARGET" != "local" ]; then
-        default_dir="$HOME/rune-vault-${DEPLOY_TARGET}"
-        echo "  Terraform files, state, and SSH keys are stored here."
-        echo "  Keep this directory to manage (update/destroy) your deployment."
-        echo ""
-    fi
-    prompt INSTALL_DIR "Directory" "$default_dir"
-}
-
-prompt_tls_mode() {
-    print_step "TLS configuration"
-    local options=("Generate self-signed certificate" "No TLS (not recommended)")
-    local modes=("self-signed" "none")
-    local selected
-    selected=$(select_menu "${options[@]}")
-    TLS_MODE="${modes[$selected]}"
-
-    if [ "$TLS_MODE" = "self-signed" ]; then
-        echo ""
-        prompt TLS_HOSTNAME "Domain name for the certificate (leave empty if none)" ""
-    fi
-
-    if [ "$TLS_MODE" = "none" ]; then
-        print_warn "Running without TLS. gRPC traffic will be unencrypted."
-        print_warn "This is NOT recommended for production."
-    fi
-
-    print_info "TLS mode: ${TLS_MODE}"
-}
-
-prompt_envector_config() {
-    print_step "enVector Cloud configuration"
-    echo "  Create your enVector cluster at https://envector.io before proceeding."
-    echo "  You will need the endpoint URL and API key from the dashboard."
-    echo "  Index name is used to store and retrieve your team's organizational memory."
-    echo ""
-    prompt ENVECTOR_ENDPOINT "enVector endpoint (e.g. cluster-id.clusters.envector.io)"
-    prompt ENVECTOR_API_KEY "enVector API key (e.g. aBcDE_12345_xxxxx)"
-    prompt VAULT_INDEX_NAME "Index name" "runecontext"
-
-    if [ -z "$ENVECTOR_ENDPOINT" ] || [ -z "$ENVECTOR_API_KEY" ]; then
-        print_error "enVector endpoint and API key are required."
-        exit 1
-    fi
-    if [ -z "$VAULT_INDEX_NAME" ]; then
-        print_error "Index name is required."
-        exit 1
-    fi
-    print_info "enVector endpoint: ${ENVECTOR_ENDPOINT}"
-}
-
-prompt_csp_config() {
-    prompt TEAM_NAME "Team name (used for resource naming)" "default"
-
-    case "$DEPLOY_TARGET" in
-        aws)
-            prompt CSP_REGION "AWS region" "us-east-1"
-            ;;
-        gcp)
-            prompt CSP_REGION "GCP region" "us-central1"
-            prompt GCP_PROJECT_ID "GCP project ID"
-            if [ -z "$GCP_PROJECT_ID" ]; then
-                print_error "GCP project ID is required."; exit 1
-            fi
-            ;;
-        oci)
-            prompt CSP_REGION "OCI region" "us-ashburn-1"
-            prompt OCI_COMPARTMENT_ID "OCI compartment OCID"
-            if [ -z "$OCI_COMPARTMENT_ID" ]; then
-                print_error "OCI compartment OCID is required."; exit 1
-            fi
-            ;;
-    esac
-}
-
-generate_team_secret() {
-    VAULT_TEAM_SECRET_VALUE="evt_$(openssl rand -hex 32)"
-    print_info "Team secret generated."
-}
-
-generate_config_files() {
-    local dir="$1"
-
-    cat > "$dir/vault-roles.yml" <<'ROLESEOF'
-roles:
-  admin:
-    scope: [get_public_key, decrypt_scores, decrypt_metadata, manage_tokens]
-    top_k: 50
-    rate_limit: 150/60s
-  member:
-    scope: [get_public_key, decrypt_scores, decrypt_metadata]
-    top_k: 10
-    rate_limit: 30/60s
-ROLESEOF
-
-    cat > "$dir/vault-tokens.yml" <<'TOKENSEOF'
-tokens: []
-TOKENSEOF
-
-    chmod 600 "$dir/vault-roles.yml" "$dir/vault-tokens.yml"
-    print_info "Token/role config files created."
-}
-
-setup_runevault_alias() {
-    if [ -z "${SUDO_USER:-}" ]; then
-        return
-    fi
-
-    # Add user to docker group
-    if command -v usermod >/dev/null 2>&1; then
-        usermod -aG docker "$SUDO_USER" 2>/dev/null || true
-    fi
-
-    # Detect shell config
-    local user_home
-    user_home="$(eval echo ~"$SUDO_USER")"
-    local shell_rc=""
-    if [ -f "$user_home/.zshrc" ]; then
-        shell_rc="$user_home/.zshrc"
-    elif [ -f "$user_home/.bashrc" ]; then
-        shell_rc="$user_home/.bashrc"
-    fi
-
-    if [ -n "$shell_rc" ]; then
-        if ! grep -q 'alias runevault=' "$shell_rc" 2>/dev/null; then
-            echo '' >> "$shell_rc"
-            echo '# Rune-Vault admin CLI' >> "$shell_rc"
-            echo 'alias runevault="docker exec -it rune-vault python3 /app/vault_admin_cli.py"' >> "$shell_rc"
-            print_info "runevault alias added to ${shell_rc}"
-            print_warn "Run 'exec \$SHELL' to reload your shell and enable the runevault command."
-        fi
-    fi
-}
-
-# ─── Confirmation summary ────────────────────────────────────────────────────
-
-show_confirmation() {
-    print_header "Configuration Summary (DEV — local build)"
-    echo "  Deployment target : ${DEPLOY_TARGET}"
-    echo "  Install directory : ${INSTALL_DIR}"
-    echo "  Docker image      : ${DOCKER_IMAGE}:${DOCKER_TAG} (local)"
-    echo "  Repo root         : ${REPO_ROOT}"
-    echo "  TLS mode          : ${TLS_MODE}"
-    [ -n "${TLS_HOSTNAME:-}" ] && echo "  TLS domain        : ${TLS_HOSTNAME}"
-    echo "  Team secret       : (auto-generated in .env)"
-    echo "  enVector endpoint : ${ENVECTOR_ENDPOINT}"
-    echo "  Index name        : ${VAULT_INDEX_NAME}"
-    if [ "$DEPLOY_TARGET" != "local" ]; then
-        echo "  Team name         : ${TEAM_NAME}"
-        echo "  Region            : ${CSP_REGION}"
-        [ "${DEPLOY_TARGET}" = "gcp" ] && echo "  GCP project       : ${GCP_PROJECT_ID}"
-        [ "${DEPLOY_TARGET}" = "oci" ] && echo "  OCI compartment   : ${OCI_COMPARTMENT_ID}"
-    fi
-    echo ""
-
-    if ! prompt_yn "Proceed with deployment?"; then
-        print_warn "Aborted."
-        exit 0
-    fi
-}
-
-# ─── TLS handling ─────────────────────────────────────────────────────────────
-
-setup_tls() {
-    local certs_dir="$INSTALL_DIR/certs"
-    mkdir -p "$certs_dir"
-
-    case "$TLS_MODE" in
-        self-signed)
-            print_step "Generating self-signed certificates..."
-            copy_local_file "$REPO_ROOT/scripts/generate-certs.sh" "$certs_dir/generate-certs.sh"
-            chmod +x "$certs_dir/generate-certs.sh"
-            (cd "$certs_dir" && bash generate-certs.sh . "${TLS_HOSTNAME:-localhost}")
-            TLS_CERT_PATH="$certs_dir/server.pem"
-            TLS_KEY_PATH="$certs_dir/server.key"
-            TLS_CA_PATH="$certs_dir/ca.pem"
-            print_info "Self-signed certificates generated in ${certs_dir}/"
-            ;;
-        none)
-            print_warn "Skipping TLS setup."
-            TLS_CERT_PATH=""
-            TLS_KEY_PATH=""
-            TLS_CA_PATH=""
-            ;;
-    esac
-}
-
-# ─── Generate .env file ──────────────────────────────────────────────────────
-
-generate_env_file() {
-    local env_file="$INSTALL_DIR/.env"
-
-    cat > "$env_file" <<ENVEOF
-# Rune-Vault configuration — generated by install-dev.sh
-VAULT_TEAM_SECRET=${VAULT_TEAM_SECRET_VALUE}
-VAULT_INDEX_NAME=${VAULT_INDEX_NAME}
-ENVECTOR_ENDPOINT=${ENVECTOR_ENDPOINT}
-ENVECTOR_API_KEY=${ENVECTOR_API_KEY}
-EMBEDDING_DIM=768
-RUNE_VAULT_TAG=${DOCKER_TAG}
-ENVEOF
-
-    if [ "$TLS_MODE" = "none" ]; then
-        echo "VAULT_TLS_DISABLE=true" >> "$env_file"
-    else
-        cat >> "$env_file" <<TLSEOF
-VAULT_TLS_CERT=/app/certs/server.pem
-VAULT_TLS_KEY=/app/certs/server.key
-TLSEOF
-    fi
-
-    chmod 600 "$env_file"
-    print_info ".env file created (mode 600)."
-}
-
-# ─── Local deployment ─────────────────────────────────────────────────────────
-
-deploy_local() {
-    print_header "Deploying Rune-Vault (Local — DEV)"
-
-    # Clean up existing installation
-    if [ -d "$INSTALL_DIR" ]; then
-        print_warn "Existing installation found at ${INSTALL_DIR}"
-        if prompt_yn "Remove existing installation and reinstall?" "n"; then
-            print_step "Removing existing installation..."
-            (cd "$INSTALL_DIR" && docker compose down -v 2>/dev/null) || true
-            rm -rf "$INSTALL_DIR"
-            print_info "Previous installation removed."
-        else
-            print_warn "Aborted."
-            exit 0
-        fi
-    fi
-    # Clean up orphaned container/network/volume
-    local project
-    project="$(basename "$INSTALL_DIR")"
-    if docker container inspect rune-vault &>/dev/null; then
-        print_step "Removing existing rune-vault container..."
-        docker rm -f rune-vault >/dev/null 2>&1 || true
-        print_info "Container removed."
-    fi
-    docker network rm "${project}_vault-net" >/dev/null 2>&1 || true
-    docker volume rm "${project}_vault-keys" >/dev/null 2>&1 || true
-
-    # Create directory structure
-    mkdir -p "$INSTALL_DIR"/{certs,backups,logs}
-    print_info "Directory structure created: ${INSTALL_DIR}/"
-
-    # Copy docker-compose.yml from local repo
-    print_step "Copying docker-compose.yml from local repo..."
-    copy_local_file "$REPO_ROOT/vault/docker-compose.yml" "$INSTALL_DIR/docker-compose.yml"
-    # Pin image to the local build tag
-    sed -i.bak "s|image:.*rune-vault:.*|image: ${DOCKER_IMAGE}:${DOCKER_TAG}|" "$INSTALL_DIR/docker-compose.yml"
-    rm -f "$INSTALL_DIR/docker-compose.yml.bak"
-    print_info "docker-compose.yml copied."
-
-    # TLS
-    setup_tls
+REPO_ROOT=$(cd "$(dirname "$0")/.." && pwd)
+LOCAL_BINARY="${REPO_ROOT}/vault/bin/runevault"
 
-    # Generate .env and config files
-    generate_env_file
-    generate_config_files "$INSTALL_DIR"
-
-    # Restore ownership to the invoking user (files were created as root via sudo)
-    if [ -n "${SUDO_USER:-}" ]; then
-        chown -R "$SUDO_USER" "$INSTALL_DIR"
-    fi
-
-    # Build Docker image from local source
-    print_step "Building Docker image (tag: ${DOCKER_TAG})..."
-    (cd "$REPO_ROOT" && mise run build "${DOCKER_TAG}")
-    print_info "Image built: ${DOCKER_IMAGE}:${DOCKER_TAG}"
-
-    # Start container
-    print_step "Starting Rune-Vault..."
-    (cd "$INSTALL_DIR" && docker compose up -d)
-    print_info "Container started."
-
-    # Health check
-    print_step "Waiting for Vault to become healthy..."
-    local elapsed=0
-    local timeout=60
-    while [ $elapsed -lt $timeout ]; do
-        if docker exec rune-vault curl -sf http://localhost:8081/health 2>/dev/null; then
-            print_info "Vault is healthy!"
-
-            # Set up runevault alias for admin CLI
-            setup_runevault_alias
-            return 0
-        fi
-        sleep 2
-        elapsed=$((elapsed + 2))
-        printf "."
-    done
-
-    echo ""
-    print_error "Vault did not become healthy within ${timeout}s."
-    print_warn "Container logs:"
-    docker logs rune-vault 2>&1 | tail -30
-    exit 1
+[[ -x "$LOCAL_BINARY" ]] || {
+  printf 'ERROR: Binary not found at %s\n' "$LOCAL_BINARY" >&2
+  printf '  Run: mise run go:build\n' >&2
+  exit 1
 }
 
-# ─── CSP deployment ───────────────────────────────────────────────────────────
-
-deploy_csp() {
-    local provider="$DEPLOY_TARGET"
-    print_header "Deploying Rune-Vault (${provider} — DEV)"
-
-    local tf_dir="$INSTALL_DIR/deployment"
-    mkdir -p "$tf_dir"
-    # Ensure the original user owns the deployment directory for terraform
-    if [ -n "${SUDO_USER:-}" ]; then
-        chown -R "$SUDO_USER" "$INSTALL_DIR"
-    fi
-
-    # Build and push Docker image to GHCR (remote servers pull from registry)
-    # Requires GHCR push access to the CryptoLabInc organization.
-    print_step "Building and pushing Docker image to GHCR..."
-    echo "  CSP deployments pull the image from GHCR, so a push is required."
-    echo "  This requires GHCR push access to the CryptoLabInc organization."
-    echo ""
-    if ! gh auth status &>/dev/null; then
-        print_error "GitHub CLI not authenticated. Run: gh auth login"
-        exit 1
-    fi
-    (cd "$REPO_ROOT" && mise run push "${DOCKER_TAG}")
-    print_info "Image pushed: ${DOCKER_IMAGE}:${DOCKER_TAG}"
-
-    # Copy Terraform files from local repo
-    print_step "Copying Terraform configuration from local repo..."
-    copy_local_file "$REPO_ROOT/deployment/${provider}/main.tf" "$tf_dir/main.tf"
-    if [ "$provider" = "aws" ]; then
-        copy_local_file "$REPO_ROOT/deployment/${provider}/cloud-init.yaml" "$tf_dir/cloud-init.yaml"
-        sed -i.bak "s|image:.*rune-vault:.*|image: ${DOCKER_IMAGE}:${DOCKER_TAG}|" "$tf_dir/cloud-init.yaml"
-        rm -f "$tf_dir/cloud-init.yaml.bak"
-    else
-        copy_local_file "$REPO_ROOT/deployment/${provider}/startup-script.sh" "$tf_dir/startup-script.sh"
-        sed -i.bak "s|image:.*rune-vault:.*|image: ${DOCKER_IMAGE}:${DOCKER_TAG}|" "$tf_dir/startup-script.sh"
-        rm -f "$tf_dir/startup-script.sh.bak"
-    fi
-    print_info "Terraform files copied."
-
-    # Generate SSH key pair for EC2 access
-    local ssh_key_path="$INSTALL_DIR/ssh_key"
-    if [ ! -f "$ssh_key_path" ]; then
-        print_step "Generating SSH key pair..."
-        ssh-keygen -t ed25519 -f "$ssh_key_path" -N "" -q
-        chmod 600 "$ssh_key_path"
-        chmod 644 "${ssh_key_path}.pub"
-        print_info "SSH key generated: ${ssh_key_path}"
-    fi
-    local public_key
-    public_key=$(cat "${ssh_key_path}.pub")
-
-    # Generate terraform.tfvars (use printf to avoid heredoc escaping issues)
-    print_step "Generating terraform.tfvars..."
-    escape_tf() { printf '%s' "$1" | sed 's/\\/\\\\/g; s/"/\\"/g'; }
-    {
-        printf 'team_secret        = "%s"\n' "$(escape_tf "$VAULT_TEAM_SECRET_VALUE")"
-        printf 'team_name          = "%s"\n' "$(escape_tf "$TEAM_NAME")"
-        printf 'region             = "%s"\n' "$(escape_tf "$CSP_REGION")"
-        printf 'tls_mode           = "%s"\n' "$(escape_tf "$TLS_MODE")"
-        printf 'tls_hostname       = "%s"\n' "$(escape_tf "${TLS_HOSTNAME:-}")"
-        printf 'envector_endpoint  = "%s"\n' "$(escape_tf "$ENVECTOR_ENDPOINT")"
-        printf 'envector_api_key   = "%s"\n' "$(escape_tf "$ENVECTOR_API_KEY")"
-        printf 'vault_index_name   = "%s"\n' "$(escape_tf "$VAULT_INDEX_NAME")"
-        printf 'public_key         = "%s"\n' "$(escape_tf "$public_key")"
-        case "$provider" in
-            gcp) printf 'project_id         = "%s"\n' "$(escape_tf "$GCP_PROJECT_ID")" ;;
-            oci) printf 'compartment_id     = "%s"\n' "$(escape_tf "$OCI_COMPARTMENT_ID")" ;;
-        esac
-    } > "$tf_dir/terraform.tfvars"
-
-    chmod 600 "$tf_dir/terraform.tfvars"
-    if [ -n "${SUDO_USER:-}" ]; then
-        chown -R "$SUDO_USER" "$INSTALL_DIR"
-    fi
-    print_info "terraform.tfvars created."
-
-    # Terraform init & apply (run as the original user to preserve CLI auth)
-    print_step "Running Terraform..."
-    local tf_run="terraform"
-    if [ -n "${SUDO_USER:-}" ]; then
-        tf_run="sudo -u $SUDO_USER terraform"
-    fi
-    (cd "$tf_dir" && $tf_run init)
-    (cd "$tf_dir" && $tf_run apply -auto-approve)
-
-    # Capture outputs
-    VAULT_PUBLIC_IP=$(cd "$tf_dir" && $tf_run output -raw vault_public_ip 2>/dev/null) || true
-    local vault_url
-    vault_url=$(cd "$tf_dir" && $tf_run output -raw vault_url 2>/dev/null) || true
-
-    print_info "Infrastructure provisioned."
-
-    # Health polling — wait for cloud-init to finish and Vault to start
-    if [ -n "$VAULT_PUBLIC_IP" ]; then
-        print_step "Waiting for Vault to become reachable (up to 10 min)..."
-        local elapsed=0
-        local timeout=600
-        while [ $elapsed -lt $timeout ]; do
-            if bash -c "echo >/dev/tcp/${VAULT_PUBLIC_IP}/50051" 2>/dev/null; then
-                print_info "Vault is reachable at ${VAULT_PUBLIC_IP}:50051!"
+# Parse --prefix for rootless local testing; pass all other args to install.sh
+PREFIX=""
+PASSTHROUGH_ARGS=()
+while [[ $# -gt 0 ]]; do
+  case $1 in
+    --prefix) PREFIX="$2"; shift 2 ;;
+    *)        PASSTHROUGH_ARGS+=("$1"); shift ;;
+  esac
+done
 
-                # Download ca.pem from remote server
-                if [ "$TLS_MODE" = "self-signed" ]; then
-                    mkdir -p "$INSTALL_DIR/certs"
-                    if [ -n "${SUDO_USER:-}" ]; then
-                        chown -R "$SUDO_USER" "$INSTALL_DIR/certs"
-                    fi
-                    local scp_opts="-i $ssh_key_path -o StrictHostKeyChecking=no -o ConnectTimeout=15 -o BatchMode=yes"
-                    local scp_prefix=""
-                    if [ -n "${SUDO_USER:-}" ]; then
-                        scp_prefix="sudo -u $SUDO_USER"
-                    fi
-                    # Retry SCP (SSH may not be ready immediately)
-                    local downloaded=0
-                    for attempt in 1 2 3; do
-                        sleep 10
-                        for ssh_user in ubuntu opc; do
-                            if $scp_prefix scp $scp_opts \
-                                "${ssh_user}@${VAULT_PUBLIC_IP}:/opt/rune/certs/ca.pem" \
-                                "$INSTALL_DIR/certs/ca.pem" 2>/dev/null; then
-                                downloaded=1; break 2
-                            fi
-                        done
-                    done
-                    if [ "$downloaded" -eq 1 ]; then
-                        CSP_CA_CERT_LOCAL="$INSTALL_DIR/certs/ca.pem"
-                        print_info "CA certificate downloaded to ${CSP_CA_CERT_LOCAL}"
-                    else
-                        print_warn "Could not download ca.pem via SSH. Retrieve manually:"
-                        echo "  scp -i ${ssh_key_path} ubuntu@${VAULT_PUBLIC_IP}:/opt/rune/certs/ca.pem ${INSTALL_DIR}/certs/"
-                    fi
-                fi
+export RUNEVAULT_LOCAL_BINARY="$LOCAL_BINARY"
+export RUNEVAULT_SKIP_VERIFY=1
 
-                break
-            fi
-            sleep 10
-            elapsed=$((elapsed + 10))
-            printf "."
-        done
-        echo ""
-        if [ $elapsed -ge $timeout ]; then
-            print_error "Vault not reachable within ${timeout}s. Cloud-init may still be running."
-            echo ""
-            echo "  Debug via SSH:"
-            echo "  ssh -i ${ssh_key_path} ubuntu@${VAULT_PUBLIC_IP} 'cloud-init status --wait && docker ps'"
-            echo ""
-            echo "  Terraform directory: ${tf_dir}"
-            echo "  To destroy resources: cd ${tf_dir} && terraform destroy"
-            exit 1
-        fi
-    fi
-}
-
-# ─── Summary ──────────────────────────────────────────────────────────────────
-
-show_summary() {
-    local endpoint
-    if [ "$DEPLOY_TARGET" = "local" ]; then
-        if [ "$TLS_MODE" = "none" ]; then
-            endpoint="localhost:50051"
-        else
-            endpoint="localhost:50051 (TLS)"
-        fi
-    else
-        local ip="${VAULT_PUBLIC_IP:-<public-ip>}"
-        endpoint="${ip}:50051"
-    fi
-
-    print_header "Deployment Complete (DEV)"
-    echo "  Vault Endpoint  : ${endpoint}"
-    echo "  Docker Image    : ${DOCKER_IMAGE}:${DOCKER_TAG} (local build)"
-    echo "  Team Secret     : (stored in ${INSTALL_DIR}/.env)"
-    echo "  TLS Mode        : ${TLS_MODE}"
-    if [ "$TLS_MODE" = "self-signed" ] && [ "$DEPLOY_TARGET" = "local" ]; then
-        echo "  CA Certificate  : ${INSTALL_DIR}/certs/ca.pem"
-    fi
-    echo ""
-    echo -e "${BOLD}Share with your team:${NC}"
-    echo ""
-    echo "  Team members will need the following credentials when installing the"
-    echo "  Rune plugin/extension. Share them securely (e.g. encrypted channel):"
-    echo ""
-    if [ -n "${TLS_HOSTNAME:-}" ]; then
-        echo "  Endpoint : ${TLS_HOSTNAME}:50051"
-    elif [ "$DEPLOY_TARGET" != "local" ] && [ -n "${VAULT_PUBLIC_IP:-}" ]; then
-        echo "  Endpoint : ${VAULT_PUBLIC_IP}:50051"
-    else
-        echo "  Endpoint : <public-ip>:50051"
-    fi
-    echo ""
-    echo "  Issue per-user tokens with:"
-    echo "    runevault token issue --user <name> --role member --expires 90d"
-    echo ""
-    if [ "$DEPLOY_TARGET" = "local" ]; then
-        echo "  Reload your shell before using the runevault command:"
-        echo "    exec \$SHELL"
-        echo ""
-    fi
-    echo "  Each team member uses their individual token for authentication."
-    echo "  Team Secret (above) is only needed for DEK derivation — keep it secure."
-    if [ "$TLS_MODE" = "self-signed" ]; then
-        echo ""
-        echo "  Your vault uses a self-signed CA. Team members also need the CA"
-        echo "  certificate file below. Share this file directly — they will be"
-        echo "  prompted to provide its path during plugin/extension setup."
-        echo ""
-        if [ -n "${CSP_CA_CERT_LOCAL}" ]; then
-            echo "  CA Cert  : ${CSP_CA_CERT_LOCAL}"
-        elif [ "$DEPLOY_TARGET" = "local" ]; then
-            echo "  CA Cert  : ${INSTALL_DIR}/certs/ca.pem"
-        else
-            echo "  CA Cert  : /opt/rune/certs/ca.pem (on the remote server)"
-        fi
-    fi
-    if [ "$DEPLOY_TARGET" != "local" ]; then
-        echo ""
-        echo -e "${BOLD}Next steps:${NC}"
-        echo "  1. Point your domain DNS to ${VAULT_PUBLIC_IP:-<public-ip>}"
-        echo "  2. To use custom TLS certificates, replace files in /opt/rune/certs/ on the server"
-        echo "     and restart: ssh -i ${INSTALL_DIR}/ssh_key ubuntu@${VAULT_PUBLIC_IP:-<public-ip>} 'cd /opt/rune && docker compose restart'"
-        echo ""
-        echo "  SSH access: ssh -i ${INSTALL_DIR}/ssh_key ubuntu@${VAULT_PUBLIC_IP:-<public-ip>}"
-    fi
-    echo ""
-    echo "Install directory: ${INSTALL_DIR}"
-    echo ""
-}
-
-# ─── main() ──────────────────────────────────────────────────────────────────
-
-main() {
-    print_header "Rune-Vault Interactive Setup (DEV)"
-    echo "Local development installer — uses files from the working tree."
-    echo "Repo: ${REPO_ROOT}"
-    echo ""
-
-    # 1. Deployment target
-    choose_deploy_target
-
-    # 2. Prerequisites
-    if [ "$DEPLOY_TARGET" = "local" ]; then
-        check_prerequisites_local
-    else
-        check_prerequisites_csp "$DEPLOY_TARGET"
-    fi
-
-    # 3. Install directory
-    prompt_install_dir
-
-    # 4. Common settings
-    prompt_tls_mode
-    generate_team_secret
-    prompt_envector_config
-
-    # 5. CSP-specific settings
-    if [ "$DEPLOY_TARGET" != "local" ]; then
-        prompt_csp_config
-    fi
-
-    # 6. Confirm
-    show_confirmation
-
-    # 7. Deploy
-    if [ "$DEPLOY_TARGET" = "local" ]; then
-        deploy_local
-    else
-        deploy_csp
-    fi
+if [[ -n "$PREFIX" ]]; then
+  export RUNEVAULT_INSTALL_PREFIX="$PREFIX"
+  export RUNEVAULT_BINARY_PATH="${PREFIX}/runevault"
+  export RUNEVAULT_SKIP_SERVICE=1
+fi
 
-    # 8. Summary
-    show_summary
-}
+# Dev defaults for non-interactive installs
+export RUNEVAULT_TEAM_NAME="${RUNEVAULT_TEAM_NAME:-dev-team}"
+export RUNEVAULT_ENVECTOR_ENDPOINT="${RUNEVAULT_ENVECTOR_ENDPOINT:-https://envector.example.com}"
+export RUNEVAULT_ENVECTOR_API_KEY="${RUNEVAULT_ENVECTOR_API_KEY:-dev-api-key-placeholder}"
 
-main "$@"
+exec bash "${REPO_ROOT}/install.sh" "${PASSTHROUGH_ARGS[@]+"${PASSTHROUGH_ARGS[@]}"}"

From 0b20122c5304b9e4b2050cfcd40d277478f0ec6d Mon Sep 17 00:00:00 2001
From: Jeonghwan Lee <jhlee@cryptolab.co.kr>
Date: Mon, 27 Apr 2026 12:02:21 +0900
Subject: [PATCH 06/27] feat: allow runevault group members to use CLI without
 sudo

---
 vault/internal/server/admin.go      | 328 ++++++++++++++++++++++++++++
 vault/internal/server/admin_test.go | 295 +++++++++++++++++++++++++
 2 files changed, 623 insertions(+)
 create mode 100644 vault/internal/server/admin.go
 create mode 100644 vault/internal/server/admin_test.go

diff --git a/vault/internal/server/admin.go b/vault/internal/server/admin.go
new file mode 100644
index 0000000..a04ea15
--- /dev/null
+++ b/vault/internal/server/admin.go
@@ -0,0 +1,328 @@
+package server
+
+import (
+	"context"
+	"encoding/json"
+	"errors"
+	"fmt"
+	"log/slog"
+	"net"
+	"net/http"
+	"os"
+	"path/filepath"
+	"strings"
+	"syscall"
+	"time"
+
+	"github.com/CryptoLabInc/rune-admin/vault/internal/tokens"
+)
+
+// adminSocketMode is 0660: owner (runevault) + group (runevault) can connect;
+// other users cannot. Installers add trusted operators to the runevault group.
+const adminSocketMode = 0o660
+
+// AdminFromConfig is an AdminFactory suitable for production: it binds the
+// UDS at v.cfg.Server.Admin.Socket with mode 0660 (umask + chmod
+// belt+suspenders), serves the route table, and returns a closer that
+// gracefully stops the http.Server and unlinks the socket.
+func AdminFromConfig(ctx context.Context, v *Vault) (func(context.Context) error, error) {
+	cfg := v.Config()
+	socket := cfg.Server.Admin.Socket
+	if socket == "" {
+		return nil, errors.New("server.admin.socket is empty")
+	}
+	if err := os.MkdirAll(filepath.Dir(socket), 0o750); err != nil {
+		return nil, fmt.Errorf("admin: mkdir socket dir: %w", err)
+	}
+	// Stale socket recovery: remove leftover paths before Listen. Ignore
+	// missing-file errors; surface anything else (eg. wrong type).
+	if err := os.Remove(socket); err != nil && !os.IsNotExist(err) {
+		return nil, fmt.Errorf("admin: remove stale socket: %w", err)
+	}
+
+	// Umask 0o007 lets the socket inherit group rw while blocking others.
+	prevMask := syscall.Umask(0o007)
+	lis, err := net.Listen("unix", socket)
+	syscall.Umask(prevMask)
+	if err != nil {
+		return nil, fmt.Errorf("admin: listen unix %s: %w", socket, err)
+	}
+	// Belt + suspenders: even if umask leaked, force 0660.
+	if err := os.Chmod(socket, adminSocketMode); err != nil {
+		_ = lis.Close()
+		return nil, fmt.Errorf("admin: chmod socket: %w", err)
+	}
+
+	onShutdown := func() {
+		go func() {
+			time.Sleep(100 * time.Millisecond) // let response flush
+			_ = syscall.Kill(os.Getpid(), syscall.SIGTERM)
+		}()
+	}
+	mux := buildAdminMux(v, onShutdown)
+	srv := &http.Server{
+		Handler:           mux,
+		ReadHeaderTimeout: 5 * time.Second,
+		ReadTimeout:       30 * time.Second,
+		WriteTimeout:      30 * time.Second,
+	}
+	go func() {
+		if err := srv.Serve(lis); err != nil && !errors.Is(err, http.ErrServerClosed) {
+			slog.Error("admin: server error", "err", err)
+		}
+	}()
+	slog.Info("vault: admin UDS listening", "socket", socket, "mode", "0660")
+
+	shutdown := func(ctx context.Context) error {
+		err := srv.Shutdown(ctx)
+		// Always best-effort unlink; the socket is gone if Shutdown succeeded.
+		_ = os.Remove(socket)
+		return err
+	}
+	return shutdown, nil
+}
+
+// buildAdminMux wires the admin route table. Exposed for tests.
+// onShutdown is called (in a goroutine, after response) when POST /shutdown is
+// received; pass nil to disable the endpoint (tests).
+func buildAdminMux(v *Vault, onShutdown func()) http.Handler {
+	mux := http.NewServeMux()
+
+	mux.HandleFunc("GET /health", func(w http.ResponseWriter, r *http.Request) {
+		writeJSON(w, http.StatusOK, map[string]string{"status": "ok"})
+	})
+
+	mux.HandleFunc("POST /shutdown", func(w http.ResponseWriter, r *http.Request) {
+		if onShutdown == nil {
+			writeError(w, http.StatusNotImplemented, "shutdown not enabled")
+			return
+		}
+		writeJSON(w, http.StatusOK, map[string]string{"message": "shutdown initiated"})
+		onShutdown()
+	})
+
+	mux.HandleFunc("POST /restart", func(w http.ResponseWriter, r *http.Request) {
+		if onShutdown == nil {
+			writeError(w, http.StatusNotImplemented, "restart not enabled")
+			return
+		}
+		writeJSON(w, http.StatusOK, map[string]string{"message": "restart initiated"})
+		v.RequestRestart()
+		onShutdown()
+	})
+	mux.HandleFunc("GET /tokens", func(w http.ResponseWriter, r *http.Request) {
+		writeJSON(w, http.StatusOK, map[string]any{"tokens": v.Tokens().ListTokens()})
+	})
+	mux.HandleFunc("GET /roles", func(w http.ResponseWriter, r *http.Request) {
+		writeJSON(w, http.StatusOK, map[string]any{"roles": v.Tokens().ListRoles()})
+	})
+
+	mux.HandleFunc("POST /tokens", func(w http.ResponseWriter, r *http.Request) {
+		var body struct {
+			User        string `json:"user"`
+			Role        string `json:"role"`
+			ExpiresDays *int   `json:"expires_days"`
+		}
+		if err := readJSON(r, &body); err != nil {
+			writeError(w, http.StatusBadRequest, err.Error())
+			return
+		}
+		if body.User == "" || body.Role == "" {
+			writeError(w, http.StatusBadRequest, "Missing required fields: user, role")
+			return
+		}
+		tok, err := v.Tokens().AddToken(body.User, body.Role, body.ExpiresDays)
+		if err != nil {
+			writeError(w, http.StatusBadRequest, err.Error())
+			return
+		}
+		writeJSON(w, http.StatusCreated, tokenJSON(tok))
+	})
+
+	mux.HandleFunc("POST /tokens/{user}/rotate", func(w http.ResponseWriter, r *http.Request) {
+		user := r.PathValue("user")
+		tok, err := v.Tokens().RotateToken(user)
+		if err != nil {
+			writeError(w, http.StatusBadRequest, err.Error())
+			return
+		}
+		writeJSON(w, http.StatusOK, tokenJSON(tok))
+	})
+
+	mux.HandleFunc("POST /tokens/_rotate_all", func(w http.ResponseWriter, r *http.Request) {
+		toks, err := v.Tokens().RotateAllTokens()
+		if err != nil {
+			writeError(w, http.StatusInternalServerError, err.Error())
+			return
+		}
+		entries := make([]map[string]string, 0, len(toks))
+		for _, t := range toks {
+			entries = append(entries, map[string]string{
+				"user": t.User, "token": t.Token, "role": t.Role,
+			})
+		}
+		writeJSON(w, http.StatusOK, map[string]any{
+			"rotated": len(toks),
+			"tokens":  entries,
+		})
+	})
+
+	mux.HandleFunc("DELETE /tokens/{user}", func(w http.ResponseWriter, r *http.Request) {
+		user := r.PathValue("user")
+		if v.Tokens().RevokeToken(user) {
+			writeJSON(w, http.StatusOK, map[string]string{
+				"message": fmt.Sprintf("Revoked token for '%s'", user),
+			})
+			return
+		}
+		writeError(w, http.StatusNotFound, fmt.Sprintf("No token found for user '%s'", user))
+	})
+
+	mux.HandleFunc("POST /roles", func(w http.ResponseWriter, r *http.Request) {
+		var body struct {
+			Name      string   `json:"name"`
+			Scope     []string `json:"scope"`
+			TopK      *int     `json:"top_k"`
+			RateLimit string   `json:"rate_limit"`
+		}
+		if err := readJSON(r, &body); err != nil {
+			writeError(w, http.StatusBadRequest, err.Error())
+			return
+		}
+		if body.Name == "" || len(body.Scope) == 0 || body.TopK == nil || body.RateLimit == "" {
+			writeError(w, http.StatusBadRequest, "Missing required fields: name, scope, top_k, rate_limit")
+			return
+		}
+		role, err := v.Tokens().AddRole(body.Name, body.Scope, *body.TopK, body.RateLimit)
+		if err != nil {
+			writeError(w, http.StatusBadRequest, err.Error())
+			return
+		}
+		writeJSON(w, http.StatusCreated, roleJSON(role))
+	})
+
+	mux.HandleFunc("PUT /roles/{name}", func(w http.ResponseWriter, r *http.Request) {
+		name := r.PathValue("name")
+		var raw map[string]json.RawMessage
+		if err := readJSON(r, &raw); err != nil {
+			writeError(w, http.StatusBadRequest, err.Error())
+			return
+		}
+		opts := tokens.UpdateRoleOpts{}
+		if v, ok := raw["scope"]; ok {
+			var s []string
+			if err := json.Unmarshal(v, &s); err != nil {
+				writeError(w, http.StatusBadRequest, "scope must be a string array")
+				return
+			}
+			opts.Scope = &s
+		}
+		if v, ok := raw["top_k"]; ok {
+			var n int
+			if err := json.Unmarshal(v, &n); err != nil {
+				writeError(w, http.StatusBadRequest, "top_k must be an integer")
+				return
+			}
+			opts.TopK = &n
+		}
+		if v, ok := raw["rate_limit"]; ok {
+			var s string
+			if err := json.Unmarshal(v, &s); err != nil {
+				writeError(w, http.StatusBadRequest, "rate_limit must be a string")
+				return
+			}
+			opts.RateLimit = &s
+		}
+		if opts.Scope == nil && opts.TopK == nil && opts.RateLimit == nil {
+			writeError(w, http.StatusBadRequest, "No fields to update")
+			return
+		}
+		role, err := v.Tokens().UpdateRole(name, opts)
+		if err != nil {
+			writeError(w, http.StatusBadRequest, err.Error())
+			return
+		}
+		writeJSON(w, http.StatusOK, roleJSON(role))
+	})
+
+	mux.HandleFunc("DELETE /roles/{name}", func(w http.ResponseWriter, r *http.Request) {
+		name := r.PathValue("name")
+		if err := v.Tokens().DeleteRole(name); err != nil {
+			writeError(w, http.StatusBadRequest, err.Error())
+			return
+		}
+		writeJSON(w, http.StatusOK, map[string]string{
+			"message": fmt.Sprintf("Deleted role '%s'", name),
+		})
+	})
+
+	// 404 fallback for routes that didn't match.
+	mux.HandleFunc("/", func(w http.ResponseWriter, r *http.Request) {
+		writeError(w, http.StatusNotFound, fmt.Sprintf("No route for %s %s", r.Method, r.URL.Path))
+	})
+
+	return mux
+}
+
+func tokenJSON(t *tokens.Token) map[string]any {
+	exp := t.Expires
+	if exp == "" {
+		exp = "never"
+	}
+	return map[string]any{
+		"user":      t.User,
+		"token":     t.Token,
+		"role":      t.Role,
+		"issued_at": t.IssuedAt,
+		"expires":   exp,
+	}
+}
+
+func roleJSON(r *tokens.Role) map[string]any {
+	return map[string]any{
+		"name":       r.Name,
+		"scope":      r.Scope,
+		"top_k":      r.TopK,
+		"rate_limit": r.RateLimit,
+	}
+}
+
+func writeJSON(w http.ResponseWriter, status int, body any) {
+	buf, err := json.Marshal(body)
+	if err != nil {
+		http.Error(w, err.Error(), http.StatusInternalServerError)
+		return
+	}
+	w.Header().Set("Content-Type", "application/json")
+	w.WriteHeader(status)
+	_, _ = w.Write(buf)
+}
+
+func writeError(w http.ResponseWriter, status int, msg string) {
+	writeJSON(w, status, map[string]string{"error": msg})
+}
+
+func readJSON(r *http.Request, dst any) error {
+	if r.ContentLength == 0 {
+		return nil
+	}
+	dec := json.NewDecoder(r.Body)
+	dec.DisallowUnknownFields()
+	if err := dec.Decode(dst); err != nil {
+		return err
+	}
+	return nil
+}
+
+// SocketURL is a stable host used in the URL for UDS HTTP. Clients
+// substitute the actual socket file via http.Transport.DialContext.
+const SocketURL = "http://admin"
+
+// SanitizePathForLog hides socket directories that contain user names or
+// secret prefixes. Used by status reporting.
+func SanitizePathForLog(p string) string {
+	if p == "" {
+		return ""
+	}
+	return strings.TrimSuffix(p, "/")
+}
diff --git a/vault/internal/server/admin_test.go b/vault/internal/server/admin_test.go
new file mode 100644
index 0000000..e84d55b
--- /dev/null
+++ b/vault/internal/server/admin_test.go
@@ -0,0 +1,295 @@
+package server
+
+import (
+	"bytes"
+	"context"
+	"encoding/json"
+	"net"
+	"net/http"
+	"net/http/httptest"
+	"os"
+	"path/filepath"
+	"runtime"
+	"strings"
+	"testing"
+	"time"
+
+	"github.com/CryptoLabInc/rune-admin/vault/internal/tokens"
+)
+
+func newAdminTestVault(t *testing.T) *Vault {
+	t.Helper()
+	cfg := &Config{
+		Tokens: TokensConfig{TeamSecret: "test-secret"},
+		Keys:   KeysConfig{Path: t.TempDir(), EmbeddingDim: 1024},
+	}
+	store := tokens.NewStore()
+	store.LoadDefaultsWithDemoToken()
+	audit, _ := NewAuditLogger(AuditConfig{Mode: ""})
+	return NewVault(cfg, store, nil, audit)
+}
+
+func adminTestServer(t *testing.T) (*httptest.Server, *Vault) {
+	t.Helper()
+	v := newAdminTestVault(t)
+	ts := httptest.NewServer(buildAdminMux(v, nil))
+	t.Cleanup(ts.Close)
+	return ts, v
+}
+
+func TestAdminGetHealth(t *testing.T) {
+	ts, _ := adminTestServer(t)
+	resp, err := http.Get(ts.URL + "/health")
+	if err != nil {
+		t.Fatal(err)
+	}
+	defer resp.Body.Close()
+	if resp.StatusCode != http.StatusOK {
+		t.Errorf("status = %d", resp.StatusCode)
+	}
+}
+
+func TestAdminListRolesIncludesDefaults(t *testing.T) {
+	ts, _ := adminTestServer(t)
+	resp, err := http.Get(ts.URL + "/roles")
+	if err != nil {
+		t.Fatal(err)
+	}
+	defer resp.Body.Close()
+	var body struct {
+		Roles []map[string]any `json:"roles"`
+	}
+	if err := json.NewDecoder(resp.Body).Decode(&body); err != nil {
+		t.Fatal(err)
+	}
+	names := map[string]bool{}
+	for _, r := range body.Roles {
+		names[r["name"].(string)] = true
+	}
+	if !names["admin"] || !names["member"] {
+		t.Errorf("default roles missing: %v", names)
+	}
+}
+
+func TestAdminIssueListRevoke(t *testing.T) {
+	ts, _ := adminTestServer(t)
+
+	// Issue
+	body := bytes.NewReader([]byte(`{"user":"alice","role":"member"}`))
+	resp, err := http.Post(ts.URL+"/tokens", "application/json", body)
+	if err != nil {
+		t.Fatal(err)
+	}
+	defer resp.Body.Close()
+	if resp.StatusCode != http.StatusCreated {
+		t.Fatalf("issue status = %d", resp.StatusCode)
+	}
+	var issued map[string]any
+	if err := json.NewDecoder(resp.Body).Decode(&issued); err != nil {
+		t.Fatal(err)
+	}
+	if !strings.HasPrefix(issued["token"].(string), "evt_") {
+		t.Errorf("token = %v", issued["token"])
+	}
+
+	// List
+	resp, _ = http.Get(ts.URL + "/tokens")
+	var listResp struct {
+		Tokens []map[string]any `json:"tokens"`
+	}
+	json.NewDecoder(resp.Body).Decode(&listResp)
+	resp.Body.Close()
+	found := false
+	for _, t := range listResp.Tokens {
+		if t["user"] == "alice" {
+			found = true
+		}
+	}
+	if !found {
+		t.Error("alice not in list response")
+	}
+
+	// Revoke
+	req, _ := http.NewRequest("DELETE", ts.URL+"/tokens/alice", nil)
+	resp, err = http.DefaultClient.Do(req)
+	if err != nil {
+		t.Fatal(err)
+	}
+	resp.Body.Close()
+	if resp.StatusCode != http.StatusOK {
+		t.Errorf("revoke status = %d", resp.StatusCode)
+	}
+}
+
+func TestAdminIssueMissingFields(t *testing.T) {
+	ts, _ := adminTestServer(t)
+	resp, err := http.Post(ts.URL+"/tokens", "application/json", bytes.NewReader([]byte(`{}`)))
+	if err != nil {
+		t.Fatal(err)
+	}
+	defer resp.Body.Close()
+	if resp.StatusCode != http.StatusBadRequest {
+		t.Errorf("status = %d", resp.StatusCode)
+	}
+}
+
+func TestAdminRevokeNotFound(t *testing.T) {
+	ts, _ := adminTestServer(t)
+	req, _ := http.NewRequest("DELETE", ts.URL+"/tokens/nobody", nil)
+	resp, err := http.DefaultClient.Do(req)
+	if err != nil {
+		t.Fatal(err)
+	}
+	defer resp.Body.Close()
+	if resp.StatusCode != http.StatusNotFound {
+		t.Errorf("status = %d", resp.StatusCode)
+	}
+}
+
+func TestAdminCreateRoleAndDelete(t *testing.T) {
+	ts, _ := adminTestServer(t)
+	body := bytes.NewReader([]byte(`{"name":"researcher","scope":["get_public_key"],"top_k":3,"rate_limit":"10/60s"}`))
+	resp, err := http.Post(ts.URL+"/roles", "application/json", body)
+	if err != nil {
+		t.Fatal(err)
+	}
+	defer resp.Body.Close()
+	if resp.StatusCode != http.StatusCreated {
+		t.Fatalf("create status = %d", resp.StatusCode)
+	}
+	// Delete
+	req, _ := http.NewRequest("DELETE", ts.URL+"/roles/researcher", nil)
+	resp2, err := http.DefaultClient.Do(req)
+	if err != nil {
+		t.Fatal(err)
+	}
+	defer resp2.Body.Close()
+	if resp2.StatusCode != http.StatusOK {
+		t.Errorf("delete status = %d", resp2.StatusCode)
+	}
+}
+
+func TestAdminUpdateRoleNoFieldsRejected(t *testing.T) {
+	ts, _ := adminTestServer(t)
+	req, _ := http.NewRequest("PUT", ts.URL+"/roles/member", bytes.NewReader([]byte(`{}`)))
+	req.Header.Set("Content-Type", "application/json")
+	resp, err := http.DefaultClient.Do(req)
+	if err != nil {
+		t.Fatal(err)
+	}
+	defer resp.Body.Close()
+	if resp.StatusCode != http.StatusBadRequest {
+		t.Errorf("status = %d", resp.StatusCode)
+	}
+}
+
+func TestAdminUnknownRoute(t *testing.T) {
+	ts, _ := adminTestServer(t)
+	resp, err := http.Get(ts.URL + "/nope")
+	if err != nil {
+		t.Fatal(err)
+	}
+	defer resp.Body.Close()
+	if resp.StatusCode != http.StatusNotFound {
+		t.Errorf("status = %d", resp.StatusCode)
+	}
+}
+
+// ── UDS bind + permissions (Unix only) ───────────────────────────
+
+func TestAdminUDSBindMode0660(t *testing.T) {
+	if runtime.GOOS == "windows" {
+		t.Skip("UDS not supported on Windows")
+	}
+	v := newAdminTestVault(t)
+	// Darwin's sockaddr_un caps sun_path at ~104 bytes; t.TempDir() with a
+	// long test name plus the framework-injected sequence dir overruns. Use
+	// a shorter MkdirTemp at /tmp to stay safely under the limit.
+	dir, err := os.MkdirTemp("", "vt-")
+	if err != nil {
+		t.Fatal(err)
+	}
+	t.Cleanup(func() { os.RemoveAll(dir) })
+	v.cfg.Server.Admin.Socket = filepath.Join(dir, "x.sock")
+
+	shutdown, err := AdminFromConfig(context.Background(), v)
+	if err != nil {
+		t.Fatal(err)
+	}
+	defer shutdown(context.Background())
+
+	info, err := os.Stat(v.cfg.Server.Admin.Socket)
+	if err != nil {
+		t.Fatal(err)
+	}
+	if mode := info.Mode().Perm(); mode != 0o660 {
+		t.Errorf("socket mode = %04o, want 0660", mode)
+	}
+
+	// Smoke test: dial + GET /health.
+	conn, err := net.Dial("unix", v.cfg.Server.Admin.Socket)
+	if err != nil {
+		t.Fatal(err)
+	}
+	conn.Close()
+}
+
+func TestAdminUDSStaleSocketRecovered(t *testing.T) {
+	if runtime.GOOS == "windows" {
+		t.Skip("UDS not supported on Windows")
+	}
+	v := newAdminTestVault(t)
+	// Darwin's sockaddr_un caps sun_path at ~104 bytes; t.TempDir() with a
+	// long test name plus the framework-injected sequence dir overruns. Use
+	// a shorter MkdirTemp at /tmp to stay safely under the limit.
+	dir, err := os.MkdirTemp("", "vt-")
+	if err != nil {
+		t.Fatal(err)
+	}
+	t.Cleanup(func() { os.RemoveAll(dir) })
+	v.cfg.Server.Admin.Socket = filepath.Join(dir, "x.sock")
+	// Plant a stale file at the socket path.
+	if err := os.WriteFile(v.cfg.Server.Admin.Socket, []byte("stale"), 0o600); err != nil {
+		t.Fatal(err)
+	}
+	shutdown, err := AdminFromConfig(context.Background(), v)
+	if err != nil {
+		t.Fatalf("recovery failed: %v", err)
+	}
+	defer shutdown(context.Background())
+	info, err := os.Stat(v.cfg.Server.Admin.Socket)
+	if err != nil {
+		t.Fatal(err)
+	}
+	if info.Mode()&os.ModeSocket == 0 {
+		t.Errorf("socket file is not a socket after recovery")
+	}
+}
+
+func TestAdminUDSShutdownUnlinks(t *testing.T) {
+	if runtime.GOOS == "windows" {
+		t.Skip("UDS not supported on Windows")
+	}
+	v := newAdminTestVault(t)
+	// Darwin's sockaddr_un caps sun_path at ~104 bytes; t.TempDir() with a
+	// long test name plus the framework-injected sequence dir overruns. Use
+	// a shorter MkdirTemp at /tmp to stay safely under the limit.
+	dir, err := os.MkdirTemp("", "vt-")
+	if err != nil {
+		t.Fatal(err)
+	}
+	t.Cleanup(func() { os.RemoveAll(dir) })
+	v.cfg.Server.Admin.Socket = filepath.Join(dir, "x.sock")
+	shutdown, err := AdminFromConfig(context.Background(), v)
+	if err != nil {
+		t.Fatal(err)
+	}
+	ctx, cancel := context.WithTimeout(context.Background(), 2*time.Second)
+	defer cancel()
+	if err := shutdown(ctx); err != nil {
+		t.Errorf("shutdown: %v", err)
+	}
+	if _, err := os.Stat(v.cfg.Server.Admin.Socket); !os.IsNotExist(err) {
+		t.Errorf("socket should be removed after shutdown, stat err = %v", err)
+	}
+}

From 72d6aac41c5555bf49c9d6be92f558639eff3c34 Mon Sep 17 00:00:00 2001
From: Jeonghwan Lee <jhlee@cryptolab.co.kr>
Date: Mon, 27 Apr 2026 12:02:21 +0900
Subject: [PATCH 07/27] fix: route daemon stop/restart through admin socket

---
 vault/cmd/main.go              |  22 ++
 vault/internal/server/grpc.go  | 394 +++++++++++++++++++++++++++++++++
 vault/internal/server/serve.go | 172 ++++++++++++++
 3 files changed, 588 insertions(+)
 create mode 100644 vault/cmd/main.go
 create mode 100644 vault/internal/server/grpc.go
 create mode 100644 vault/internal/server/serve.go

diff --git a/vault/cmd/main.go b/vault/cmd/main.go
new file mode 100644
index 0000000..bd1b0be
--- /dev/null
+++ b/vault/cmd/main.go
@@ -0,0 +1,22 @@
+package main
+
+import (
+	"errors"
+	"fmt"
+	"os"
+
+	"github.com/CryptoLabInc/rune-admin/vault/internal/commands"
+	"github.com/CryptoLabInc/rune-admin/vault/internal/server"
+)
+
+func main() {
+	if err := commands.Execute(); err != nil {
+		// ErrRestartRequested is intentional: exit 1 silently so the service
+		// manager (systemd Restart=on-failure / launchd KeepAlive) restarts
+		// the process without noisy stderr output.
+		if !errors.Is(err, server.ErrRestartRequested) {
+			fmt.Fprintln(os.Stderr, err)
+		}
+		os.Exit(1)
+	}
+}
diff --git a/vault/internal/server/grpc.go b/vault/internal/server/grpc.go
new file mode 100644
index 0000000..8625f69
--- /dev/null
+++ b/vault/internal/server/grpc.go
@@ -0,0 +1,394 @@
+package server
+
+import (
+	"context"
+	"encoding/base64"
+	"encoding/json"
+	"errors"
+	"fmt"
+	"sort"
+	"sync/atomic"
+	"time"
+
+	"google.golang.org/grpc/codes"
+	"google.golang.org/grpc/peer"
+	"google.golang.org/grpc/status"
+
+	"github.com/CryptoLabInc/rune-admin/vault/internal/crypto"
+	"github.com/CryptoLabInc/rune-admin/vault/internal/tokens"
+	pb "github.com/CryptoLabInc/rune-admin/vault/pkg/vaultpb"
+)
+
+// MaxMessageSize bounds gRPC frames. EvalKey alone can be tens of MB.
+const MaxMessageSize = 256 * 1024 * 1024
+
+// Vault is the runtime container shared by all RPC handlers and the
+// admin UDS server. It owns the long-lived token store, FHE key handle,
+// and audit logger. Construct via NewVault, tear down via Close.
+type Vault struct {
+	cfg    *Config
+	tokens *tokens.Store
+	keys   *crypto.EnvectorKeys
+	audit  *AuditLogger
+
+	// Cached bundle pieces from disk. Re-read on demand to pick up
+	// rotated keys without restarting; kept here for zero-copy reuse.
+	bundleParams crypto.KeysParams
+
+	// restartRequested is set by the admin /restart endpoint so that
+	// Serve can return ErrRestartRequested and the process exits with
+	// code 1, triggering service-manager (systemd/launchd) restart.
+	restartRequested atomic.Bool
+}
+
+// NewVault wires all subsystems together. Caller is responsible for Close.
+func NewVault(cfg *Config, tokenStore *tokens.Store, keys *crypto.EnvectorKeys, audit *AuditLogger) *Vault {
+	return &Vault{
+		cfg:    cfg,
+		tokens: tokenStore,
+		keys:   keys,
+		audit:  audit,
+		bundleParams: crypto.KeysParams{
+			Root:  cfg.Keys.Path,
+			KeyID: defaultKeyID(cfg),
+			Dim:   cfg.Keys.EmbeddingDim,
+		},
+	}
+}
+
+func defaultKeyID(_ *Config) string {
+	// Fixed for Phase 1 — Python pins KEY_ID="vault-key" in vault_core.py:30.
+	// Surfaced as a helper so a future config field can override.
+	return "vault-key"
+}
+
+// Tokens exposes the token store for the admin UDS server.
+func (v *Vault) Tokens() *tokens.Store { return v.tokens }
+
+// RequestRestart marks the vault for restart. Serve returns ErrRestartRequested
+// after the current shutdown sequence completes.
+func (v *Vault) RequestRestart() { v.restartRequested.Store(true) }
+
+// RestartRequested reports whether RequestRestart was called.
+func (v *Vault) RestartRequested() bool { return v.restartRequested.Load() }
+
+// Config exposes the resolved config (e.g., for status reporting).
+func (v *Vault) Config() *Config { return v.cfg }
+
+// Close releases the FHE key handle. The audit logger and token store
+// are owned by the caller (typically the daemon main).
+func (v *Vault) Close() error {
+	if v.keys != nil {
+		_ = v.keys.Close()
+	}
+	return nil
+}
+
+// VaultGRPC is the gRPC service wrapper. Exposed for grpc.RegisterService.
+type VaultGRPC struct {
+	pb.UnimplementedVaultServiceServer
+	v *Vault
+}
+
+func NewVaultGRPC(v *Vault) *VaultGRPC { return &VaultGRPC{v: v} }
+
+// ── GetPublicKey ──────────────────────────────────────────────────
+
+func (s *VaultGRPC) GetPublicKey(ctx context.Context, req *pb.GetPublicKeyRequest) (*pb.GetPublicKeyResponse, error) {
+	start := time.Now()
+	user := s.v.tokens.GetUsername(req.GetToken())
+	if user == "" {
+		user = "unknown"
+	}
+	resultCount := 0
+	statusStr := "success"
+	var errDetail *string
+	defer func() {
+		s.emit(ctx, "get_public_key", user, nil, resultCount, statusStr, errDetail, time.Since(start))
+	}()
+
+	username, role, err := s.v.tokens.Validate(req.GetToken())
+	if err != nil {
+		st, msg := mapTokenError(err)
+		statusStr, errDetail = errStatus(err)
+		return &pb.GetPublicKeyResponse{Error: msg}, status.Error(st, msg)
+	}
+	user = username
+	if err := role.CheckScope("get_public_key"); err != nil {
+		statusStr = "denied"
+		ed := err.Error()
+		errDetail = &ed
+		return &pb.GetPublicKeyResponse{Error: err.Error()}, status.Error(codes.PermissionDenied, err.Error())
+	}
+
+	bundle, err := s.v.buildBundle(req.GetToken())
+	if err != nil {
+		statusStr = "error"
+		ed := err.Error()
+		errDetail = &ed
+		return &pb.GetPublicKeyResponse{Error: err.Error()}, status.Error(codes.Internal, err.Error())
+	}
+	js, err := json.Marshal(bundle)
+	if err != nil {
+		statusStr = "error"
+		ed := err.Error()
+		errDetail = &ed
+		return &pb.GetPublicKeyResponse{Error: err.Error()}, status.Error(codes.Internal, err.Error())
+	}
+	resultCount = 1
+	return &pb.GetPublicKeyResponse{KeyBundleJson: string(js)}, nil
+}
+
+// buildBundle assembles the per-token JSON bundle returned by GetPublicKey.
+// Order of keys is irrelevant — clients parse by name.
+func (s *Vault) buildBundle(token string) (map[string]any, error) {
+	pub, err := crypto.ReadPublicKeyBundle(s.bundleParams)
+	if err != nil {
+		return nil, err
+	}
+	bundle := map[string]any{
+		"EncKey.json":  pub.EncKey,
+		"EvalKey.json": pub.EvalKey,
+		"key_id":       s.bundleParams.KeyID,
+	}
+	if s.cfg.Keys.IndexName != "" {
+		bundle["index_name"] = s.cfg.Keys.IndexName
+	}
+	agentID := crypto.AgentIDFromToken(token)
+	dek, err := crypto.DeriveAgentKey(s.cfg.Tokens.TeamSecret, agentID)
+	if err != nil {
+		return nil, err
+	}
+	bundle["agent_id"] = agentID
+	bundle["agent_dek"] = base64.StdEncoding.EncodeToString(dek)
+	bundle["envector_endpoint"] = s.cfg.Envector.Endpoint
+	bundle["envector_api_key"] = s.cfg.Envector.APIKey
+	return bundle, nil
+}
+
+// ── DecryptScores ─────────────────────────────────────────────────
+
+func (s *VaultGRPC) DecryptScores(ctx context.Context, req *pb.DecryptScoresRequest) (*pb.DecryptScoresResponse, error) {
+	start := time.Now()
+	topK := req.GetTopK()
+	user := s.v.tokens.GetUsername(req.GetToken())
+	if user == "" {
+		user = "unknown"
+	}
+	resultCount := 0
+	statusStr := "success"
+	var errDetail *string
+	defer func() {
+		s.emit(ctx, "decrypt_scores", user, &topK, resultCount, statusStr, errDetail, time.Since(start))
+	}()
+
+	username, role, err := s.v.tokens.Validate(req.GetToken())
+	if err != nil {
+		st, msg := mapTokenError(err)
+		statusStr, errDetail = errStatus(err)
+		return &pb.DecryptScoresResponse{Error: msg}, status.Error(st, msg)
+	}
+	user = username
+	if err := role.CheckScope("decrypt_scores"); err != nil {
+		statusStr = "denied"
+		ed := err.Error()
+		errDetail = &ed
+		return &pb.DecryptScoresResponse{Error: err.Error()}, status.Error(codes.PermissionDenied, err.Error())
+	}
+	if int(topK) > role.TopK {
+		te := tokens.ErrTopKExceeded{Requested: int(topK), MaxTopK: role.TopK, RoleName: role.Name}
+		statusStr = "denied"
+		msg := te.Error()
+		errDetail = &msg
+		return &pb.DecryptScoresResponse{Error: msg}, status.Error(codes.InvalidArgument, msg)
+	}
+
+	blob, err := base64.StdEncoding.DecodeString(req.GetEncryptedBlobB64())
+	if err != nil {
+		statusStr = "error"
+		msg := fmt.Sprintf("Deserialization failed: %s", err.Error())
+		errDetail = &msg
+		return &pb.DecryptScoresResponse{Error: msg}, nil
+	}
+	if s.v.keys == nil {
+		statusStr = "error"
+		msg := "FHE key not loaded"
+		errDetail = &msg
+		return &pb.DecryptScoresResponse{Error: msg}, status.Error(codes.Internal, msg)
+	}
+	scores2D, shardIdx, err := s.v.keys.Decrypt(blob)
+	if err != nil {
+		statusStr = "error"
+		msg := err.Error()
+		errDetail = &msg
+		return &pb.DecryptScoresResponse{Error: msg}, nil
+	}
+	entries := topK_FromShards(scores2D, shardIdx, int(topK))
+	resultCount = len(entries)
+	return &pb.DecryptScoresResponse{Results: entries}, nil
+}
+
+// topK_FromShards mirrors vault_core._decrypt_scores_impl L276-285:
+// flatten 2D scores into (shard_idx, row_idx, score), sort desc by score,
+// take top k. Output order matches Python's heapq.nlargest.
+func topK_FromShards(scores2D [][]float64, shardIdx []int32, k int) []*pb.ScoreEntry {
+	type item struct {
+		shard, row int32
+		score      float64
+	}
+	all := make([]item, 0)
+	for i, row := range scores2D {
+		shard := int32(i)
+		if i < len(shardIdx) {
+			shard = shardIdx[i]
+		}
+		for j, v := range row {
+			all = append(all, item{shard: shard, row: int32(j), score: v})
+		}
+	}
+	sort.SliceStable(all, func(i, j int) bool { return all[i].score > all[j].score })
+	if k > len(all) {
+		k = len(all)
+	}
+	out := make([]*pb.ScoreEntry, k)
+	for i := 0; i < k; i++ {
+		out[i] = &pb.ScoreEntry{
+			ShardIdx: all[i].shard,
+			RowIdx:   all[i].row,
+			Score:    all[i].score,
+		}
+	}
+	return out
+}
+
+// ── DecryptMetadata ───────────────────────────────────────────────
+
+// envelope is the JSON shape of each encrypted_metadata_list element:
+// {"a": "<agent_id>", "c": "<base64_ciphertext>"}.
+type envelope struct {
+	AgentID string `json:"a"`
+	Cipher  string `json:"c"`
+}
+
+func (s *VaultGRPC) DecryptMetadata(ctx context.Context, req *pb.DecryptMetadataRequest) (*pb.DecryptMetadataResponse, error) {
+	start := time.Now()
+	user := s.v.tokens.GetUsername(req.GetToken())
+	if user == "" {
+		user = "unknown"
+	}
+	resultCount := 0
+	statusStr := "success"
+	var errDetail *string
+	defer func() {
+		s.emit(ctx, "decrypt_metadata", user, nil, resultCount, statusStr, errDetail, time.Since(start))
+	}()
+
+	username, role, err := s.v.tokens.Validate(req.GetToken())
+	if err != nil {
+		st, msg := mapTokenError(err)
+		statusStr, errDetail = errStatus(err)
+		return &pb.DecryptMetadataResponse{Error: msg}, status.Error(st, msg)
+	}
+	user = username
+	if err := role.CheckScope("decrypt_metadata"); err != nil {
+		statusStr = "denied"
+		ed := err.Error()
+		errDetail = &ed
+		return &pb.DecryptMetadataResponse{Error: err.Error()}, status.Error(codes.PermissionDenied, err.Error())
+	}
+	if s.v.cfg.Tokens.TeamSecret == "" {
+		statusStr = "error"
+		msg := "VAULT_TEAM_SECRET not configured"
+		errDetail = &msg
+		return &pb.DecryptMetadataResponse{Error: msg}, nil
+	}
+
+	out := make([]string, 0, len(req.GetEncryptedMetadataList()))
+	for _, blobStr := range req.GetEncryptedMetadataList() {
+		var env envelope
+		if err := json.Unmarshal([]byte(blobStr), &env); err != nil {
+			statusStr = "error"
+			msg := fmt.Sprintf("Metadata decryption failed: %s", err.Error())
+			errDetail = &msg
+			return &pb.DecryptMetadataResponse{Error: msg}, nil
+		}
+		dek, err := crypto.DeriveAgentKey(s.v.cfg.Tokens.TeamSecret, env.AgentID)
+		if err != nil {
+			statusStr = "error"
+			msg := fmt.Sprintf("Metadata decryption failed: %s", err.Error())
+			errDetail = &msg
+			return &pb.DecryptMetadataResponse{Error: msg}, nil
+		}
+		pt, err := crypto.DecryptMetadata(env.Cipher, dek)
+		if err != nil {
+			statusStr = "error"
+			msg := fmt.Sprintf("Metadata decryption failed: %s", err.Error())
+			errDetail = &msg
+			return &pb.DecryptMetadataResponse{Error: msg}, nil
+		}
+		out = append(out, string(pt))
+	}
+	resultCount = len(out)
+	return &pb.DecryptMetadataResponse{DecryptedMetadata: out}, nil
+}
+
+// ── error mapping & audit helpers ────────────────────────────────
+
+// mapTokenError maps tokens.ErrXxx → (gRPC code, user-facing message).
+// Mirrors vault_grpc_server.py error branches.
+func mapTokenError(err error) (codes.Code, string) {
+	var nf tokens.ErrTokenNotFound
+	if errors.As(err, &nf) {
+		return codes.Unauthenticated, err.Error()
+	}
+	var exp tokens.ErrTokenExpired
+	if errors.As(err, &exp) {
+		return codes.Unauthenticated, err.Error()
+	}
+	var rl tokens.ErrRateLimit
+	if errors.As(err, &rl) {
+		return codes.ResourceExhausted, err.Error()
+	}
+	var sc tokens.ErrScope
+	if errors.As(err, &sc) {
+		return codes.PermissionDenied, err.Error()
+	}
+	var tk tokens.ErrTopKExceeded
+	if errors.As(err, &tk) {
+		return codes.InvalidArgument, err.Error()
+	}
+	return codes.Unauthenticated, err.Error()
+}
+
+// errStatus tags an error for the audit log: token/scope errors are
+// "denied", everything else is "error".
+func errStatus(err error) (string, *string) {
+	msg := err.Error()
+	switch {
+	case errors.As(err, new(tokens.ErrTokenNotFound)),
+		errors.As(err, new(tokens.ErrTokenExpired)),
+		errors.As(err, new(tokens.ErrRateLimit)),
+		errors.As(err, new(tokens.ErrScope)),
+		errors.As(err, new(tokens.ErrTopKExceeded)):
+		return "denied", &msg
+	}
+	return "error", &msg
+}
+
+func (s *VaultGRPC) emit(ctx context.Context, method, user string, topK *int32, resultCount int, statusStr string, errDetail *string, duration time.Duration) {
+	if s.v.audit == nil || !s.v.audit.Enabled() {
+		return
+	}
+	p, _ := peer.FromContext(ctx)
+	s.v.audit.Log(AuditEntry{
+		Timestamp:   nowUTCISO(),
+		UserID:      user,
+		Method:      method,
+		TopK:        topK,
+		ResultCount: resultCount,
+		Status:      statusStr,
+		SourceIP:    ExtractSourceIP(p),
+		LatencyMs:   float64(duration.Microseconds()) / 1000.0,
+		Error:       errDetail,
+	})
+}
diff --git a/vault/internal/server/serve.go b/vault/internal/server/serve.go
new file mode 100644
index 0000000..7e02e94
--- /dev/null
+++ b/vault/internal/server/serve.go
@@ -0,0 +1,172 @@
+package server
+
+import (
+	"context"
+	"crypto/tls"
+	"errors"
+	"fmt"
+	"log/slog"
+	"net"
+	"os"
+	"os/signal"
+	"syscall"
+	"time"
+
+	"google.golang.org/grpc"
+	"google.golang.org/grpc/credentials"
+	"google.golang.org/grpc/health"
+	healthpb "google.golang.org/grpc/health/grpc_health_v1"
+	"google.golang.org/grpc/reflection"
+
+	pb "github.com/CryptoLabInc/rune-admin/vault/pkg/vaultpb"
+)
+
+// ErrRestartRequested is returned by Serve when the admin POST /restart
+// endpoint was called. The caller (daemon start) should propagate this as a
+// non-zero exit so the service manager (systemd Restart=on-failure / launchd
+// KeepAlive) restarts the process.
+var ErrRestartRequested = errors.New("restart requested by admin socket")
+
+// Serve starts the gRPC + admin UDS listeners with the given Vault and
+// blocks until ctx is cancelled or a SIGTERM/SIGINT is received. The
+// admin listener is constructed by AdminFactory; passing nil disables the
+// admin UDS surface (useful for unit tests that exercise gRPC alone).
+//
+// Returns nil on graceful shutdown. Listener bind errors and server runtime
+// errors are returned eagerly.
+func Serve(ctx context.Context, v *Vault, adminFactory AdminFactory) error {
+	cfg := v.Config()
+
+	if err := EnsureVault(ctx, cfg); err != nil {
+		return fmt.Errorf("server: %w", err)
+	}
+
+	// gRPC listener
+	grpcAddr := fmt.Sprintf("%s:%d", grpcHost(cfg), cfg.Server.GRPC.Port)
+	grpcLis, err := net.Listen("tcp", grpcAddr)
+	if err != nil {
+		return fmt.Errorf("server: listen %s: %w", grpcAddr, err)
+	}
+	defer grpcLis.Close()
+
+	tlsCreds, err := loadTLSCredentials(cfg.Server.GRPC.TLS)
+	if err != nil {
+		return fmt.Errorf("server: tls: %w", err)
+	}
+
+	interceptor, err := NewValidationInterceptor()
+	if err != nil {
+		return fmt.Errorf("server: interceptor: %w", err)
+	}
+
+	opts := []grpc.ServerOption{
+		grpc.MaxRecvMsgSize(MaxMessageSize),
+		grpc.MaxSendMsgSize(MaxMessageSize),
+		grpc.UnaryInterceptor(interceptor),
+	}
+	if tlsCreds != nil {
+		opts = append(opts, grpc.Creds(tlsCreds))
+	}
+	gs := grpc.NewServer(opts...)
+	pb.RegisterVaultServiceServer(gs, NewVaultGRPC(v))
+
+	// Health + reflection (matches Python registration sites:
+	// vault_grpc_server.py:317-331).
+	healthSvc := health.NewServer()
+	healthSvc.SetServingStatus("rune.vault.v1.VaultService", healthpb.HealthCheckResponse_SERVING)
+	healthSvc.SetServingStatus("", healthpb.HealthCheckResponse_SERVING)
+	healthpb.RegisterHealthServer(gs, healthSvc)
+	reflection.Register(gs)
+
+	// Admin UDS listener (optional)
+	var adminShutdown func(context.Context) error
+	if adminFactory != nil {
+		adminShutdown, err = adminFactory(ctx, v)
+		if err != nil {
+			return fmt.Errorf("server: admin: %w", err)
+		}
+	}
+
+	scheme := "insecure"
+	if tlsCreds != nil {
+		scheme = "tls"
+	}
+	slog.Info("vault: gRPC listening", "addr", grpcAddr, "scheme", scheme)
+
+	// Run gRPC in a goroutine; wait for shutdown signal or ctx cancellation.
+	errCh := make(chan error, 1)
+	go func() {
+		errCh <- gs.Serve(grpcLis)
+	}()
+
+	sigCh := make(chan os.Signal, 1)
+	signal.Notify(sigCh, syscall.SIGTERM, syscall.SIGINT)
+	defer signal.Stop(sigCh)
+
+	select {
+	case <-ctx.Done():
+		slog.Info("vault: context cancelled, shutting down")
+	case sig := <-sigCh:
+		slog.Info("vault: signal received, shutting down", "signal", sig.String())
+	case err := <-errCh:
+		if err != nil && !errors.Is(err, grpc.ErrServerStopped) {
+			return fmt.Errorf("server: grpc serve: %w", err)
+		}
+	}
+
+	healthSvc.Shutdown()
+	stopGracefullyOrForce(gs, 5*time.Second)
+	if adminShutdown != nil {
+		shCtx, cancel := context.WithTimeout(context.Background(), 5*time.Second)
+		defer cancel()
+		_ = adminShutdown(shCtx)
+	}
+	if v.RestartRequested() {
+		return ErrRestartRequested
+	}
+	return nil
+}
+
+// stopGracefullyOrForce gives gRPC up to grace to drain in-flight RPCs;
+// on timeout, falls back to a hard Stop so the daemon never hangs at
+// shutdown waiting for an idle reflection/health stream to close.
+func stopGracefullyOrForce(gs *grpc.Server, grace time.Duration) {
+	done := make(chan struct{})
+	go func() {
+		gs.GracefulStop()
+		close(done)
+	}()
+	select {
+	case <-done:
+	case <-time.After(grace):
+		slog.Warn("vault: graceful stop timed out, forcing", "grace", grace)
+		gs.Stop()
+		<-done
+	}
+}
+
+// AdminFactory builds the admin UDS server and returns a shutdown closer.
+// internal/server/admin.go (added in step 6) supplies the production impl.
+type AdminFactory func(ctx context.Context, v *Vault) (shutdown func(context.Context) error, err error)
+
+func grpcHost(cfg *Config) string {
+	if cfg.Server.GRPC.Host == "" {
+		return "0.0.0.0"
+	}
+	return cfg.Server.GRPC.Host
+}
+
+func loadTLSCredentials(t TLSConfig) (credentials.TransportCredentials, error) {
+	if t.Disable {
+		slog.Warn("vault: TLS disabled — gRPC traffic is unencrypted (dev mode only)")
+		return nil, nil
+	}
+	if t.Cert == "" || t.Key == "" {
+		return nil, errors.New("server.grpc.tls.cert and server.grpc.tls.key are required (or set disable=true)")
+	}
+	cert, err := tls.LoadX509KeyPair(t.Cert, t.Key)
+	if err != nil {
+		return nil, fmt.Errorf("load x509 key pair: %w", err)
+	}
+	return credentials.NewServerTLSFromCert(&cert), nil
+}

From 9d2967b8eb0a9e4b02c921ac122ea481b9cd9553 Mon Sep 17 00:00:00 2001
From: Jeonghwan Lee <jhlee@cryptolab.co.kr>
Date: Mon, 27 Apr 2026 12:02:21 +0900
Subject: [PATCH 08/27] refactor: delegate daemon lifecycle to OS service
 manager

---
 vault/internal/commands/daemon.go             |  84 ++++++
 vault/internal/commands/root.go               |  43 +++
 vault/internal/commands/status.go             | 131 +++++++++
 vault/internal/server/config.go               | 248 +++++++++++++++++
 vault/internal/server/config_test.go          | 257 ++++++++++++++++++
 .../server/testdata/runevault.conf.example    |  40 +++
 vault/internal/tests/e2e_test.go              | 188 +++++++++++++
 7 files changed, 991 insertions(+)
 create mode 100644 vault/internal/commands/daemon.go
 create mode 100644 vault/internal/commands/root.go
 create mode 100644 vault/internal/commands/status.go
 create mode 100644 vault/internal/server/config.go
 create mode 100644 vault/internal/server/config_test.go
 create mode 100644 vault/internal/server/testdata/runevault.conf.example
 create mode 100644 vault/internal/tests/e2e_test.go

diff --git a/vault/internal/commands/daemon.go b/vault/internal/commands/daemon.go
new file mode 100644
index 0000000..8a61418
--- /dev/null
+++ b/vault/internal/commands/daemon.go
@@ -0,0 +1,84 @@
+package commands
+
+import (
+	"context"
+	"fmt"
+	"log/slog"
+	"os"
+
+	"github.com/spf13/cobra"
+
+	"github.com/CryptoLabInc/rune-admin/vault/internal/crypto"
+	"github.com/CryptoLabInc/rune-admin/vault/internal/server"
+	"github.com/CryptoLabInc/rune-admin/vault/internal/tokens"
+)
+
+func newDaemonCmd() *cobra.Command {
+	cmd := &cobra.Command{
+		Use:    "daemon",
+		Short:  "Manage the runevault daemon process",
+		Hidden: true,
+	}
+	cmd.AddCommand(newDaemonStartCmd())
+	return cmd
+}
+
+func newDaemonStartCmd() *cobra.Command {
+	return &cobra.Command{
+		Use:   "start",
+		Short: "Start the daemon in the foreground",
+		RunE: func(cmd *cobra.Command, _ []string) error {
+			return runDaemonStart(cmd.Context())
+		},
+	}
+}
+
+func runDaemonStart(ctx context.Context) error {
+	cfg, err := server.LoadConfig(globals.configPath)
+	if err != nil {
+		return err
+	}
+	if globals.adminSocket != "" {
+		cfg.Server.Admin.Socket = globals.adminSocket
+	}
+	if err := cfg.Validate(); err != nil {
+		return err
+	}
+
+	store := tokens.NewStore()
+	if err := store.LoadFromFiles(cfg.Tokens.RolesFile, cfg.Tokens.TokensFile); err != nil {
+		return err
+	}
+	defer store.Shutdown()
+
+	keyParams := crypto.KeysParams{
+		Root:  cfg.Keys.Path,
+		KeyID: "vault-key",
+		Dim:   cfg.Keys.EmbeddingDim,
+	}
+	if err := crypto.EnsureKeys(keyParams); err != nil {
+		return fmt.Errorf("daemon: ensure keys: %w", err)
+	}
+	keys, err := crypto.OpenSecretKey(keyParams)
+	if err != nil {
+		return fmt.Errorf("daemon: open sec key: %w", err)
+	}
+	defer keys.Close()
+
+	audit, err := server.NewAuditLogger(cfg.Audit)
+	if err != nil {
+		return err
+	}
+	defer audit.Close()
+
+	v := server.NewVault(cfg, store, keys, audit)
+	defer v.Close()
+
+	slog.Info("vault: starting daemon",
+		"pid", os.Getpid(),
+		"config", cfg.Source,
+		"grpc_addr", fmt.Sprintf("%s:%d", cfg.Server.GRPC.Host, cfg.Server.GRPC.Port),
+		"admin_socket", cfg.Server.Admin.Socket)
+
+	return server.Serve(ctx, v, server.AdminFromConfig)
+}
diff --git a/vault/internal/commands/root.go b/vault/internal/commands/root.go
new file mode 100644
index 0000000..839ae2b
--- /dev/null
+++ b/vault/internal/commands/root.go
@@ -0,0 +1,43 @@
+package commands
+
+import (
+	"github.com/spf13/cobra"
+)
+
+type globalFlags struct {
+	configPath  string
+	adminSocket string
+}
+
+var globals globalFlags
+
+func newRootCmd() *cobra.Command {
+	cmd := &cobra.Command{
+		Use:           "runevault",
+		Short:         "Rune Vault daemon server with admin CLI",
+		SilenceUsage:  true,
+		SilenceErrors: true,
+		CompletionOptions: cobra.CompletionOptions{
+			HiddenDefaultCmd: true,
+		},
+	}
+
+	cmd.PersistentFlags().StringVar(&globals.configPath, "config", "",
+		"Path to runevault.conf (default: /opt/runevault/configs/runevault.conf, then ./runevault.conf)")
+	cmd.PersistentFlags().StringVar(&globals.adminSocket, "admin-socket", "",
+		"Override server.admin.socket from config")
+
+	cmd.AddCommand(
+		newVersionCmd(),
+		newDaemonCmd(),
+		newTokenCmd(),
+		newRoleCmd(),
+		newStatusCmd(),
+	)
+
+	return cmd
+}
+
+func Execute() error {
+	return newRootCmd().Execute()
+}
diff --git a/vault/internal/commands/status.go b/vault/internal/commands/status.go
new file mode 100644
index 0000000..3125ba9
--- /dev/null
+++ b/vault/internal/commands/status.go
@@ -0,0 +1,131 @@
+package commands
+
+import (
+	"context"
+	"crypto/tls"
+	"fmt"
+	"net"
+	"net/http"
+	"os"
+	"time"
+
+	"github.com/spf13/cobra"
+	"google.golang.org/grpc"
+	"google.golang.org/grpc/credentials"
+	"google.golang.org/grpc/credentials/insecure"
+	healthpb "google.golang.org/grpc/health/grpc_health_v1"
+
+	"github.com/CryptoLabInc/rune-admin/vault/internal/server"
+)
+
+func newStatusCmd() *cobra.Command {
+	return &cobra.Command{
+		Use:   "status",
+		Short: "Report daemon health and socket liveness",
+		RunE: func(cmd *cobra.Command, _ []string) error {
+			return runStatus(cmd)
+		},
+	}
+}
+
+type statusReport struct {
+	adminSocket  string
+	adminUp      bool
+	adminError   string
+	grpcBind     string
+	grpcProbe    string
+	grpcServing  bool
+	grpcError    string
+	configSource string
+}
+
+func runStatus(cmd *cobra.Command) error {
+	cfg, err := server.LoadConfig(globals.configPath)
+	if err != nil {
+		return err
+	}
+
+	bindHost := cfg.Server.GRPC.Host
+	probeHost := bindHost
+	if probeHost == "" || probeHost == "0.0.0.0" {
+		probeHost = "127.0.0.1"
+	}
+
+	r := statusReport{
+		adminSocket:  cfg.Server.Admin.Socket,
+		grpcBind:     fmt.Sprintf("%s:%d", bindHost, cfg.Server.GRPC.Port),
+		grpcProbe:    fmt.Sprintf("%s:%d", probeHost, cfg.Server.GRPC.Port),
+		configSource: cfg.Source,
+	}
+	if globals.adminSocket != "" {
+		r.adminSocket = globals.adminSocket
+	}
+
+	r.adminUp, r.adminError = probeAdminUDS(r.adminSocket)
+	r.grpcServing, r.grpcError = probeGRPCHealth(r.grpcProbe, cfg.Server.GRPC.TLS.Disable)
+
+	out := cmd.OutOrStdout()
+	fmt.Fprintf(out, "Config:       %s\n", r.configSource)
+	fmt.Fprintf(out, "Admin socket: %s (%s)\n", r.adminSocket, healthStr(r.adminUp, r.adminError))
+	fmt.Fprintf(out, "gRPC:         %s (%s)\n", r.grpcBind, healthStr(r.grpcServing, r.grpcError))
+
+	if !(r.adminUp && r.grpcServing) {
+		os.Exit(2)
+	}
+	return nil
+}
+
+func healthStr(ok bool, errMsg string) string {
+	if ok {
+		return "ok"
+	}
+	if errMsg != "" {
+		return "down — " + errMsg
+	}
+	return "down"
+}
+
+func probeAdminUDS(path string) (bool, string) {
+	if path == "" {
+		return false, "socket path empty"
+	}
+	hc := &http.Client{
+		Timeout: 2 * time.Second,
+		Transport: &http.Transport{
+			DialContext: func(ctx context.Context, _, _ string) (net.Conn, error) {
+				return (&net.Dialer{}).DialContext(ctx, "unix", path)
+			},
+			DisableKeepAlives: true,
+		},
+	}
+	resp, err := hc.Get("http://admin/health")
+	if err != nil {
+		return false, err.Error()
+	}
+	defer resp.Body.Close()
+	return resp.StatusCode == 200, ""
+}
+
+func probeGRPCHealth(addr string, tlsDisabled bool) (bool, string) {
+	ctx, cancel := context.WithTimeout(context.Background(), 2*time.Second)
+	defer cancel()
+	var creds grpc.DialOption
+	if tlsDisabled {
+		creds = grpc.WithTransportCredentials(insecure.NewCredentials())
+	} else {
+		// InsecureSkipVerify is intentional: status probe is local-only and
+		// does not need to verify the self-signed server cert.
+		creds = grpc.WithTransportCredentials(credentials.NewTLS(&tls.Config{InsecureSkipVerify: true})) //nolint:gosec
+	}
+	conn, err := grpc.NewClient(addr, creds)
+	if err != nil {
+		return false, err.Error()
+	}
+	defer conn.Close()
+	cli := healthpb.NewHealthClient(conn)
+	resp, err := cli.Check(ctx, &healthpb.HealthCheckRequest{})
+	if err != nil {
+		return false, err.Error()
+	}
+	return resp.GetStatus() == healthpb.HealthCheckResponse_SERVING, ""
+}
diff --git a/vault/internal/server/config.go b/vault/internal/server/config.go
new file mode 100644
index 0000000..1ddaeb3
--- /dev/null
+++ b/vault/internal/server/config.go
@@ -0,0 +1,248 @@
+// Package server hosts the daemon transports (gRPC, admin UDS), audit log,
+// and runtime configuration. Pure crypto/token logic lives in internal/crypto
+// and internal/tokens respectively.
+package server
+
+import (
+	"errors"
+	"fmt"
+	"io/fs"
+	"log/slog"
+	"os"
+	"path/filepath"
+	"strings"
+
+	"gopkg.in/yaml.v3"
+)
+
+// ConfigLookupPaths lists, in priority order, the on-disk locations that
+// LoadConfig probes when the caller doesn't pass an explicit path.
+var ConfigLookupPaths = []string{
+	"/opt/runevault/configs/runevault.conf",
+	"./runevault.conf",
+}
+
+// 0640: group-readable so runevault group members can run CLI commands without sudo.
+const expectedSecretMode fs.FileMode = 0o640
+
+// Config is the in-memory shape of runevault.conf. Field names follow the
+// YAML schema exactly so the loader can decode without an intermediate type.
+type Config struct {
+	Server   ServerConfig   `yaml:"server"`
+	Keys     KeysConfig     `yaml:"keys"`
+	Envector EnvectorConfig `yaml:"envector"`
+	Tokens   TokensConfig   `yaml:"tokens"`
+	Audit    AuditConfig    `yaml:"audit"`
+
+	// Source records where this Config was loaded from (resolved absolute
+	// path), populated by LoadConfig. Empty for in-memory test configs.
+	Source string `yaml:"-" json:"-"`
+}
+
+type ServerConfig struct {
+	GRPC  GRPCConfig  `yaml:"grpc"`
+	Admin AdminConfig `yaml:"admin"`
+}
+
+type GRPCConfig struct {
+	Host string    `yaml:"host"`
+	Port int       `yaml:"port"`
+	TLS  TLSConfig `yaml:"tls"`
+}
+
+type TLSConfig struct {
+	Cert    string `yaml:"cert"`
+	Key     string `yaml:"key"`
+	Disable bool   `yaml:"disable"`
+}
+
+type AdminConfig struct {
+	Socket string `yaml:"socket"`
+}
+
+type KeysConfig struct {
+	Path         string `yaml:"path"`
+	IndexName    string `yaml:"index_name"`
+	EmbeddingDim int    `yaml:"embedding_dim"`
+}
+
+// EnvectorConfig accepts either an inline api_key or an api_key_file
+// pointing at a 0600-mode file containing the same value. If both are
+// set, api_key_file wins. Resolve() materialises the final string into
+// APIKey and clears APIKeyFile.
+type EnvectorConfig struct {
+	Endpoint   string `yaml:"endpoint"`
+	APIKey     string `yaml:"api_key"`
+	APIKeyFile string `yaml:"api_key_file"`
+}
+
+type TokensConfig struct {
+	TeamSecret     string `yaml:"team_secret"`
+	TeamSecretFile string `yaml:"team_secret_file"`
+	RolesFile      string `yaml:"roles_file"`
+	TokensFile     string `yaml:"tokens_file"`
+}
+
+// AuditConfig.Mode is one of: "", "file", "stdout", "file+stdout".
+// Empty disables audit logging.
+type AuditConfig struct {
+	Mode string `yaml:"mode"`
+	Path string `yaml:"path"`
+}
+
+// LoadConfig resolves the config path (caller override → ConfigLookupPaths)
+// and decodes the YAML at that location. The returned Config has
+// *_file indirection materialised into the corresponding inline fields
+// and Source set to the resolved absolute path.
+//
+// Missing config produces an error that names every path probed so the
+// operator can copy the example file into place.
+func LoadConfig(override string) (*Config, error) {
+	path, searched, err := resolveConfigPath(override)
+	if err != nil {
+		return nil, err
+	}
+
+	data, err := os.ReadFile(path)
+	if err != nil {
+		return nil, fmt.Errorf("read config %s: %w", path, err)
+	}
+
+	var cfg Config
+	dec := yaml.NewDecoder(strings.NewReader(string(data)))
+	dec.KnownFields(true)
+	if err := dec.Decode(&cfg); err != nil {
+		return nil, fmt.Errorf("parse config %s: %w (searched: %s)", path, err, strings.Join(searched, ", "))
+	}
+	cfg.Source = path
+
+	checkSecretMode(path, "runevault.conf")
+
+	if err := cfg.Resolve(); err != nil {
+		return nil, fmt.Errorf("resolve config %s: %w", path, err)
+	}
+	return &cfg, nil
+}
+
+// resolveConfigPath returns the path to use plus the list of all paths
+// searched (for error messages). Override wins if non-empty.
+func resolveConfigPath(override string) (path string, searched []string, err error) {
+	if override != "" {
+		searched = append(searched, override)
+		if _, statErr := os.Stat(override); statErr != nil {
+			return "", searched, fmt.Errorf("config file not found at --config %s: %w", override, statErr)
+		}
+		abs, _ := filepath.Abs(override)
+		return abs, searched, nil
+	}
+	for _, p := range ConfigLookupPaths {
+		searched = append(searched, p)
+		if _, statErr := os.Stat(p); statErr == nil {
+			abs, _ := filepath.Abs(p)
+			return abs, searched, nil
+		}
+	}
+	return "", searched, fmt.Errorf("config file not found (searched: %s)", strings.Join(searched, ", "))
+}
+
+// Resolve materialises *_file indirections into their inline equivalents
+// and warns about any non-0600 secret files. Idempotent.
+func (c *Config) Resolve() error {
+	if c.Envector.APIKeyFile != "" {
+		val, err := readSecretFile(c.Envector.APIKeyFile, "envector.api_key_file")
+		if err != nil {
+			return err
+		}
+		c.Envector.APIKey = val
+		c.Envector.APIKeyFile = ""
+	}
+	if c.Tokens.TeamSecretFile != "" {
+		val, err := readSecretFile(c.Tokens.TeamSecretFile, "tokens.team_secret_file")
+		if err != nil {
+			return err
+		}
+		c.Tokens.TeamSecret = val
+		c.Tokens.TeamSecretFile = ""
+	}
+	return nil
+}
+
+func readSecretFile(path, label string) (string, error) {
+	checkSecretMode(path, label)
+	b, err := os.ReadFile(path)
+	if err != nil {
+		return "", fmt.Errorf("read %s %s: %w", label, path, err)
+	}
+	return strings.TrimRight(string(b), "\n"), nil
+}
+
+// checkSecretMode emits a warning (does not fail) if the file mode is
+// less restrictive than 0600. The warning is only written for non-empty
+// paths that exist; missing files are surfaced by the caller's read.
+func checkSecretMode(path, label string) {
+	info, err := os.Stat(path)
+	if err != nil {
+		return
+	}
+	mode := info.Mode().Perm()
+	if mode&^expectedSecretMode != 0 {
+		slog.Warn("config: secret file mode is too permissive",
+			"label", label,
+			"path", path,
+			"mode", fmt.Sprintf("%04o", mode),
+			"expected", "0640")
+	}
+}
+
+// Redact returns a copy of c with secret fields replaced by sentinel
+// strings. Use this for any debug dumps, structured log payloads, or
+// admin endpoints that surface configuration to operators.
+func (c *Config) Redact() Config {
+	out := *c
+	if out.Envector.APIKey != "" {
+		out.Envector.APIKey = "[REDACTED]"
+	}
+	if out.Envector.APIKeyFile != "" {
+		out.Envector.APIKeyFile = "[REDACTED]"
+	}
+	if out.Tokens.TeamSecret != "" {
+		out.Tokens.TeamSecret = "[REDACTED]"
+	}
+	if out.Tokens.TeamSecretFile != "" {
+		out.Tokens.TeamSecretFile = "[REDACTED]"
+	}
+	return out
+}
+
+// Validate enforces invariants the daemon needs at startup.
+// Returns nil for fully populated configs.
+func (c *Config) Validate() error {
+	var errs []string
+	if c.Server.Admin.Socket == "" {
+		errs = append(errs, "server.admin.socket is required")
+	}
+	if c.Server.GRPC.Port == 0 {
+		errs = append(errs, "server.grpc.port is required")
+	}
+	if !c.Server.GRPC.TLS.Disable {
+		if c.Server.GRPC.TLS.Cert == "" || c.Server.GRPC.TLS.Key == "" {
+			errs = append(errs, "server.grpc.tls.cert and server.grpc.tls.key are required (or set server.grpc.tls.disable=true)")
+		}
+	}
+	if c.Keys.Path == "" {
+		errs = append(errs, "keys.path is required")
+	}
+	if c.Keys.EmbeddingDim == 0 {
+		errs = append(errs, "keys.embedding_dim is required")
+	}
+	if c.Tokens.RolesFile == "" {
+		errs = append(errs, "tokens.roles_file is required")
+	}
+	if c.Tokens.TokensFile == "" {
+		errs = append(errs, "tokens.tokens_file is required")
+	}
+	if len(errs) > 0 {
+		return errors.New("config invalid:\n  - " + strings.Join(errs, "\n  - "))
+	}
+	return nil
+}
diff --git a/vault/internal/server/config_test.go b/vault/internal/server/config_test.go
new file mode 100644
index 0000000..c791341
--- /dev/null
+++ b/vault/internal/server/config_test.go
@@ -0,0 +1,257 @@
+package server
+
+import (
+	"os"
+	"path/filepath"
+	"strings"
+	"testing"
+)
+
+// minimalValidConfig returns a YAML body that satisfies Validate().
+func minimalValidConfig(t *testing.T) string {
+	t.Helper()
+	return `server:
+  grpc:
+    host: 127.0.0.1
+    port: 50051
+    tls:
+      disable: true
+  admin:
+    socket: /tmp/admin.sock
+keys:
+  path: /tmp/vault-keys
+  embedding_dim: 1024
+envector:
+  endpoint: https://example.com
+  api_key: inline-api-key
+tokens:
+  team_secret: inline-team-secret-deadbeef
+  roles_file: /tmp/roles.yml
+  tokens_file: /tmp/tokens.yml
+audit:
+  mode: stdout
+`
+}
+
+func writeConfig(t *testing.T, body string) string {
+	t.Helper()
+	dir := t.TempDir()
+	path := filepath.Join(dir, "runevault.conf")
+	if err := os.WriteFile(path, []byte(body), 0o600); err != nil {
+		t.Fatal(err)
+	}
+	return path
+}
+
+func TestLoadConfigMinimalValid(t *testing.T) {
+	path := writeConfig(t, minimalValidConfig(t))
+	cfg, err := LoadConfig(path)
+	if err != nil {
+		t.Fatal(err)
+	}
+	if cfg.Server.GRPC.Port != 50051 {
+		t.Errorf("port = %d, want 50051", cfg.Server.GRPC.Port)
+	}
+	if cfg.Tokens.TeamSecret != "inline-team-secret-deadbeef" {
+		t.Errorf("team_secret = %q, want inline value", cfg.Tokens.TeamSecret)
+	}
+	if cfg.Source != path {
+		// Source may be absolute even if path is already absolute (it should match).
+		abs, _ := filepath.Abs(path)
+		if cfg.Source != abs {
+			t.Errorf("Source = %q, want %q", cfg.Source, abs)
+		}
+	}
+	if err := cfg.Validate(); err != nil {
+		t.Errorf("Validate: %v", err)
+	}
+}
+
+func TestLoadConfigMissingNamesAllPaths(t *testing.T) {
+	_, err := LoadConfig("/tmp/this/path/does/not/exist/runevault.conf")
+	if err == nil {
+		t.Fatal("expected error for missing config")
+	}
+	if !strings.Contains(err.Error(), "/tmp/this/path/does/not/exist/runevault.conf") {
+		t.Errorf("err missing override path: %v", err)
+	}
+}
+
+func TestLoadConfigDefaultLookupErrorListsPaths(t *testing.T) {
+	// Stash the package-level lookup list and restore.
+	orig := ConfigLookupPaths
+	defer func() { ConfigLookupPaths = orig }()
+	ConfigLookupPaths = []string{"/nope/a.conf", "/nope/b.conf"}
+
+	_, err := LoadConfig("")
+	if err == nil {
+		t.Fatal("expected error")
+	}
+	for _, p := range ConfigLookupPaths {
+		if !strings.Contains(err.Error(), p) {
+			t.Errorf("err missing %s: %v", p, err)
+		}
+	}
+}
+
+func TestLoadConfigUnknownFieldsRejected(t *testing.T) {
+	body := minimalValidConfig(t) + "extra_unknown_field: 42\n"
+	path := writeConfig(t, body)
+	_, err := LoadConfig(path)
+	if err == nil {
+		t.Error("unknown top-level field accepted, want strict error")
+	}
+}
+
+func TestLoadConfigAPIKeyFileIndirection(t *testing.T) {
+	dir := t.TempDir()
+	keyFile := filepath.Join(dir, "envector.key")
+	if err := os.WriteFile(keyFile, []byte("file-api-key\n"), 0o600); err != nil {
+		t.Fatal(err)
+	}
+	body := strings.Replace(
+		minimalValidConfig(t),
+		"  api_key: inline-api-key",
+		"  api_key_file: "+keyFile,
+		1,
+	)
+	path := writeConfig(t, body)
+	cfg, err := LoadConfig(path)
+	if err != nil {
+		t.Fatal(err)
+	}
+	if cfg.Envector.APIKey != "file-api-key" {
+		t.Errorf("api_key = %q, want file-api-key", cfg.Envector.APIKey)
+	}
+	if cfg.Envector.APIKeyFile != "" {
+		t.Errorf("api_key_file should be cleared after Resolve, got %q", cfg.Envector.APIKeyFile)
+	}
+}
+
+func TestLoadConfigTeamSecretFileIndirection(t *testing.T) {
+	dir := t.TempDir()
+	secretFile := filepath.Join(dir, "team.secret")
+	if err := os.WriteFile(secretFile, []byte("file-team-secret"), 0o600); err != nil {
+		t.Fatal(err)
+	}
+	body := strings.Replace(
+		minimalValidConfig(t),
+		"  team_secret: inline-team-secret-deadbeef",
+		"  team_secret_file: "+secretFile,
+		1,
+	)
+	path := writeConfig(t, body)
+	cfg, err := LoadConfig(path)
+	if err != nil {
+		t.Fatal(err)
+	}
+	if cfg.Tokens.TeamSecret != "file-team-secret" {
+		t.Errorf("team_secret = %q, want file-team-secret", cfg.Tokens.TeamSecret)
+	}
+}
+
+func TestLoadConfigSecretFileMissing(t *testing.T) {
+	body := strings.Replace(
+		minimalValidConfig(t),
+		"  team_secret: inline-team-secret-deadbeef",
+		"  team_secret_file: /nope/team.secret",
+		1,
+	)
+	path := writeConfig(t, body)
+	_, err := LoadConfig(path)
+	if err == nil {
+		t.Fatal("expected error for missing team_secret_file")
+	}
+	if !strings.Contains(err.Error(), "team_secret_file") {
+		t.Errorf("err missing label: %v", err)
+	}
+}
+
+func TestRedactMasksSecrets(t *testing.T) {
+	cfg := &Config{
+		Envector: EnvectorConfig{APIKey: "deadbeef", APIKeyFile: "/x"},
+		Tokens:   TokensConfig{TeamSecret: "supersecret", TeamSecretFile: "/y"},
+	}
+	r := cfg.Redact()
+	if r.Envector.APIKey != "[REDACTED]" {
+		t.Errorf("api_key not redacted: %q", r.Envector.APIKey)
+	}
+	if r.Envector.APIKeyFile != "[REDACTED]" {
+		t.Errorf("api_key_file not redacted: %q", r.Envector.APIKeyFile)
+	}
+	if r.Tokens.TeamSecret != "[REDACTED]" {
+		t.Errorf("team_secret not redacted: %q", r.Tokens.TeamSecret)
+	}
+	if r.Tokens.TeamSecretFile != "[REDACTED]" {
+		t.Errorf("team_secret_file not redacted: %q", r.Tokens.TeamSecretFile)
+	}
+	// Original must be untouched.
+	if cfg.Envector.APIKey != "deadbeef" {
+		t.Errorf("Redact mutated original")
+	}
+}
+
+func TestValidateRejectsMissingFields(t *testing.T) {
+	cases := map[string]func(*Config){
+		"missing socket":      func(c *Config) { c.Server.Admin.Socket = "" },
+		"missing port":        func(c *Config) { c.Server.GRPC.Port = 0 },
+		"missing keys.path":   func(c *Config) { c.Keys.Path = "" },
+		"missing dim":         func(c *Config) { c.Keys.EmbeddingDim = 0 },
+		"missing roles_file":  func(c *Config) { c.Tokens.RolesFile = "" },
+		"missing tokens_file": func(c *Config) { c.Tokens.TokensFile = "" },
+	}
+	base := func() *Config {
+		path := writeConfig(t, minimalValidConfig(t))
+		c, err := LoadConfig(path)
+		if err != nil {
+			t.Fatal(err)
+		}
+		return c
+	}
+	for name, mut := range cases {
+		t.Run(name, func(t *testing.T) {
+			c := base()
+			mut(c)
+			if err := c.Validate(); err == nil {
+				t.Errorf("Validate accepted %s", name)
+			}
+		})
+	}
+}
+
+func TestValidateRejectsTLSWithoutCertKey(t *testing.T) {
+	body := strings.Replace(
+		minimalValidConfig(t),
+		"      disable: true",
+		"      disable: false",
+		1,
+	)
+	path := writeConfig(t, body)
+	cfg, err := LoadConfig(path)
+	if err != nil {
+		t.Fatal(err)
+	}
+	if err := cfg.Validate(); err == nil {
+		t.Error("Validate accepted TLS enabled without cert/key")
+	}
+}
+
+func TestExampleConfigParsesCleanly(t *testing.T) {
+	// The committed example file should at least parse — operators copy it.
+	data, err := os.ReadFile("testdata/runevault.conf.example")
+	if err != nil {
+		t.Fatal(err)
+	}
+	tmp := t.TempDir()
+	path := filepath.Join(tmp, "example.conf")
+	if err := os.WriteFile(path, data, 0o600); err != nil {
+		t.Fatal(err)
+	}
+	cfg, err := LoadConfig(path)
+	if err != nil {
+		t.Fatalf("example file failed to parse: %v", err)
+	}
+	if cfg.Server.GRPC.Port != 50051 {
+		t.Errorf("example: port = %d", cfg.Server.GRPC.Port)
+	}
+}
diff --git a/vault/internal/server/testdata/runevault.conf.example b/vault/internal/server/testdata/runevault.conf.example
new file mode 100644
index 0000000..70243e9
--- /dev/null
+++ b/vault/internal/server/testdata/runevault.conf.example
@@ -0,0 +1,40 @@
+# runevault.conf — example deployment configuration.
+#
+# Lookup order:
+#   1. --config <path> CLI flag
+#   2. /opt/rune-vault/configs/runevault.conf
+#   3. ./runevault.conf (cwd, dev only)
+#
+# This file should be mode 0600, owned by the vault-user.
+# Replace placeholder values before use.
+
+server:
+  grpc:
+    host: 0.0.0.0
+    port: 50051
+    tls:
+      cert: /opt/rune-vault/certs/server.pem
+      key: /opt/rune-vault/certs/server.key
+      disable: false        # true for dev only — never in production
+  admin:
+    socket: /opt/rune-vault/admin.sock
+
+keys:
+  path: /opt/rune-vault/vault-keys
+  index_name: my-team
+  embedding_dim: 1024
+
+envector:
+  endpoint: https://envector.example.com
+  api_key: REPLACE_WITH_API_KEY
+  # Alternative: api_key_file: /run/secrets/envector_api_key
+
+tokens:
+  team_secret: REPLACE_WITH_RANDOM_HEX_32
+  # Alternative: team_secret_file: /run/secrets/team_secret
+  roles_file: /opt/rune-vault/configs/roles.yml
+  tokens_file: /opt/rune-vault/configs/tokens.yml
+
+audit:
+  mode: file+stdout         # one of: "", file, stdout, file+stdout
+  path: /opt/rune-vault/logs/audit.log
diff --git a/vault/internal/tests/e2e_test.go b/vault/internal/tests/e2e_test.go
new file mode 100644
index 0000000..33d3ddf
--- /dev/null
+++ b/vault/internal/tests/e2e_test.go
@@ -0,0 +1,188 @@
+//go:build e2e
+
+package tests
+
+import (
+	"fmt"
+	"os"
+	"os/exec"
+	"path/filepath"
+	"strings"
+	"syscall"
+	"testing"
+	"time"
+)
+
+// TestE2EDaemonLifecycle boots runevault as a daemon against a tmp config
+// (TLS disabled), exercises token/role CLI operations through the admin UDS,
+// then verifies daemon stop.
+//
+// Set RUNEVAULT_TEST_BINARY to a pre-built binary path to skip the in-test
+// build step (required in CI — run `mise run go:build` first).
+func TestE2EDaemonLifecycle(t *testing.T) {
+	repoRoot := RepoRoot()
+	tmp, err := os.MkdirTemp("", "vts-")
+	if err != nil {
+		t.Fatal(err)
+	}
+	t.Cleanup(func() { os.RemoveAll(tmp) })
+
+	binary := resolveBinary(t, repoRoot, tmp)
+
+	confPath := filepath.Join(tmp, "runevault.conf")
+	conf := fmt.Sprintf(`server:
+  grpc:
+    host: 127.0.0.1
+    port: 53052
+    tls:
+      disable: true
+  admin:
+    socket: %[1]s/x.sock
+keys:
+  path: %[1]s/keys
+  embedding_dim: 1024
+envector:
+  endpoint: ""
+  api_key: ""
+tokens:
+  team_secret: smoke-secret
+  roles_file: %[1]s/roles.yml
+  tokens_file: %[1]s/tokens.yml
+audit:
+  mode: stdout
+`, tmp)
+	if err := os.WriteFile(confPath, []byte(conf), 0o600); err != nil {
+		t.Fatal(err)
+	}
+
+	// Spawn daemon in background.
+	daemon := exec.Command(binary, "--config", confPath, "daemon", "start")
+	logFile, err := os.Create(filepath.Join(tmp, "daemon.log"))
+	if err != nil {
+		t.Fatal(err)
+	}
+	defer logFile.Close()
+	daemon.Stdout = logFile
+	daemon.Stderr = logFile
+	if err := daemon.Start(); err != nil {
+		t.Fatalf("daemon start: %v", err)
+	}
+	daemonPID := daemon.Process.Pid
+	// Reap the daemon promptly when it exits — without this, the kernel
+	// keeps it as a zombie and PIDLive (kill -0) returns true even though
+	// the daemon has already finished its shutdown sequence. That defeats
+	// `daemon stop`'s liveness poll.
+	waitDone := make(chan error, 1)
+	go func() { waitDone <- daemon.Wait() }()
+	t.Cleanup(func() {
+		// Send SIGKILL via syscall so we don't race with cmd.Wait's fd close.
+		_ = syscall.Kill(daemonPID, syscall.SIGKILL)
+		select {
+		case <-waitDone:
+		case <-time.After(2 * time.Second):
+		}
+	})
+
+	// Wait for the admin socket to appear (FHE key generation can take a
+	// few seconds on cold starts).
+	socket := filepath.Join(tmp, "x.sock")
+	if !waitFor(socket, 30*time.Second) {
+		body, _ := os.ReadFile(filepath.Join(tmp, "daemon.log"))
+		t.Fatalf("admin socket never appeared\ndaemon log:\n%s", body)
+	}
+
+	run := func(args ...string) (string, error) {
+		cmd := exec.Command(binary, append([]string{"--config", confPath}, args...)...)
+		out, err := cmd.CombinedOutput()
+		return string(out), err
+	}
+
+	// ── status ──
+	out, err := run("status")
+	if err != nil {
+		t.Fatalf("status: %v\n%s", err, out)
+	}
+	if !strings.Contains(out, "Admin socket:") || !strings.Contains(out, "ok)") {
+		t.Errorf("status output unexpected:\n%s", out)
+	}
+
+	// ── token issue ──
+	out, err = run("token", "issue", "--user", "alice", "--role", "member", "--expires", "30d")
+	if err != nil {
+		t.Fatalf("issue: %v\n%s", err, out)
+	}
+	if !strings.Contains(out, "Token issued for 'alice'") {
+		t.Errorf("issue output: %s", out)
+	}
+	if !strings.Contains(out, "evt_") {
+		t.Errorf("token not in output: %s", out)
+	}
+
+	// ── token list ──
+	out, err = run("token", "list")
+	if err != nil {
+		t.Fatalf("list: %v\n%s", err, out)
+	}
+	if !strings.Contains(out, "alice") || !strings.Contains(out, "member") {
+		t.Errorf("list output missing alice: %s", out)
+	}
+
+	// ── role list (defaults present) ──
+	out, err = run("role", "list")
+	if err != nil {
+		t.Fatalf("role list: %v\n%s", err, out)
+	}
+	if !strings.Contains(out, "admin") || !strings.Contains(out, "member") {
+		t.Errorf("role list output: %s", out)
+	}
+
+	// ── token revoke ──
+	out, err = run("token", "revoke", "--user", "alice")
+	if err != nil {
+		t.Fatalf("revoke: %v\n%s", err, out)
+	}
+	if !strings.Contains(out, "Revoked") {
+		t.Errorf("revoke output: %s", out)
+	}
+
+	// Signal daemon to shut down gracefully via SIGTERM (lifecycle is OS-managed).
+	if err := syscall.Kill(daemonPID, syscall.SIGTERM); err != nil {
+		t.Fatalf("SIGTERM daemon: %v", err)
+	}
+	select {
+	case <-waitDone:
+	case <-time.After(10 * time.Second):
+		t.Errorf("daemon did not exit after SIGTERM")
+	}
+}
+
+// resolveBinary returns the runevault binary path. If RUNEVAULT_TEST_BINARY
+// is set it is used as-is (relative paths are resolved from repoRoot).
+// Otherwise the binary is built from source into tmp.
+func resolveBinary(t *testing.T, repoRoot, tmp string) string {
+	t.Helper()
+	if p := os.Getenv("RUNEVAULT_TEST_BINARY"); p != "" {
+		if !filepath.IsAbs(p) {
+			p = filepath.Join(repoRoot, p)
+		}
+		return p
+	}
+	binary := filepath.Join(tmp, "runevault")
+	build := exec.Command("go", "build", "-o", binary, "./cmd")
+	build.Dir = filepath.Join(repoRoot, "vault")
+	if out, err := build.CombinedOutput(); err != nil {
+		t.Fatalf("build: %v\n%s", err, out)
+	}
+	return binary
+}
+
+func waitFor(path string, dur time.Duration) bool {
+	deadline := time.Now().Add(dur)
+	for time.Now().Before(deadline) {
+		if _, err := os.Stat(path); err == nil {
+			return true
+		}
+		time.Sleep(100 * time.Millisecond)
+	}
+	return false
+}

From 5b1e922df3dc573cf1cffd2d46fd9cc10bfdf3c1 Mon Sep 17 00:00:00 2001
From: Jeonghwan Lee <jhlee@cryptolab.co.kr>
Date: Mon, 27 Apr 2026 12:43:55 +0900
Subject: [PATCH 09/27] feat: add logs command to tail daemon output

Wraps tail (macOS) or journalctl (Linux) with optional -f flag.
Log path is derived from config source on macOS; Linux delegates to journald.
---
 vault/internal/commands/logs.go | 66 +++++++++++++++++++++++++++++++++
 vault/internal/commands/root.go |  1 +
 2 files changed, 67 insertions(+)
 create mode 100644 vault/internal/commands/logs.go

diff --git a/vault/internal/commands/logs.go b/vault/internal/commands/logs.go
new file mode 100644
index 0000000..138c958
--- /dev/null
+++ b/vault/internal/commands/logs.go
@@ -0,0 +1,66 @@
+package commands
+
+import (
+	"os"
+	"os/exec"
+	"path/filepath"
+	"runtime"
+
+	"github.com/spf13/cobra"
+
+	"github.com/CryptoLabInc/rune-admin/vault/internal/server"
+)
+
+// newLogsCmd returns the "logs" subcommand which tails the daemon log output.
+// On Linux it delegates to journalctl; on macOS it tails the service stderr file.
+func newLogsCmd() *cobra.Command {
+	var follow bool
+	cmd := &cobra.Command{
+		Use:   "logs",
+		Short: "Show daemon log output",
+		RunE: func(cmd *cobra.Command, _ []string) error {
+			return runLogs(follow)
+		},
+	}
+	cmd.Flags().BoolVarP(&follow, "follow", "f", false, "Follow log output (like tail -f)")
+	return cmd
+}
+
+func runLogs(follow bool) error {
+	if runtime.GOOS == "linux" {
+		args := []string{"-u", "runevault", "--no-pager"}
+		if follow {
+			args = append(args, "-f")
+		}
+		c := exec.Command("journalctl", args...)
+		c.Stdout = os.Stdout
+		c.Stderr = os.Stderr
+		return c.Run()
+	}
+
+	cfg, err := server.LoadConfig(globals.configPath)
+	if err != nil {
+		return err
+	}
+	logPath := daemonStderrLogPath(cfg)
+
+	var args []string
+	if follow {
+		args = append(args, "-f")
+	}
+	args = append(args, logPath)
+	c := exec.Command("tail", args...)
+	c.Stdout = os.Stdout
+	c.Stderr = os.Stderr
+	return c.Run()
+}
+
+// daemonStderrLogPath derives the launchd stderr log path from the config
+// source location: /opt/runevault/configs/runevault.conf → /opt/runevault/logs/runevault.stderr.log
+func daemonStderrLogPath(cfg *server.Config) string {
+	if cfg.Source != "" {
+		prefix := filepath.Dir(filepath.Dir(cfg.Source))
+		return filepath.Join(prefix, "logs", "runevault.stderr.log")
+	}
+	return "/opt/runevault/logs/runevault.stderr.log"
+}
diff --git a/vault/internal/commands/root.go b/vault/internal/commands/root.go
index 839ae2b..7a22b11 100644
--- a/vault/internal/commands/root.go
+++ b/vault/internal/commands/root.go
@@ -33,6 +33,7 @@ func newRootCmd() *cobra.Command {
 		newTokenCmd(),
 		newRoleCmd(),
 		newStatusCmd(),
+		newLogsCmd(),
 	)
 
 	return cmd

From f65edd967ec963a70253b626d67d7437879da128 Mon Sep 17 00:00:00 2001
From: Jeonghwan Lee <jhlee@cryptolab.co.kr>
Date: Mon, 27 Apr 2026 13:46:23 +0900
Subject: [PATCH 10/27] feat: add cloud (CSP) installation to install.sh
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- Add --target <local|aws|gcp|oci> flag and interactive target menu
- Add --install-dir flag for CSP install directory override
- Add CSP dispatch functions: resolve_target, csp_preflight,
  csp_prompt_config, csp_generate_ssh_key, csp_copy_terraform_files,
  csp_render_tfvars, csp_run_terraform, csp_post_deploy, csp_summary
- Add RUNEVAULT_TLS_HOSTNAME support in generate_tls_certs() as DNS SAN
- Remove team_secret from operator→VM flow; VM auto-generates it
- Remove RUNEVAULT_TEAM_SECRET env var from user-facing interface
- Rewrite deployment/{aws,gcp,oci} cloud-init/startup-script files to
  use Go-native install.sh instead of Docker compose
- Add runevault_version variable to deployment/{aws,gcp,oci}/main.tf
- Remove team_secret variable and output from all three main.tf files

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
---
 deployment/aws/cloud-init.yaml   | 179 ++------------
 deployment/aws/main.tf           |  31 +--
 deployment/gcp/main.tf           |  31 +--
 deployment/gcp/startup-script.sh | 166 ++-----------
 deployment/oci/main.tf           |  31 +--
 deployment/oci/startup-script.sh | 162 ++-----------
 install.sh                       | 392 ++++++++++++++++++++++++++++++-
 7 files changed, 477 insertions(+), 515 deletions(-)

diff --git a/deployment/aws/cloud-init.yaml b/deployment/aws/cloud-init.yaml
index 170b536..90251d9 100644
--- a/deployment/aws/cloud-init.yaml
+++ b/deployment/aws/cloud-init.yaml
@@ -1,171 +1,28 @@
 #cloud-config
-
-# Rune-Vault Installation Script for AWS EC2
-# Deploys Docker-based Vault with gRPC (port 50051)
-
 package_update: true
-package_upgrade: true
-
-packages:
-  - ca-certificates
-  - curl
-  - gnupg
-  - jq
-  - openssl
+packages: [ca-certificates, curl, openssl]
 
 write_files:
-  - path: /opt/rune/docker-compose.yml
+  - path: /etc/profile.d/runevault-installer-env.sh
     content: |
-      services:
-        vault:
-          image: ghcr.io/cryptolabinc/rune-vault:latest
-          container_name: rune-vault
-          restart: unless-stopped
-          ports:
-            - "0.0.0.0:50051:50051"
-          environment:
-            - VAULT_TEAM_SECRET=${team_secret}
-            - VAULT_INDEX_NAME=${vault_index_name}
-            - ENVECTOR_ENDPOINT=${envector_endpoint}
-            - ENVECTOR_API_KEY=${envector_api_key}
-            - EMBEDDING_DIM=1024
-            - VAULT_TLS_CERT=$${VAULT_TLS_CERT:-}
-            - VAULT_TLS_KEY=$${VAULT_TLS_KEY:-}
-            - VAULT_TLS_DISABLE=$${VAULT_TLS_DISABLE:-}
-          volumes:
-            - vault-keys:/app/vault_keys:rw
-            - ./config:/app/config:rw
-            - ./certs:/app/certs:rw
-            - ./backups:/secure/backups:rw
-            - ./logs:/var/log/rune-vault:rw
-          healthcheck:
-            test: ["CMD", "curl", "-sf", "http://localhost:8081/health"]
-            interval: 30s
-            timeout: 10s
-            retries: 3
-          security_opt:
-            - no-new-privileges:true
-          deploy:
-            resources:
-              limits:
-                memory: 1G
-                cpus: "1.0"
-              reservations:
-                memory: 512M
-                cpus: "0.5"
-
-      volumes:
-        vault-keys:
-    owner: root:root
-    permissions: '0644'
-
-  - path: /opt/rune/.env
-    content: |
-      VAULT_TLS_CERT=${tls_mode == "none" ? "" : "/app/certs/server.pem"}
-      VAULT_TLS_KEY=${tls_mode == "none" ? "" : "/app/certs/server.key"}
-      VAULT_TLS_DISABLE=${tls_mode == "none" ? "true" : ""}
-    owner: root:root
+      export RUNEVAULT_TEAM_NAME='${vault_index_name}'
+      export RUNEVAULT_ENVECTOR_ENDPOINT='${envector_endpoint}'
+      export RUNEVAULT_ENVECTOR_API_KEY='${envector_api_key}'
+      export RUNEVAULT_TLS_HOSTNAME='${tls_hostname}'
     permissions: '0600'
 
 runcmd:
-  # Create Rune directory structure
-  - mkdir -p /opt/rune/certs /opt/rune/backups /opt/rune/logs /opt/rune/config
-  - chmod 700 /opt/rune/certs
-
-  # Install Docker CE with compose plugin (v2)
-  - |
-    install -m 0755 -d /etc/apt/keyrings
-    curl -fsSL https://download.docker.com/linux/ubuntu/gpg -o /etc/apt/keyrings/docker.asc
-    chmod a+r /etc/apt/keyrings/docker.asc
-    echo "deb [arch=$(dpkg --print-architecture) signed-by=/etc/apt/keyrings/docker.asc] https://download.docker.com/linux/ubuntu $(. /etc/os-release && echo $VERSION_CODENAME) stable" > /etc/apt/sources.list.d/docker.list
-    apt-get update
-    apt-get install -y docker-ce docker-ce-cli containerd.io docker-compose-plugin
-
-  # Start Docker
-  - systemctl enable docker
-  - systemctl start docker
-
-  # Add ubuntu user to docker group and set up runevault alias
-  - usermod -aG docker ubuntu
+  - exec > /var/log/runevault-install.log 2>&1
   - |
-    if ! grep -q 'alias runevault=' /home/ubuntu/.bashrc 2>/dev/null; then
-      echo "alias runevault='docker exec -it rune-vault python3 /app/vault_admin_cli.py'" >> /home/ubuntu/.bashrc
-    fi
-
-  # Generate per-user token auth config files
+      arch=$(dpkg --print-architecture); [ "$arch" = "amd64" ] && carch=amd64 || carch=arm64
+      curl -fsSL "https://github.com/sigstore/cosign/releases/latest/download/cosign-linux-$${carch}" -o /usr/local/bin/cosign
+      chmod 0755 /usr/local/bin/cosign
+  - set -a; . /etc/profile.d/runevault-installer-env.sh; set +a
   - |
-    cat > /opt/rune/config/vault-roles.yml <<'ROLES'
-    roles:
-      admin:
-        scope: [get_public_key, decrypt_scores, decrypt_metadata, manage_tokens]
-        top_k: 50
-        rate_limit: 150/60s
-      member:
-        scope: [get_public_key, decrypt_scores, decrypt_metadata]
-        top_k: 10
-        rate_limit: 30/60s
-    ROLES
-    echo "tokens: []" > /opt/rune/config/vault-tokens.yml
-    chmod 600 /opt/rune/config/vault-roles.yml /opt/rune/config/vault-tokens.yml
-
-  # TLS setup — inline cert generation (avoids GitHub rate limits)
-  - |
-    if [ "${tls_mode}" = "self-signed" ]; then
-      CERT_DIR="/opt/rune/certs"
-      PUBLIC_IP=$(curl -4 -sf --connect-timeout 5 ifconfig.me 2>/dev/null || true)
-      openssl genrsa -out "$CERT_DIR/ca.key" 4096 2>/dev/null
-      openssl req -new -x509 -key "$CERT_DIR/ca.key" -out "$CERT_DIR/ca.pem" \
-        -days 3650 -subj "/CN=Rune-Vault CA" -sha256
-      openssl genrsa -out "$CERT_DIR/server.key" 2048 2>/dev/null
-      TMPCONF=$(mktemp)
-      printf '%s\n' \
-        '[req]' \
-        'distinguished_name = req_dn' \
-        'req_extensions = v3_req' \
-        'prompt = no' \
-        '[req_dn]' \
-        'CN = localhost' \
-        '[v3_req]' \
-        'subjectAltName = @alt_names' \
-        '[alt_names]' \
-        'DNS.1 = localhost' \
-        'DNS.2 = vault' \
-        'DNS.3 = rune-vault' \
-        'IP.1  = 127.0.0.1' \
-        > "$TMPCONF"
-      TLS_HOSTNAME="${tls_hostname}"
-      if [ -n "$TLS_HOSTNAME" ]; then
-        echo "DNS.4 = $TLS_HOSTNAME" >> "$TMPCONF"
-      fi
-      if [ -n "$PUBLIC_IP" ]; then
-        echo "IP.2  = $PUBLIC_IP" >> "$TMPCONF"
-      fi
-      openssl req -new -key "$CERT_DIR/server.key" -out "$CERT_DIR/server.csr" -config "$TMPCONF"
-      openssl x509 -req -in "$CERT_DIR/server.csr" \
-        -CA "$CERT_DIR/ca.pem" -CAkey "$CERT_DIR/ca.key" -CAcreateserial \
-        -out "$CERT_DIR/server.pem" -days 825 -sha256 \
-        -extfile "$TMPCONF" -extensions v3_req 2>/dev/null
-      rm -f "$TMPCONF" "$CERT_DIR/server.csr" "$CERT_DIR/ca.srl"
-      chmod 600 "$CERT_DIR/ca.key" "$CERT_DIR/server.key"
-      chmod 644 "$CERT_DIR/ca.pem" "$CERT_DIR/server.pem"
-    fi
-
-  # Pull with retry and start Rune-Vault
-  - |
-    cd /opt/rune
-    for i in 1 2 3 4 5; do
-      docker compose pull && break
-      echo "Docker pull retry $i..." && sleep 10
-    done
-  - cd /opt/rune && docker compose up -d
-
-  # Wait for Vault to be ready
-  - sleep 10
-  - timeout 300 bash -c 'until docker exec rune-vault curl -sf http://localhost:8081/health 2>/dev/null; do sleep 2; done'
-
-final_message: |
-  Rune-Vault installation completed!
-
-  Vault gRPC endpoint: <public-ip>:50051
-  Health check: docker exec rune-vault curl -sf http://localhost:8081/health
-  Docker logs: docker logs rune-vault
+      INSTALL_URL="https://raw.githubusercontent.com/CryptoLabInc/rune-admin/${runevault_version}/install.sh"
+      for i in 1 2 3 4 5; do
+        curl -fsSL --retry 5 --retry-delay 10 --connect-timeout 15 "$${INSTALL_URL}" -o /tmp/install.sh && break
+        sleep $((i*10))
+      done
+      bash /tmp/install.sh --target local --non-interactive --version "${runevault_version}"
+  - rm -f /etc/profile.d/runevault-installer-env.sh
diff --git a/deployment/aws/main.tf b/deployment/aws/main.tf
index 108d44b..95b3d9d 100644
--- a/deployment/aws/main.tf
+++ b/deployment/aws/main.tf
@@ -26,12 +26,6 @@ variable "team_name" {
   default     = "default"
 }
 
-variable "team_secret" {
-  description = "Team secret for DEK derivation. Generated by install.sh."
-  type        = string
-  sensitive   = true
-}
-
 variable "tls_mode" {
   description = "TLS mode: self-signed or none"
   type        = string
@@ -67,6 +61,11 @@ variable "instance_type" {
   default     = "t3.medium"  # 2 vCPU, 4GB RAM
 }
 
+variable "runevault_version" {
+  description = "Pinned runevault release tag — drives the install.sh URL and binary version on the VM."
+  type        = string
+}
+
 variable "public_key" {
   description = "SSH public key content for EC2 access"
   type        = string
@@ -209,13 +208,13 @@ resource "aws_instance" "vault" {
   key_name               = var.public_key != "" ? aws_key_pair.vault_key[0].key_name : null
 
   user_data = templatefile("${path.module}/cloud-init.yaml", {
-    team_secret       = var.team_secret
-    team_name         = var.team_name
-    tls_mode          = var.tls_mode
-    tls_hostname      = var.tls_hostname
-    envector_endpoint = var.envector_endpoint
-    envector_api_key  = var.envector_api_key
-    vault_index_name  = var.vault_index_name
+    team_name          = var.team_name
+    tls_mode           = var.tls_mode
+    tls_hostname       = var.tls_hostname
+    envector_endpoint  = var.envector_endpoint
+    envector_api_key   = var.envector_api_key
+    vault_index_name   = var.vault_index_name
+    runevault_version  = var.runevault_version
   })
 
   root_block_device {
@@ -255,12 +254,6 @@ output "vault_url" {
   value       = "${aws_eip.vault_eip.public_ip}:50051"
 }
 
-output "team_secret" {
-  description = "Team secret for DEK derivation"
-  value       = var.team_secret
-  sensitive   = true
-}
-
 output "vault_public_ip" {
   description = "Public IP address"
   value       = aws_eip.vault_eip.public_ip
diff --git a/deployment/gcp/main.tf b/deployment/gcp/main.tf
index bb4d206..694be53 100644
--- a/deployment/gcp/main.tf
+++ b/deployment/gcp/main.tf
@@ -37,12 +37,6 @@ variable "team_name" {
   type        = string
 }
 
-variable "team_secret" {
-  description = "Team secret for DEK derivation. Generated by install.sh."
-  type        = string
-  sensitive   = true
-}
-
 locals {
   zone = var.zone != "" ? var.zone : "${var.region}-a"
 }
@@ -82,6 +76,11 @@ variable "machine_type" {
   default     = "e2-medium"  # 2 vCPU, 4GB RAM
 }
 
+variable "runevault_version" {
+  description = "Pinned runevault release tag — drives the install.sh URL and binary version on the VM."
+  type        = string
+}
+
 variable "public_key" {
   description = "SSH public key content for instance access"
   type        = string
@@ -164,13 +163,13 @@ resource "google_compute_instance" "vault" {
   }
 
   metadata_startup_script = templatefile("${path.module}/startup-script.sh", {
-    team_secret       = var.team_secret
-    team_name         = var.team_name
-    tls_mode          = var.tls_mode
-    tls_hostname      = var.tls_hostname
-    envector_endpoint = var.envector_endpoint
-    envector_api_key  = var.envector_api_key
-    vault_index_name  = var.vault_index_name
+    team_name          = var.team_name
+    tls_mode           = var.tls_mode
+    tls_hostname       = var.tls_hostname
+    envector_endpoint  = var.envector_endpoint
+    envector_api_key   = var.envector_api_key
+    vault_index_name   = var.vault_index_name
+    runevault_version  = var.runevault_version
   })
 
   service_account {
@@ -193,12 +192,6 @@ output "vault_url" {
   value       = "${google_compute_address.vault_ip.address}:50051"
 }
 
-output "team_secret" {
-  description = "Team secret for DEK derivation"
-  value       = var.team_secret
-  sensitive   = true
-}
-
 output "vault_public_ip" {
   description = "Public IP address"
   value       = google_compute_address.vault_ip.address
diff --git a/deployment/gcp/startup-script.sh b/deployment/gcp/startup-script.sh
index 20829c7..658cd20 100644
--- a/deployment/gcp/startup-script.sh
+++ b/deployment/gcp/startup-script.sh
@@ -1,155 +1,33 @@
 #!/bin/bash
 set -euo pipefail
+exec > /var/log/runevault-install.log 2>&1
+echo "=== runevault startup at $(date) ==="
 
-# Rune-Vault Startup Script for GCP Compute Engine
-# Deploys Docker-based Vault with gRPC (port 50051)
-
-exec > /var/log/rune-vault-startup.log 2>&1
-echo "=== Rune-Vault startup script began at $(date) ==="
-
-# Install packages
-apt-get update
-apt-get install -y ca-certificates curl gnupg jq openssl
-
-# Create Rune directory structure
-mkdir -p /opt/rune/certs /opt/rune/backups /opt/rune/logs /opt/rune/config
-chmod 700 /opt/rune/certs
-
-# Write docker-compose.yml
-cat > /opt/rune/docker-compose.yml <<'COMPOSE'
-services:
-  vault:
-    image: ghcr.io/cryptolabinc/rune-vault:latest
-    container_name: rune-vault
-    restart: unless-stopped
-    ports:
-      - "0.0.0.0:50051:50051"
-    env_file:
-      - .env
-    environment:
-      - VAULT_TEAM_SECRET=${team_secret}
-      - VAULT_INDEX_NAME=${vault_index_name}
-      - ENVECTOR_ENDPOINT=${envector_endpoint}
-      - ENVECTOR_API_KEY=${envector_api_key}
-      - EMBEDDING_DIM=1024
-    volumes:
-      - vault-keys:/app/vault_keys:rw
-      - ./config:/app/config:rw
-      - ./certs:/app/certs:rw
-      - ./backups:/secure/backups:rw
-      - ./logs:/var/log/rune-vault:rw
-    healthcheck:
-      test: ["CMD", "curl", "-sf", "http://localhost:8081/health"]
-      interval: 30s
-      timeout: 10s
-      retries: 3
-    security_opt:
-      - no-new-privileges:true
-    deploy:
-      resources:
-        limits:
-          memory: 1G
-          cpus: "1.0"
-        reservations:
-          memory: 512M
-          cpus: "0.5"
+for i in $(seq 1 30); do
+  apt-get update -q && apt-get install -y ca-certificates curl openssl && break
+  echo "apt retry $i..." && sleep 10
+done
 
-volumes:
-  vault-keys:
-COMPOSE
+arch=$(dpkg --print-architecture); [ "$arch" = "amd64" ] && carch=amd64 || carch=arm64
+curl -fsSL "https://github.com/sigstore/cosign/releases/latest/download/cosign-linux-$${carch}" -o /usr/local/bin/cosign
+chmod 0755 /usr/local/bin/cosign
 
-# Write .env file
-cat > /opt/rune/.env <<'ENVFILE'
-VAULT_TLS_CERT=${tls_mode == "none" ? "" : "/app/certs/server.pem"}
-VAULT_TLS_KEY=${tls_mode == "none" ? "" : "/app/certs/server.key"}
-VAULT_TLS_DISABLE=${tls_mode == "none" ? "true" : ""}
+cat > /etc/profile.d/runevault-installer-env.sh <<'ENVFILE'
+export RUNEVAULT_TEAM_NAME='${vault_index_name}'
+export RUNEVAULT_ENVECTOR_ENDPOINT='${envector_endpoint}'
+export RUNEVAULT_ENVECTOR_API_KEY='${envector_api_key}'
+export RUNEVAULT_TLS_HOSTNAME='${tls_hostname}'
 ENVFILE
-chmod 600 /opt/rune/.env
-
-# Install Docker CE with compose plugin (v2)
-install -m 0755 -d /etc/apt/keyrings
-curl -fsSL https://download.docker.com/linux/ubuntu/gpg -o /etc/apt/keyrings/docker.asc
-chmod a+r /etc/apt/keyrings/docker.asc
-echo "deb [arch=$(dpkg --print-architecture) signed-by=/etc/apt/keyrings/docker.asc] https://download.docker.com/linux/ubuntu $(. /etc/os-release && echo "$VERSION_CODENAME") stable" > /etc/apt/sources.list.d/docker.list
-apt-get update
-apt-get install -y docker-ce docker-ce-cli containerd.io docker-compose-plugin
-
-# Start Docker
-systemctl enable docker
-systemctl start docker
-
-# Generate per-user token auth config files
-cat > /opt/rune/config/vault-roles.yml <<'ROLES'
-roles:
-  admin:
-    scope: [get_public_key, decrypt_scores, decrypt_metadata, manage_tokens]
-    top_k: 50
-    rate_limit: 150/60s
-  member:
-    scope: [get_public_key, decrypt_scores, decrypt_metadata]
-    top_k: 10
-    rate_limit: 30/60s
-ROLES
-echo "tokens: []" > /opt/rune/config/vault-tokens.yml
-chmod 600 /opt/rune/config/vault-roles.yml /opt/rune/config/vault-tokens.yml
-
-# Set up runevault CLI alias for ubuntu user
-if ! grep -q 'alias runevault=' /home/ubuntu/.bashrc 2>/dev/null; then
-  echo "alias runevault='docker exec -it rune-vault python3 /app/vault_admin_cli.py'" >> /home/ubuntu/.bashrc
-fi
-usermod -aG docker ubuntu 2>/dev/null || true
-
-# TLS setup
-if [ "${tls_mode}" = "self-signed" ]; then
-  CERT_DIR="/opt/rune/certs"
-  PUBLIC_IP=$(curl -4 -sf --connect-timeout 5 ifconfig.me 2>/dev/null || true)
-  openssl genrsa -out "$CERT_DIR/ca.key" 4096 2>/dev/null
-  openssl req -new -x509 -key "$CERT_DIR/ca.key" -out "$CERT_DIR/ca.pem" \
-    -days 3650 -subj "/CN=Rune-Vault CA" -sha256
-  openssl genrsa -out "$CERT_DIR/server.key" 2048 2>/dev/null
-  TMPCONF=$(mktemp)
-  printf '%s\n' \
-    '[req]' \
-    'distinguished_name = req_dn' \
-    'req_extensions = v3_req' \
-    'prompt = no' \
-    '[req_dn]' \
-    'CN = localhost' \
-    '[v3_req]' \
-    'subjectAltName = @alt_names' \
-    '[alt_names]' \
-    'DNS.1 = localhost' \
-    'DNS.2 = vault' \
-    'DNS.3 = rune-vault' \
-    'IP.1  = 127.0.0.1' \
-    > "$TMPCONF"
-  TLS_HOSTNAME="${tls_hostname}"
-  if [ -n "$TLS_HOSTNAME" ]; then
-    echo "DNS.4 = $TLS_HOSTNAME" >> "$TMPCONF"
-  fi
-  if [ -n "$PUBLIC_IP" ]; then
-    echo "IP.2  = $PUBLIC_IP" >> "$TMPCONF"
-  fi
-  openssl req -new -key "$CERT_DIR/server.key" -out "$CERT_DIR/server.csr" -config "$TMPCONF"
-  openssl x509 -req -in "$CERT_DIR/server.csr" \
-    -CA "$CERT_DIR/ca.pem" -CAkey "$CERT_DIR/ca.key" -CAcreateserial \
-    -out "$CERT_DIR/server.pem" -days 825 -sha256 \
-    -extfile "$TMPCONF" -extensions v3_req 2>/dev/null
-  rm -f "$TMPCONF" "$CERT_DIR/server.csr" "$CERT_DIR/ca.srl"
-  chmod 600 "$CERT_DIR/ca.key" "$CERT_DIR/server.key"
-  chmod 644 "$CERT_DIR/ca.pem" "$CERT_DIR/server.pem"
-fi
+chmod 600 /etc/profile.d/runevault-installer-env.sh
+set -a; . /etc/profile.d/runevault-installer-env.sh; set +a
 
-# Pull with retry and start Rune-Vault
-cd /opt/rune
+INSTALL_URL="https://raw.githubusercontent.com/CryptoLabInc/rune-admin/${runevault_version}/install.sh"
 for i in 1 2 3 4 5; do
-  docker compose pull && break
-  echo "Docker pull retry $i..." && sleep 10
+  curl -fsSL --retry 5 --retry-delay 10 --connect-timeout 15 "$${INSTALL_URL}" -o /tmp/install.sh && break
+  sleep $((i*10))
 done
-docker compose up -d
 
-# Wait for Vault to be ready
-sleep 10
-timeout 300 bash -c 'until docker exec rune-vault curl -sf http://localhost:8081/health 2>/dev/null; do sleep 2; done'
+bash /tmp/install.sh --target local --non-interactive --version "${runevault_version}"
 
-echo "=== Rune-Vault startup script completed at $(date) ==="
+rm -f /etc/profile.d/runevault-installer-env.sh
+echo "=== completed at $(date) ==="
diff --git a/deployment/oci/main.tf b/deployment/oci/main.tf
index e0f9e70..61b8b33 100644
--- a/deployment/oci/main.tf
+++ b/deployment/oci/main.tf
@@ -37,12 +37,6 @@ variable "team_name" {
   type        = string
 }
 
-variable "team_secret" {
-  description = "Team secret for DEK derivation. Generated by install.sh."
-  type        = string
-  sensitive   = true
-}
-
 variable "tls_mode" {
   description = "TLS mode: self-signed, custom, or none"
   type        = string
@@ -72,6 +66,11 @@ variable "vault_index_name" {
   default     = "runecontext"
 }
 
+variable "runevault_version" {
+  description = "Pinned runevault release tag — drives the install.sh URL and binary version on the VM."
+  type        = string
+}
+
 variable "public_key" {
   description = "SSH public key content for instance access"
   type        = string
@@ -176,13 +175,13 @@ resource "oci_core_instance" "vault_instance" {
   metadata = {
     ssh_authorized_keys = var.public_key
     user_data = base64encode(templatefile("${path.module}/startup-script.sh", {
-      team_secret       = var.team_secret
-      team_name         = var.team_name
-      tls_mode          = var.tls_mode
-      tls_hostname      = var.tls_hostname
-      envector_endpoint = var.envector_endpoint
-      envector_api_key  = var.envector_api_key
-      vault_index_name  = var.vault_index_name
+      team_name          = var.team_name
+      tls_mode           = var.tls_mode
+      tls_hostname       = var.tls_hostname
+      envector_endpoint  = var.envector_endpoint
+      envector_api_key   = var.envector_api_key
+      vault_index_name   = var.vault_index_name
+      runevault_version  = var.runevault_version
     }))
   }
 }
@@ -211,12 +210,6 @@ output "vault_url" {
   value       = "${oci_core_instance.vault_instance.public_ip}:50051"
 }
 
-output "team_secret" {
-  value       = var.team_secret
-  description = "Team secret for DEK derivation"
-  sensitive   = true
-}
-
 output "vault_public_ip" {
   value       = oci_core_instance.vault_instance.public_ip
   description = "Public IP of Vault instance"
diff --git a/deployment/oci/startup-script.sh b/deployment/oci/startup-script.sh
index 69b27a1..3bdaf3e 100644
--- a/deployment/oci/startup-script.sh
+++ b/deployment/oci/startup-script.sh
@@ -1,160 +1,36 @@
 #!/bin/bash
 set -euo pipefail
+exec > /var/log/runevault-install.log 2>&1
+echo "=== runevault startup at $(date) ==="
 
-# Rune-Vault Startup Script for OCI Compute
-# Deploys Docker-based Vault with gRPC (port 50051)
-
-exec > /var/log/rune-vault-startup.log 2>&1
-echo "=== Rune-Vault startup script began at $(date) ==="
-
-# Install packages (retry on lock or transient mirror errors)
 for i in $(seq 1 30); do
   apt-get update -q \
     && apt-get -y --fix-broken install \
-    && apt-get install -y ca-certificates curl gnupg jq openssl \
+    && apt-get install -y ca-certificates curl openssl \
     && break
   echo "apt retry $i..." && sleep 10
 done
 
-# Create Rune directory structure
-mkdir -p /opt/rune/certs /opt/rune/backups /opt/rune/logs /opt/rune/config
-chmod 755 /opt/rune/certs
-
-# Write docker-compose.yml
-cat > /opt/rune/docker-compose.yml <<'COMPOSE'
-services:
-  vault:
-    image: ghcr.io/cryptolabinc/rune-vault:latest
-    container_name: rune-vault
-    restart: unless-stopped
-    ports:
-      - "0.0.0.0:50051:50051"
-    env_file:
-      - .env
-    environment:
-      - VAULT_TEAM_SECRET=${team_secret}
-      - VAULT_INDEX_NAME=${vault_index_name}
-      - ENVECTOR_ENDPOINT=${envector_endpoint}
-      - ENVECTOR_API_KEY=${envector_api_key}
-      - EMBEDDING_DIM=1024
-    volumes:
-      - vault-keys:/app/vault_keys:rw
-      - ./config:/app/config:rw
-      - ./certs:/app/certs:rw
-      - ./backups:/secure/backups:rw
-      - ./logs:/var/log/rune-vault:rw
-    healthcheck:
-      test: ["CMD", "curl", "-sf", "http://localhost:8081/health"]
-      interval: 30s
-      timeout: 10s
-      retries: 3
-    security_opt:
-      - no-new-privileges:true
-    deploy:
-      resources:
-        limits:
-          memory: 1G
-          cpus: "1.0"
-        reservations:
-          memory: 512M
-          cpus: "0.5"
+arch=$(dpkg --print-architecture); [ "$arch" = "amd64" ] && carch=amd64 || carch=arm64
+curl -fsSL "https://github.com/sigstore/cosign/releases/latest/download/cosign-linux-$${carch}" -o /usr/local/bin/cosign
+chmod 0755 /usr/local/bin/cosign
 
-volumes:
-  vault-keys:
-COMPOSE
-
-# Write .env file
-cat > /opt/rune/.env <<'ENVFILE'
-VAULT_TLS_CERT=${tls_mode == "none" ? "" : "/app/certs/server.pem"}
-VAULT_TLS_KEY=${tls_mode == "none" ? "" : "/app/certs/server.key"}
-VAULT_TLS_DISABLE=${tls_mode == "none" ? "true" : ""}
+cat > /etc/profile.d/runevault-installer-env.sh <<'ENVFILE'
+export RUNEVAULT_TEAM_NAME='${vault_index_name}'
+export RUNEVAULT_ENVECTOR_ENDPOINT='${envector_endpoint}'
+export RUNEVAULT_ENVECTOR_API_KEY='${envector_api_key}'
+export RUNEVAULT_TLS_HOSTNAME='${tls_hostname}'
 ENVFILE
-chmod 600 /opt/rune/.env
-
-# Install Docker CE with compose plugin (v2)
-install -m 0755 -d /etc/apt/keyrings
-curl -fsSL https://download.docker.com/linux/ubuntu/gpg -o /etc/apt/keyrings/docker.asc
-chmod a+r /etc/apt/keyrings/docker.asc
-echo "deb [arch=$(dpkg --print-architecture) signed-by=/etc/apt/keyrings/docker.asc] https://download.docker.com/linux/ubuntu $(. /etc/os-release && echo "$VERSION_CODENAME") stable" > /etc/apt/sources.list.d/docker.list
-apt-get update
-apt-get install -y docker-ce docker-ce-cli containerd.io docker-compose-plugin
-
-# Start Docker
-systemctl enable docker
-systemctl start docker
-
-# Generate per-user token auth config files
-cat > /opt/rune/config/vault-roles.yml <<'ROLES'
-roles:
-  admin:
-    scope: [get_public_key, decrypt_scores, decrypt_metadata, manage_tokens]
-    top_k: 50
-    rate_limit: 150/60s
-  member:
-    scope: [get_public_key, decrypt_scores, decrypt_metadata]
-    top_k: 10
-    rate_limit: 30/60s
-ROLES
-echo "tokens: []" > /opt/rune/config/vault-tokens.yml
-chmod 600 /opt/rune/config/vault-roles.yml /opt/rune/config/vault-tokens.yml
-
-# Set up runevault CLI alias for ubuntu user
-if ! grep -q 'alias runevault=' /home/ubuntu/.bashrc 2>/dev/null; then
-  echo "alias runevault='docker exec -it rune-vault python3 /app/vault_admin_cli.py'" >> /home/ubuntu/.bashrc
-fi
-usermod -aG docker ubuntu 2>/dev/null || true
-
-# TLS setup
-if [ "${tls_mode}" = "self-signed" ]; then
-  CERT_DIR="/opt/rune/certs"
-  PUBLIC_IP=$(curl -4 -sf --connect-timeout 5 ifconfig.me 2>/dev/null || true)
-  openssl genrsa -out "$CERT_DIR/ca.key" 4096 2>/dev/null
-  openssl req -new -x509 -key "$CERT_DIR/ca.key" -out "$CERT_DIR/ca.pem" \
-    -days 3650 -subj "/CN=Rune-Vault CA" -sha256
-  openssl genrsa -out "$CERT_DIR/server.key" 2048 2>/dev/null
-  TMPCONF=$(mktemp)
-  printf '%s\n' \
-    '[req]' \
-    'distinguished_name = req_dn' \
-    'req_extensions = v3_req' \
-    'prompt = no' \
-    '[req_dn]' \
-    'CN = localhost' \
-    '[v3_req]' \
-    'subjectAltName = @alt_names' \
-    '[alt_names]' \
-    'DNS.1 = localhost' \
-    'DNS.2 = vault' \
-    'DNS.3 = rune-vault' \
-    'IP.1  = 127.0.0.1' \
-    > "$TMPCONF"
-  TLS_HOSTNAME="${tls_hostname}"
-  if [ -n "$TLS_HOSTNAME" ]; then
-    echo "DNS.4 = $TLS_HOSTNAME" >> "$TMPCONF"
-  fi
-  if [ -n "$PUBLIC_IP" ]; then
-    echo "IP.2  = $PUBLIC_IP" >> "$TMPCONF"
-  fi
-  openssl req -new -key "$CERT_DIR/server.key" -out "$CERT_DIR/server.csr" -config "$TMPCONF"
-  openssl x509 -req -in "$CERT_DIR/server.csr" \
-    -CA "$CERT_DIR/ca.pem" -CAkey "$CERT_DIR/ca.key" -CAcreateserial \
-    -out "$CERT_DIR/server.pem" -days 825 -sha256 \
-    -extfile "$TMPCONF" -extensions v3_req 2>/dev/null
-  rm -f "$TMPCONF" "$CERT_DIR/server.csr" "$CERT_DIR/ca.srl"
-  chmod 600 "$CERT_DIR/ca.key" "$CERT_DIR/server.key"
-  chmod 644 "$CERT_DIR/ca.pem" "$CERT_DIR/server.pem"
-fi
+chmod 600 /etc/profile.d/runevault-installer-env.sh
+set -a; . /etc/profile.d/runevault-installer-env.sh; set +a
 
-# Pull with retry and start Rune-Vault
-cd /opt/rune
+INSTALL_URL="https://raw.githubusercontent.com/CryptoLabInc/rune-admin/${runevault_version}/install.sh"
 for i in 1 2 3 4 5; do
-  docker compose pull && break
-  echo "Docker pull retry $i..." && sleep 10
+  curl -fsSL --retry 5 --retry-delay 10 --connect-timeout 15 "$${INSTALL_URL}" -o /tmp/install.sh && break
+  sleep $((i*10))
 done
-docker compose up -d
 
-# Wait for Vault to be ready
-sleep 10
-timeout 300 bash -c 'until docker exec rune-vault curl -sf http://localhost:8081/health 2>/dev/null; do sleep 2; done'
+bash /tmp/install.sh --target local --non-interactive --version "${runevault_version}"
 
-echo "=== Rune-Vault startup script completed at $(date) ==="
+rm -f /etc/profile.d/runevault-installer-env.sh
+echo "=== completed at $(date) ==="
diff --git a/install.sh b/install.sh
index 8f6288b..5a58e11 100755
--- a/install.sh
+++ b/install.sh
@@ -9,19 +9,33 @@
 #   sudo bash install.sh [options]
 #
 # Options:
-#   --version <tag>      Install a specific release tag (default: latest)
-#   --force              Overwrite existing config and TLS certificates
-#   --non-interactive    Skip all prompts; supply secrets via env vars
-#   --uninstall          Stop the service, remove files, optionally delete data
+#   --version <tag>               Install a specific release tag (default: latest)
+#   --target <local|aws|gcp|oci>  Deploy locally or to a cloud provider (default: local)
+#   --install-dir <path>          CSP install directory (default: $HOME/rune-vault-<csp>)
+#   --force                       Overwrite existing config and TLS certificates
+#   --non-interactive             Skip all prompts; supply secrets via env vars
+#   --uninstall                   Stop the service, remove files, optionally delete data
 #
-# Non-interactive env vars:
+# Non-interactive env vars (local install):
 #   RUNEVAULT_TEAM_NAME              keys.index_name (required)
 #   RUNEVAULT_ENVECTOR_ENDPOINT      envector.endpoint (required)
 #   RUNEVAULT_ENVECTOR_API_KEY       envector.api_key
 #   RUNEVAULT_ENVECTOR_API_KEY_FILE  envector.api_key_file (alternative)
-#   RUNEVAULT_TEAM_SECRET            tokens.team_secret (auto-generated if unset)
 #   RUNEVAULT_TLS_CERT_PATH          Path to existing TLS cert (skips auto-gen)
 #   RUNEVAULT_TLS_KEY_PATH           Path to existing TLS key  (skips auto-gen)
+#   RUNEVAULT_TLS_HOSTNAME           Additional DNS SAN for auto-generated TLS cert
+#
+# Non-interactive env vars (CSP install — operator workstation):
+#   RUNEVAULT_ENVECTOR_ENDPOINT      enVector endpoint URL (required)
+#   RUNEVAULT_ENVECTOR_API_KEY       enVector API key (required)
+#   RUNEVAULT_TEAM_NAME              Vault index name (required)
+#   RUNEVAULT_TLS_HOSTNAME           Domain name for TLS SAN on VM cert (optional)
+#   RUNEVAULT_TARGET                 Pre-select target without interactive menu
+#   RUNEVAULT_INSTALL_DIR            Pre-set CSP install directory
+#   RUNEVAULT_CSP_TEAM_NAME          Team name for cloud resource naming
+#   RUNEVAULT_CSP_REGION             Cloud region
+#   RUNEVAULT_GCP_PROJECT_ID         GCP: project ID (required for GCP)
+#   RUNEVAULT_OCI_COMPARTMENT_ID     OCI: compartment OCID (required for OCI)
 #
 # Dev/testing env vars (set by scripts/install-dev.sh):
 #   RUNEVAULT_LOCAL_BINARY    Path to local binary; skips download + verification
@@ -39,6 +53,9 @@ CERT_REGEXP="^https://github.com/CryptoLabInc/rune-admin/.github/workflows/relea
 SERVICE_USER=runevault
 GRPC_PORT=50051
 
+RAW_BASE="https://raw.githubusercontent.com/${REPO}"
+DEFAULT_INSTALL_DIR_CSP_FMT="%s/rune-vault-%s"
+
 # Overridable by env (used by scripts/install-dev.sh)
 INSTALL_PREFIX="${RUNEVAULT_INSTALL_PREFIX:-/opt/runevault}"
 BINARY_DEST="${RUNEVAULT_BINARY_PATH:-/usr/local/bin/runevault}"
@@ -46,6 +63,10 @@ SKIP_VERIFY="${RUNEVAULT_SKIP_VERIFY:-0}"
 LOCAL_BINARY="${RUNEVAULT_LOCAL_BINARY:-}"
 SKIP_SERVICE="${RUNEVAULT_SKIP_SERVICE:-0}"
 
+TARGET="${RUNEVAULT_TARGET:-}"
+INSTALL_DIR_CSP="${RUNEVAULT_INSTALL_DIR:-}"
+CSP_PUBLIC_IP=""
+
 # ── Color helpers ──────────────────────────────────────────────────────────────
 if [[ -t 1 ]]; then
   _RED='\033[0;31m' _GRN='\033[0;32m' _BLU='\033[0;34m' _YLW='\033[0;33m' _RST='\033[0m'
@@ -69,6 +90,8 @@ while [[ $# -gt 0 ]]; do
     --uninstall)       UNINSTALL=1; shift ;;
     --force)           FORCE=1; shift ;;
     --non-interactive) NON_INTERACTIVE=1; shift ;;
+    --target)         TARGET="$2"; shift 2 ;;
+    --install-dir)    INSTALL_DIR_CSP="$2"; shift 2 ;;
     *) die "Unknown flag: $1" ;;
   esac
 done
@@ -160,6 +183,355 @@ run_uninstall() {
   success "Rune-Vault uninstalled."
 }
 
+# ── CSP helpers ───────────────────────────────────────────────────────────────
+
+_prompt() {
+  local varname=$1 label=$2 default=${3:-}
+  [[ -n "${!varname:-}" ]] && return 0
+  local val
+  if [[ -n "$default" ]]; then
+    read -r -p "${label} [${default}]: " val
+    printf -v "$varname" '%s' "${val:-$default}"
+  else
+    read -r -p "${label}: " val
+    printf -v "$varname" '%s' "$val"
+  fi
+}
+
+resolve_target() {
+  if [[ -n "${TARGET:-}" ]]; then
+    case "$TARGET" in
+      local|aws|gcp|oci) ;;
+      *) die "Invalid --target value: ${TARGET}. Valid: local, aws, gcp, oci." ;;
+    esac
+    return 0
+  fi
+  if [[ "$NON_INTERACTIVE" -eq 0 && -t 0 ]]; then
+    printf '\n'
+    printf '  Select installation target:\n'
+    printf '    1) Local (this machine)\n'
+    printf '    2) AWS\n'
+    printf '    3) GCP\n'
+    printf '    4) OCI\n'
+    printf '\n'
+    local choice
+    read -r -p "  Choice [1]: " choice
+    case "${choice:-1}" in
+      1|local) TARGET=local ;;
+      2|aws)   TARGET=aws ;;
+      3|gcp)   TARGET=gcp ;;
+      4|oci)   TARGET=oci ;;
+      *) die "Invalid choice: ${choice}" ;;
+    esac
+  else
+    TARGET=local
+  fi
+}
+
+csp_preflight() {
+  local csp=$1
+  info "Running CSP preflight checks for ${csp}..."
+
+  local missing=0
+  for tool in terraform ssh-keygen scp curl; do
+    command -v "$tool" >/dev/null 2>&1 || { warn "'${tool}' not found."; missing=1; }
+  done
+
+  local csp_cli
+  case "$csp" in
+    aws) csp_cli=aws ;;
+    gcp) csp_cli=gcloud ;;
+    oci) csp_cli=oci ;;
+  esac
+  command -v "$csp_cli" >/dev/null 2>&1 \
+    || { warn "CSP CLI '${csp_cli}' not found. Install and configure credentials."; missing=1; }
+
+  if [[ "$missing" -eq 1 ]]; then
+    die "Missing prerequisites above. Install them and re-run."
+  fi
+
+  success "CSP preflight passed."
+}
+
+csp_prompt_config() {
+  local csp=$1
+
+  if [[ "$NON_INTERACTIVE" -eq 0 ]]; then
+    printf '\n'
+    printf '══════════════════════════════════════════════════════════\n'
+    printf '  Cloud deployment configuration\n'
+    printf '══════════════════════════════════════════════════════════\n'
+    printf '\n'
+    printf '  Create your enVector cluster at https://envector.io\n'
+    printf '  before proceeding. You will need the endpoint URL and\n'
+    printf '  API key from the dashboard.\n'
+    printf '\n'
+
+    _prompt ENVECTOR_ENDPOINT  "enVector endpoint"         ""
+    _prompt ENVECTOR_API_KEY   "enVector API key"           ""
+    _prompt VAULT_INDEX_NAME   "Vault index name"           "runecontext"
+    _prompt TEAM_NAME          "Team name (resource naming)" "default"
+    _prompt TLS_HOSTNAME       "TLS hostname / domain SAN (optional, Enter to skip)" ""
+
+    case "$csp" in
+      aws) _prompt CSP_REGION "AWS region"   "us-east-1"   ;;
+      gcp)
+        _prompt CSP_REGION    "GCP region"   "us-central1"
+        _prompt GCP_PROJECT_ID "GCP project ID" ""
+        ;;
+      oci)
+        _prompt CSP_REGION      "OCI region"          "us-ashburn-1"
+        _prompt OCI_COMPARTMENT_ID "OCI compartment OCID" ""
+        ;;
+    esac
+    printf '\n'
+  else
+    ENVECTOR_ENDPOINT="${RUNEVAULT_ENVECTOR_ENDPOINT:-}"
+    ENVECTOR_API_KEY="${RUNEVAULT_ENVECTOR_API_KEY:-}"
+    VAULT_INDEX_NAME="${RUNEVAULT_TEAM_NAME:-}"
+    TEAM_NAME="${RUNEVAULT_CSP_TEAM_NAME:-default}"
+    TLS_HOSTNAME="${RUNEVAULT_TLS_HOSTNAME:-}"
+    CSP_REGION="${RUNEVAULT_CSP_REGION:-}"
+    GCP_PROJECT_ID="${RUNEVAULT_GCP_PROJECT_ID:-}"
+    OCI_COMPARTMENT_ID="${RUNEVAULT_OCI_COMPARTMENT_ID:-}"
+
+    local missing=()
+    [[ -z "$ENVECTOR_ENDPOINT" ]] && missing+=("RUNEVAULT_ENVECTOR_ENDPOINT")
+    [[ -z "$ENVECTOR_API_KEY" ]]  && missing+=("RUNEVAULT_ENVECTOR_API_KEY")
+    [[ -z "$VAULT_INDEX_NAME" ]]  && missing+=("RUNEVAULT_TEAM_NAME")
+    [[ "$csp" = gcp && -z "$GCP_PROJECT_ID" ]]      && missing+=("RUNEVAULT_GCP_PROJECT_ID")
+    [[ "$csp" = oci && -z "$OCI_COMPARTMENT_ID" ]]  && missing+=("RUNEVAULT_OCI_COMPARTMENT_ID")
+    if [[ ${#missing[@]} -gt 0 ]]; then
+      printf 'ERROR: Missing required env vars:\n' >&2
+      for v in "${missing[@]}"; do printf '  %s\n' "$v" >&2; done
+      exit 1
+    fi
+  fi
+
+  [[ -n "$ENVECTOR_ENDPOINT" ]]  || die "enVector endpoint is required."
+  [[ -n "$ENVECTOR_API_KEY" ]]   || die "enVector API key is required."
+  [[ -n "$VAULT_INDEX_NAME" ]]   || die "Vault index name is required."
+  [[ "$csp" = gcp ]] && { [[ -n "$GCP_PROJECT_ID" ]]     || die "GCP project ID is required."; }
+  [[ "$csp" = oci ]] && { [[ -n "$OCI_COMPARTMENT_ID" ]] || die "OCI compartment OCID is required."; }
+
+}
+
+csp_generate_ssh_key() {
+  local key_path="${INSTALL_DIR_CSP}/ssh_key"
+  if [[ -f "$key_path" ]]; then
+    info "SSH key already exists: ${key_path}"
+    return 0
+  fi
+  ssh-keygen -t ed25519 -N '' -f "$key_path" -q
+  chmod 0600 "$key_path"
+  chmod 0644 "${key_path}.pub"
+  [[ -n "${SUDO_USER:-}" ]] \
+    && chown "${SUDO_USER}" "$key_path" "${key_path}.pub"
+  success "SSH key generated: ${key_path}"
+}
+
+_curl_retry_csp() {
+  local url=$1 dest=$2 i
+  for i in 1 2 3; do
+    curl -fsSL --connect-timeout 15 -o "$dest" "$url" && return 0
+    warn "Download attempt ${i} failed for $(basename "$url"). Retrying..."
+    sleep 5
+  done
+  die "Failed to download: ${url}"
+}
+
+csp_copy_terraform_files() {
+  local csp=$1
+  local script_dir
+  script_dir="$(cd "$(dirname "$0")" && pwd)"
+  local tf_src="${script_dir}/deployment/${csp}"
+  local tf_dest="${INSTALL_DIR_CSP}/deployment"
+  mkdir -p "$tf_dest"
+
+  local files
+  case "$csp" in
+    aws) files=(main.tf cloud-init.yaml) ;;
+    *)   files=(main.tf startup-script.sh) ;;
+  esac
+
+  for f in "${files[@]}"; do
+    if [[ -f "${tf_src}/${f}" ]]; then
+      cp "${tf_src}/${f}" "${tf_dest}/${f}"
+    else
+      info "Downloading ${f} from GitHub..."
+      _curl_retry_csp "${RAW_BASE}/${VERSION}/deployment/${csp}/${f}" "${tf_dest}/${f}"
+    fi
+  done
+
+  printf '*.tfvars\nterraform.tfstate*\n.terraform/\n' > "${INSTALL_DIR_CSP}/.gitignore"
+  [[ -n "${SUDO_USER:-}" ]] && chown -R "${SUDO_USER}" "$tf_dest" "${INSTALL_DIR_CSP}/.gitignore"
+  success "Terraform files ready: ${tf_dest}"
+}
+
+escape_tf() { printf '%s' "$1" | sed 's/\\/\\\\/g; s/"/\\"/g'; }
+
+csp_render_tfvars() {
+  local csp=$1
+  local tf_dir="${INSTALL_DIR_CSP}/deployment"
+  local tfvars="${tf_dir}/terraform.tfvars"
+  local public_key=""
+
+  if [[ -f "${tf_dir}/terraform.tfstate" ]]; then
+    if [[ "$NON_INTERACTIVE" -eq 0 ]]; then
+      local answer=n
+      read -r -p "terraform.tfstate already exists in ${tf_dir}. Re-apply? [y/N] " answer
+      [[ "$answer" =~ ^[Yy] ]] || { info "Aborted."; exit 0; }
+    else
+      warn "terraform.tfstate exists — re-applying (idempotent)."
+    fi
+  fi
+
+  [[ -f "${INSTALL_DIR_CSP}/ssh_key.pub" ]] \
+    && public_key=$(cat "${INSTALL_DIR_CSP}/ssh_key.pub")
+
+  {
+    printf 'team_name          = "%s"\n' "$(escape_tf "${TEAM_NAME:-default}")"
+    printf 'tls_mode           = "self-signed"\n'
+    printf 'tls_hostname       = "%s"\n' "$(escape_tf "${TLS_HOSTNAME:-}")"
+    printf 'envector_endpoint  = "%s"\n' "$(escape_tf "${ENVECTOR_ENDPOINT}")"
+    printf 'envector_api_key   = "%s"\n' "$(escape_tf "${ENVECTOR_API_KEY}")"
+    printf 'vault_index_name   = "%s"\n' "$(escape_tf "${VAULT_INDEX_NAME}")"
+    printf 'runevault_version  = "%s"\n' "$(escape_tf "${VERSION}")"
+    printf 'public_key         = "%s"\n' "$(escape_tf "${public_key}")"
+    printf 'region             = "%s"\n' "$(escape_tf "${CSP_REGION}")"
+    case "$csp" in
+      gcp) printf 'project_id         = "%s"\n' "$(escape_tf "${GCP_PROJECT_ID}")" ;;
+      oci) printf 'compartment_id     = "%s"\n' "$(escape_tf "${OCI_COMPARTMENT_ID}")" ;;
+    esac
+  } > "$tfvars"
+
+  chmod 0600 "$tfvars"
+  [[ -n "${SUDO_USER:-}" ]] && chown "${SUDO_USER}" "$tfvars"
+  success "terraform.tfvars written: ${tfvars}"
+}
+
+csp_run_terraform() {
+  local tf_dir="${INSTALL_DIR_CSP}/deployment"
+  local tf_user="${SUDO_USER:-$(id -un)}"
+
+  info "Running terraform init..."
+  (cd "$tf_dir" && sudo -u "$tf_user" terraform init -input=false)
+  info "Running terraform apply..."
+  (cd "$tf_dir" && sudo -u "$tf_user" terraform apply -auto-approve -input=false)
+
+  chmod 0600 "${tf_dir}/terraform.tfstate" 2>/dev/null || true
+  chmod 0600 "${tf_dir}/terraform.tfstate.backup" 2>/dev/null || true
+  success "Terraform apply complete."
+}
+
+csp_post_deploy() {
+  local tf_dir="${INSTALL_DIR_CSP}/deployment"
+  local tf_user="${SUDO_USER:-$(id -un)}"
+  local key_path="${INSTALL_DIR_CSP}/ssh_key"
+
+  local public_ip
+  public_ip=$(cd "$tf_dir" && sudo -u "$tf_user" terraform output -raw vault_public_ip 2>/dev/null) \
+    || die "Could not read vault_public_ip from terraform output."
+  CSP_PUBLIC_IP="$public_ip"
+
+  info "Waiting for gRPC port 50051 on ${public_ip} (up to 10 min)..."
+  local elapsed=0
+  while [[ $elapsed -lt 600 ]]; do
+    bash -c "echo > /dev/tcp/${public_ip}/50051" 2>/dev/null && break || true
+    sleep 10
+    elapsed=$((elapsed + 10))
+  done
+  if [[ $elapsed -ge 600 ]]; then
+    warn "Timed out waiting for port 50051. The VM may still be initializing."
+  fi
+
+  sleep 30
+
+  info "Fetching CA certificate from VM..."
+  mkdir -p "${INSTALL_DIR_CSP}/certs"
+  [[ -n "${SUDO_USER:-}" ]] && chown "${SUDO_USER}" "${INSTALL_DIR_CSP}/certs"
+  local scp_opts="-o BatchMode=yes -o StrictHostKeyChecking=no -o ConnectTimeout=15"
+  local scp_prefix=""
+  [[ -n "${SUDO_USER:-}" ]] && scp_prefix="sudo -u ${SUDO_USER}"
+  local ca_fetched=0
+  for ssh_user in ubuntu opc; do
+    local attempt
+    for attempt in 1 2 3; do
+      # shellcheck disable=SC2086
+      if $scp_prefix scp $scp_opts -i "$key_path" \
+           "${ssh_user}@${public_ip}:/opt/runevault/certs/ca.pem" \
+           "${INSTALL_DIR_CSP}/certs/ca.pem" 2>/dev/null; then
+        ca_fetched=1
+        break 2
+      fi
+      sleep 10
+    done
+  done
+
+  if [[ "$ca_fetched" -eq 0 ]]; then
+    warn "Could not fetch CA cert automatically. Fetch it manually:"
+    warn "  scp -i ${key_path} ubuntu@${public_ip}:/opt/runevault/certs/ca.pem ${INSTALL_DIR_CSP}/certs/ca.pem"
+  else
+    success "CA certificate saved: ${INSTALL_DIR_CSP}/certs/ca.pem"
+  fi
+}
+
+csp_summary() {
+  local csp=$1
+  local tf_dir="${INSTALL_DIR_CSP}/deployment"
+  local key_path="${INSTALL_DIR_CSP}/ssh_key"
+  local public_ip="${CSP_PUBLIC_IP:-<unknown>}"
+
+  printf '\n'
+  success "Rune-Vault deployed to $(printf '%s' "$csp" | tr 'a-z' 'A-Z')."
+  printf '\n'
+  printf '  Endpoint:  %s:50051\n' "$public_ip"
+  printf '  CA cert:   %s\n'       "${INSTALL_DIR_CSP}/certs/ca.pem"
+  printf '  SSH:       ssh -i %s ubuntu@%s\n' "$key_path" "$public_ip"
+  printf '  Terraform: %s\n'       "$tf_dir"
+  printf '\n'
+  printf 'Tear down:\n'
+  printf '  cd %s && terraform destroy -auto-approve\n' "$tf_dir"
+  printf '\n'
+  printf 'Retrieve team_secret from VM (share securely with team members):\n'
+  printf '  ssh -i %s ubuntu@%s\n' "$key_path" "$public_ip"
+  printf '  sudo grep team_secret /opt/runevault/configs/runevault.conf\n'
+  printf '\n'
+  warn "BACKUP: Keep this safe — it cannot be recovered if lost:"
+  warn "  Terraform state: ${tf_dir}/terraform.tfstate"
+}
+
+csp_dispatch() {
+  local csp="$TARGET"
+  local user_home="${SUDO_USER:+$(eval echo ~"${SUDO_USER}")}"
+  user_home="${user_home:-$HOME}"
+  INSTALL_DIR_CSP="${INSTALL_DIR_CSP:-${user_home}/rune-vault-${csp}}"
+  mkdir -p "$INSTALL_DIR_CSP"
+  [[ -n "${SUDO_USER:-}" ]] && chown "${SUDO_USER}" "$INSTALL_DIR_CSP"
+
+  csp_preflight "$csp"
+
+  if [[ -z "$VERSION" ]]; then
+    info "Resolving latest release version..."
+    VERSION=$(curl -fsSL \
+      "https://api.github.com/repos/${REPO}/releases/latest" \
+      | grep '"tag_name"' | head -1 \
+      | sed 's/.*"tag_name": *"\([^"]*\)".*/\1/')
+    [[ -n "$VERSION" ]] || die "Failed to resolve latest version from GitHub API."
+    info "Latest version: ${VERSION}"
+  fi
+
+  csp_prompt_config "$csp"
+  [[ -n "$VERSION" ]] || die "runevault version is required (use --version <tag>)."
+  csp_generate_ssh_key
+  csp_copy_terraform_files "$csp"
+  csp_render_tfvars "$csp"
+  csp_run_terraform
+  csp_post_deploy
+  csp_summary "$csp"
+  exit 0
+}
+
 # ── Tool auto-install ──────────────────────────────────────────────────────────
 
 # Run brew as the original (non-root) user when invoked via sudo on macOS.
@@ -531,6 +903,7 @@ generate_tls_certs() {
   printf 'DNS.3 = runevault\n'                       >> "$tmpconf"
   printf 'IP.1  = 127.0.0.1\n'                       >> "$tmpconf"
   [[ -n "$public_ip" ]] && printf 'IP.2  = %s\n' "$public_ip" >> "$tmpconf"
+  [[ -n "${RUNEVAULT_TLS_HOSTNAME:-}" ]] && printf 'DNS.4 = %s\n' "${RUNEVAULT_TLS_HOSTNAME}" >> "$tmpconf"
 
   openssl genrsa -out "${cert_dir}/ca.key" 4096 2>/dev/null
   openssl req -new -x509 \
@@ -855,10 +1228,9 @@ post_install() {
 }
 
 # ── Main ───────────────────────────────────────────────────────────────────────
-if [[ "$UNINSTALL" -eq 1 ]]; then
-  run_uninstall
-  exit 0
-fi
+[[ "$UNINSTALL" -eq 1 ]] && { run_uninstall; exit 0; }
+resolve_target
+[[ "$TARGET" != "local" ]] && csp_dispatch
 
 preflight
 download_and_verify

From 08182b400ed52765c74daef595c19a5c25004f36 Mon Sep 17 00:00:00 2001
From: Jeonghwan Lee <jhlee@cryptolab.co.kr>
Date: Mon, 27 Apr 2026 14:09:28 +0900
Subject: [PATCH 11/27] fix: unify team_name for CSP resource naming and vault
 index
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Remove separate vault_index_name and tls_hostname variables — team_name
now serves as both the cloud resource name and the vault index passed to
the VM via RUNEVAULT_TEAM_NAME. Fixes runtime crash after region prompt
caused by VAULT_INDEX_NAME validation on an unset variable.

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
---
 deployment/aws/cloud-init.yaml   |  3 +--
 deployment/aws/main.tf           | 15 ---------------
 deployment/gcp/main.tf           | 15 ---------------
 deployment/gcp/startup-script.sh |  3 +--
 deployment/oci/main.tf           | 15 ---------------
 deployment/oci/startup-script.sh |  3 +--
 install.sh                       | 24 +++++++-----------------
 7 files changed, 10 insertions(+), 68 deletions(-)

diff --git a/deployment/aws/cloud-init.yaml b/deployment/aws/cloud-init.yaml
index 90251d9..bb71ab9 100644
--- a/deployment/aws/cloud-init.yaml
+++ b/deployment/aws/cloud-init.yaml
@@ -5,10 +5,9 @@ packages: [ca-certificates, curl, openssl]
 write_files:
   - path: /etc/profile.d/runevault-installer-env.sh
     content: |
-      export RUNEVAULT_TEAM_NAME='${vault_index_name}'
+      export RUNEVAULT_TEAM_NAME='${team_name}'
       export RUNEVAULT_ENVECTOR_ENDPOINT='${envector_endpoint}'
       export RUNEVAULT_ENVECTOR_API_KEY='${envector_api_key}'
-      export RUNEVAULT_TLS_HOSTNAME='${tls_hostname}'
     permissions: '0600'
 
 runcmd:
diff --git a/deployment/aws/main.tf b/deployment/aws/main.tf
index 95b3d9d..4bea3b0 100644
--- a/deployment/aws/main.tf
+++ b/deployment/aws/main.tf
@@ -32,12 +32,6 @@ variable "tls_mode" {
   default     = "self-signed"
 }
 
-variable "tls_hostname" {
-  description = "Domain name to include in TLS certificate SAN"
-  type        = string
-  default     = ""
-}
-
 variable "envector_endpoint" {
   description = "enVector Cloud endpoint"
   type        = string
@@ -49,12 +43,6 @@ variable "envector_api_key" {
   sensitive   = true
 }
 
-variable "vault_index_name" {
-  description = "Vault index name"
-  type        = string
-  default     = "runecontext"
-}
-
 variable "instance_type" {
   description = "EC2 instance type"
   type        = string
@@ -209,11 +197,8 @@ resource "aws_instance" "vault" {
 
   user_data = templatefile("${path.module}/cloud-init.yaml", {
     team_name          = var.team_name
-    tls_mode           = var.tls_mode
-    tls_hostname       = var.tls_hostname
     envector_endpoint  = var.envector_endpoint
     envector_api_key   = var.envector_api_key
-    vault_index_name   = var.vault_index_name
     runevault_version  = var.runevault_version
   })
 
diff --git a/deployment/gcp/main.tf b/deployment/gcp/main.tf
index 694be53..2268158 100644
--- a/deployment/gcp/main.tf
+++ b/deployment/gcp/main.tf
@@ -47,12 +47,6 @@ variable "tls_mode" {
   default     = "self-signed"
 }
 
-variable "tls_hostname" {
-  description = "Domain name to include in TLS certificate SAN"
-  type        = string
-  default     = ""
-}
-
 variable "envector_endpoint" {
   description = "enVector Cloud endpoint"
   type        = string
@@ -64,12 +58,6 @@ variable "envector_api_key" {
   sensitive   = true
 }
 
-variable "vault_index_name" {
-  description = "Vault index name"
-  type        = string
-  default     = "runecontext"
-}
-
 variable "machine_type" {
   description = "Compute Engine machine type"
   type        = string
@@ -164,11 +152,8 @@ resource "google_compute_instance" "vault" {
 
   metadata_startup_script = templatefile("${path.module}/startup-script.sh", {
     team_name          = var.team_name
-    tls_mode           = var.tls_mode
-    tls_hostname       = var.tls_hostname
     envector_endpoint  = var.envector_endpoint
     envector_api_key   = var.envector_api_key
-    vault_index_name   = var.vault_index_name
     runevault_version  = var.runevault_version
   })
 
diff --git a/deployment/gcp/startup-script.sh b/deployment/gcp/startup-script.sh
index 658cd20..4b8419e 100644
--- a/deployment/gcp/startup-script.sh
+++ b/deployment/gcp/startup-script.sh
@@ -13,10 +13,9 @@ curl -fsSL "https://github.com/sigstore/cosign/releases/latest/download/cosign-l
 chmod 0755 /usr/local/bin/cosign
 
 cat > /etc/profile.d/runevault-installer-env.sh <<'ENVFILE'
-export RUNEVAULT_TEAM_NAME='${vault_index_name}'
+export RUNEVAULT_TEAM_NAME='${team_name}'
 export RUNEVAULT_ENVECTOR_ENDPOINT='${envector_endpoint}'
 export RUNEVAULT_ENVECTOR_API_KEY='${envector_api_key}'
-export RUNEVAULT_TLS_HOSTNAME='${tls_hostname}'
 ENVFILE
 chmod 600 /etc/profile.d/runevault-installer-env.sh
 set -a; . /etc/profile.d/runevault-installer-env.sh; set +a
diff --git a/deployment/oci/main.tf b/deployment/oci/main.tf
index 61b8b33..54daa39 100644
--- a/deployment/oci/main.tf
+++ b/deployment/oci/main.tf
@@ -43,12 +43,6 @@ variable "tls_mode" {
   default     = "self-signed"
 }
 
-variable "tls_hostname" {
-  description = "Domain name to include in TLS certificate SAN"
-  type        = string
-  default     = ""
-}
-
 variable "envector_endpoint" {
   description = "enVector Cloud endpoint"
   type        = string
@@ -60,12 +54,6 @@ variable "envector_api_key" {
   sensitive   = true
 }
 
-variable "vault_index_name" {
-  description = "Vault index name"
-  type        = string
-  default     = "runecontext"
-}
-
 variable "runevault_version" {
   description = "Pinned runevault release tag — drives the install.sh URL and binary version on the VM."
   type        = string
@@ -176,11 +164,8 @@ resource "oci_core_instance" "vault_instance" {
     ssh_authorized_keys = var.public_key
     user_data = base64encode(templatefile("${path.module}/startup-script.sh", {
       team_name          = var.team_name
-      tls_mode           = var.tls_mode
-      tls_hostname       = var.tls_hostname
       envector_endpoint  = var.envector_endpoint
       envector_api_key   = var.envector_api_key
-      vault_index_name   = var.vault_index_name
       runevault_version  = var.runevault_version
     }))
   }
diff --git a/deployment/oci/startup-script.sh b/deployment/oci/startup-script.sh
index 3bdaf3e..9deb2bd 100644
--- a/deployment/oci/startup-script.sh
+++ b/deployment/oci/startup-script.sh
@@ -16,10 +16,9 @@ curl -fsSL "https://github.com/sigstore/cosign/releases/latest/download/cosign-l
 chmod 0755 /usr/local/bin/cosign
 
 cat > /etc/profile.d/runevault-installer-env.sh <<'ENVFILE'
-export RUNEVAULT_TEAM_NAME='${vault_index_name}'
+export RUNEVAULT_TEAM_NAME='${team_name}'
 export RUNEVAULT_ENVECTOR_ENDPOINT='${envector_endpoint}'
 export RUNEVAULT_ENVECTOR_API_KEY='${envector_api_key}'
-export RUNEVAULT_TLS_HOSTNAME='${tls_hostname}'
 ENVFILE
 chmod 600 /etc/profile.d/runevault-installer-env.sh
 set -a; . /etc/profile.d/runevault-installer-env.sh; set +a
diff --git a/install.sh b/install.sh
index 5a58e11..4b5d362 100755
--- a/install.sh
+++ b/install.sh
@@ -23,16 +23,13 @@
 #   RUNEVAULT_ENVECTOR_API_KEY_FILE  envector.api_key_file (alternative)
 #   RUNEVAULT_TLS_CERT_PATH          Path to existing TLS cert (skips auto-gen)
 #   RUNEVAULT_TLS_KEY_PATH           Path to existing TLS key  (skips auto-gen)
-#   RUNEVAULT_TLS_HOSTNAME           Additional DNS SAN for auto-generated TLS cert
 #
 # Non-interactive env vars (CSP install — operator workstation):
 #   RUNEVAULT_ENVECTOR_ENDPOINT      enVector endpoint URL (required)
 #   RUNEVAULT_ENVECTOR_API_KEY       enVector API key (required)
-#   RUNEVAULT_TEAM_NAME              Vault index name (required)
-#   RUNEVAULT_TLS_HOSTNAME           Domain name for TLS SAN on VM cert (optional)
+#   RUNEVAULT_TEAM_NAME              Team name — used for resource naming and vault index (required)
 #   RUNEVAULT_TARGET                 Pre-select target without interactive menu
 #   RUNEVAULT_INSTALL_DIR            Pre-set CSP install directory
-#   RUNEVAULT_CSP_TEAM_NAME          Team name for cloud resource naming
 #   RUNEVAULT_CSP_REGION             Cloud region
 #   RUNEVAULT_GCP_PROJECT_ID         GCP: project ID (required for GCP)
 #   RUNEVAULT_OCI_COMPARTMENT_ID     OCI: compartment OCID (required for OCI)
@@ -267,11 +264,9 @@ csp_prompt_config() {
     printf '  API key from the dashboard.\n'
     printf '\n'
 
-    _prompt ENVECTOR_ENDPOINT  "enVector endpoint"         ""
-    _prompt ENVECTOR_API_KEY   "enVector API key"           ""
-    _prompt VAULT_INDEX_NAME   "Vault index name"           "runecontext"
-    _prompt TEAM_NAME          "Team name (resource naming)" "default"
-    _prompt TLS_HOSTNAME       "TLS hostname / domain SAN (optional, Enter to skip)" ""
+    _prompt TEAM_NAME          "Team name"          ""
+    _prompt ENVECTOR_ENDPOINT  "enVector endpoint"  ""
+    _prompt ENVECTOR_API_KEY   "enVector API key"   ""
 
     case "$csp" in
       aws) _prompt CSP_REGION "AWS region"   "us-east-1"   ;;
@@ -286,19 +281,17 @@ csp_prompt_config() {
     esac
     printf '\n'
   else
+    TEAM_NAME="${RUNEVAULT_TEAM_NAME:-}"
     ENVECTOR_ENDPOINT="${RUNEVAULT_ENVECTOR_ENDPOINT:-}"
     ENVECTOR_API_KEY="${RUNEVAULT_ENVECTOR_API_KEY:-}"
-    VAULT_INDEX_NAME="${RUNEVAULT_TEAM_NAME:-}"
-    TEAM_NAME="${RUNEVAULT_CSP_TEAM_NAME:-default}"
-    TLS_HOSTNAME="${RUNEVAULT_TLS_HOSTNAME:-}"
     CSP_REGION="${RUNEVAULT_CSP_REGION:-}"
     GCP_PROJECT_ID="${RUNEVAULT_GCP_PROJECT_ID:-}"
     OCI_COMPARTMENT_ID="${RUNEVAULT_OCI_COMPARTMENT_ID:-}"
 
     local missing=()
+    [[ -z "$TEAM_NAME" ]]         && missing+=("RUNEVAULT_TEAM_NAME")
     [[ -z "$ENVECTOR_ENDPOINT" ]] && missing+=("RUNEVAULT_ENVECTOR_ENDPOINT")
     [[ -z "$ENVECTOR_API_KEY" ]]  && missing+=("RUNEVAULT_ENVECTOR_API_KEY")
-    [[ -z "$VAULT_INDEX_NAME" ]]  && missing+=("RUNEVAULT_TEAM_NAME")
     [[ "$csp" = gcp && -z "$GCP_PROJECT_ID" ]]      && missing+=("RUNEVAULT_GCP_PROJECT_ID")
     [[ "$csp" = oci && -z "$OCI_COMPARTMENT_ID" ]]  && missing+=("RUNEVAULT_OCI_COMPARTMENT_ID")
     if [[ ${#missing[@]} -gt 0 ]]; then
@@ -308,9 +301,9 @@ csp_prompt_config() {
     fi
   fi
 
+  [[ -n "$TEAM_NAME" ]]          || die "Team name is required."
   [[ -n "$ENVECTOR_ENDPOINT" ]]  || die "enVector endpoint is required."
   [[ -n "$ENVECTOR_API_KEY" ]]   || die "enVector API key is required."
-  [[ -n "$VAULT_INDEX_NAME" ]]   || die "Vault index name is required."
   [[ "$csp" = gcp ]] && { [[ -n "$GCP_PROJECT_ID" ]]     || die "GCP project ID is required."; }
   [[ "$csp" = oci ]] && { [[ -n "$OCI_COMPARTMENT_ID" ]] || die "OCI compartment OCID is required."; }
 
@@ -392,10 +385,8 @@ csp_render_tfvars() {
   {
     printf 'team_name          = "%s"\n' "$(escape_tf "${TEAM_NAME:-default}")"
     printf 'tls_mode           = "self-signed"\n'
-    printf 'tls_hostname       = "%s"\n' "$(escape_tf "${TLS_HOSTNAME:-}")"
     printf 'envector_endpoint  = "%s"\n' "$(escape_tf "${ENVECTOR_ENDPOINT}")"
     printf 'envector_api_key   = "%s"\n' "$(escape_tf "${ENVECTOR_API_KEY}")"
-    printf 'vault_index_name   = "%s"\n' "$(escape_tf "${VAULT_INDEX_NAME}")"
     printf 'runevault_version  = "%s"\n' "$(escape_tf "${VERSION}")"
     printf 'public_key         = "%s"\n' "$(escape_tf "${public_key}")"
     printf 'region             = "%s"\n' "$(escape_tf "${CSP_REGION}")"
@@ -903,7 +894,6 @@ generate_tls_certs() {
   printf 'DNS.3 = runevault\n'                       >> "$tmpconf"
   printf 'IP.1  = 127.0.0.1\n'                       >> "$tmpconf"
   [[ -n "$public_ip" ]] && printf 'IP.2  = %s\n' "$public_ip" >> "$tmpconf"
-  [[ -n "${RUNEVAULT_TLS_HOSTNAME:-}" ]] && printf 'DNS.4 = %s\n' "${RUNEVAULT_TLS_HOSTNAME}" >> "$tmpconf"
 
   openssl genrsa -out "${cert_dir}/ca.key" 4096 2>/dev/null
   openssl req -new -x509 \

From 404c82bf7cc9452e26cc6f5da72801e974bd0d79 Mon Sep 17 00:00:00 2001
From: Jeonghwan Lee <jhlee@cryptolab.co.kr>
Date: Mon, 27 Apr 2026 14:37:44 +0900
Subject: [PATCH 12/27] fix: prevent silent exit when CSP function ends with
 failing &&-chain

csp_prompt_config ended with [[ "$csp" = oci ]] && { ... }, so on AWS
the function's last command returned non-zero. With set -e, the calling
csp_prompt_config invocation in csp_dispatch then killed the script
silently right after the AWS region prompt. Rewrite the GCP/OCI checks
as if-statements; apply the same fix to setup_system.

Also slim csp_preflight to terraform-only with a y/N auto-install prompt
mirroring local preflight, and add terraform install support to
_install_tool (brew on macOS, HashiCorp zip on Linux).

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
---
 install.sh | 69 ++++++++++++++++++++++++++++++++++++++++--------------
 1 file changed, 51 insertions(+), 18 deletions(-)

diff --git a/install.sh b/install.sh
index 4b5d362..47d470e 100755
--- a/install.sh
+++ b/install.sh
@@ -229,24 +229,34 @@ csp_preflight() {
   local csp=$1
   info "Running CSP preflight checks for ${csp}..."
 
-  local missing=0
-  for tool in terraform ssh-keygen scp curl; do
-    command -v "$tool" >/dev/null 2>&1 || { warn "'${tool}' not found."; missing=1; }
-  done
+  if command -v terraform >/dev/null 2>&1; then
+    success "CSP preflight passed."
+    return 0
+  fi
 
-  local csp_cli
-  case "$csp" in
-    aws) csp_cli=aws ;;
-    gcp) csp_cli=gcloud ;;
-    oci) csp_cli=oci ;;
-  esac
-  command -v "$csp_cli" >/dev/null 2>&1 \
-    || { warn "CSP CLI '${csp_cli}' not found. Install and configure credentials."; missing=1; }
+  printf '\n'
+  warn "terraform is not installed."
+  printf '\n'
 
-  if [[ "$missing" -eq 1 ]]; then
-    die "Missing prerequisites above. Install them and re-run."
+  local answer=n
+  if [[ "$NON_INTERACTIVE" -eq 0 ]]; then
+    read -r -p "Install terraform automatically? [y/N] " answer
+  else
+    warn "Non-interactive mode: cannot auto-install terraform."
   fi
 
+  case "$answer" in
+    [Yy]*) _install_tool terraform ;;
+    *)
+      printf 'Install it manually and re-run the installer:\n' >&2
+      case "$OS_SLUG" in
+        linux)  printf '  terraform: https://developer.hashicorp.com/terraform/install\n' >&2 ;;
+        darwin) printf '  terraform: brew install terraform\n' >&2 ;;
+      esac
+      exit 1
+      ;;
+  esac
+
   success "CSP preflight passed."
 }
 
@@ -304,9 +314,12 @@ csp_prompt_config() {
   [[ -n "$TEAM_NAME" ]]          || die "Team name is required."
   [[ -n "$ENVECTOR_ENDPOINT" ]]  || die "enVector endpoint is required."
   [[ -n "$ENVECTOR_API_KEY" ]]   || die "enVector API key is required."
-  [[ "$csp" = gcp ]] && { [[ -n "$GCP_PROJECT_ID" ]]     || die "GCP project ID is required."; }
-  [[ "$csp" = oci ]] && { [[ -n "$OCI_COMPARTMENT_ID" ]] || die "OCI compartment OCID is required."; }
-
+  if [[ "$csp" = gcp ]]; then
+    [[ -n "$GCP_PROJECT_ID" ]]     || die "GCP project ID is required."
+  fi
+  if [[ "$csp" = oci ]]; then
+    [[ -n "$OCI_COMPARTMENT_ID" ]] || die "OCI compartment OCID is required."
+  fi
 }
 
 csp_generate_ssh_key() {
@@ -555,8 +568,26 @@ _install_tool() {
       ;;
     linux:openssl)  _pkg_install openssl ;;
     linux:sha256sum) _pkg_install coreutils ;;
+    linux:terraform)
+      local tf_version arch_suffix=amd64
+      [[ "$ARCH_SLUG" = arm64 ]] && arch_suffix=arm64
+      tf_version=$(curl -fsSL https://api.github.com/repos/hashicorp/terraform/releases/latest \
+        | grep '"tag_name"' | head -1 \
+        | sed 's/.*"tag_name": *"v\([^"]*\)".*/\1/')
+      [[ -n "$tf_version" ]] || die "Failed to resolve latest terraform version."
+      command -v unzip >/dev/null 2>&1 || _pkg_install unzip
+      local tmpdir
+      tmpdir=$(mktemp -d)
+      curl -fsSL \
+        "https://releases.hashicorp.com/terraform/${tf_version}/terraform_${tf_version}_linux_${arch_suffix}.zip" \
+        -o "${tmpdir}/tf.zip"
+      unzip -o "${tmpdir}/tf.zip" -d "${tmpdir}" >/dev/null
+      install -m 0755 "${tmpdir}/terraform" /usr/local/bin/terraform
+      rm -rf "${tmpdir}"
+      ;;
     darwin:cosign)  _brew install cosign ;;
     darwin:openssl) _brew install openssl ;;
+    darwin:terraform) _brew install terraform ;;
     darwin:shasum)
       die "shasum is pre-installed on macOS. Something is very wrong." ;;
     *:systemctl)
@@ -851,7 +882,9 @@ setup_system() {
   install -m 0755 "$SCRATCH/runevault" "$BINARY_DEST"
   success "Binary installed: ${BINARY_DEST}"
 
-  [[ "$SKIP_SERVICE" -eq 0 ]] && _add_invoking_user_to_group
+  if [[ "$SKIP_SERVICE" -eq 0 ]]; then
+    _add_invoking_user_to_group
+  fi
 }
 
 # ── Phase 5: TLS certificates ──────────────────────────────────────────────────

From 1f2c3a7145ca65f6ab0a447be9a53c610fa19678 Mon Sep 17 00:00:00 2001
From: Jeonghwan Lee <jhlee@cryptolab.co.kr>
Date: Mon, 27 Apr 2026 14:56:17 +0900
Subject: [PATCH 13/27] fix: poll CA cert via SCP until VM install actually
 completes

Previously csp_post_deploy waited for port 50051 (10 min) plus a fixed
30s sleep, then made 6 short SCP attempts. If the VM-side install was
slow or the cert hadn't been generated yet, SCP failed and the script
fell back to a useless "retry the same SCP" warning.

Replace the port wait + fixed sleep with a single SCP polling loop that
retries every 15s for up to 30 min. SCP succeeds the moment the VM has
generated /opt/runevault/certs/ca.pem, which is the precise signal we
care about. On timeout, die with a pointer to the VM-side install log.

Also pick ssh_user from $csp instead of trying ubuntu/opc in turn.

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
---
 install.sh | 63 ++++++++++++++++++++++++++----------------------------
 1 file changed, 30 insertions(+), 33 deletions(-)

diff --git a/install.sh b/install.sh
index 47d470e..f48429f 100755
--- a/install.sh
+++ b/install.sh
@@ -429,6 +429,7 @@ csp_run_terraform() {
 }
 
 csp_post_deploy() {
+  local csp=$1
   local tf_dir="${INSTALL_DIR_CSP}/deployment"
   local tf_user="${SUDO_USER:-$(id -un)}"
   local key_path="${INSTALL_DIR_CSP}/ssh_key"
@@ -438,46 +439,33 @@ csp_post_deploy() {
     || die "Could not read vault_public_ip from terraform output."
   CSP_PUBLIC_IP="$public_ip"
 
-  info "Waiting for gRPC port 50051 on ${public_ip} (up to 10 min)..."
-  local elapsed=0
-  while [[ $elapsed -lt 600 ]]; do
-    bash -c "echo > /dev/tcp/${public_ip}/50051" 2>/dev/null && break || true
-    sleep 10
-    elapsed=$((elapsed + 10))
-  done
-  if [[ $elapsed -ge 600 ]]; then
-    warn "Timed out waiting for port 50051. The VM may still be initializing."
-  fi
-
-  sleep 30
+  local ssh_user
+  case "$csp" in
+    oci) ssh_user=opc ;;
+    *)   ssh_user=ubuntu ;;
+  esac
 
-  info "Fetching CA certificate from VM..."
   mkdir -p "${INSTALL_DIR_CSP}/certs"
   [[ -n "${SUDO_USER:-}" ]] && chown "${SUDO_USER}" "${INSTALL_DIR_CSP}/certs"
   local scp_opts="-o BatchMode=yes -o StrictHostKeyChecking=no -o ConnectTimeout=15"
   local scp_prefix=""
   [[ -n "${SUDO_USER:-}" ]] && scp_prefix="sudo -u ${SUDO_USER}"
-  local ca_fetched=0
-  for ssh_user in ubuntu opc; do
-    local attempt
-    for attempt in 1 2 3; do
-      # shellcheck disable=SC2086
-      if $scp_prefix scp $scp_opts -i "$key_path" \
-           "${ssh_user}@${public_ip}:/opt/runevault/certs/ca.pem" \
-           "${INSTALL_DIR_CSP}/certs/ca.pem" 2>/dev/null; then
-        ca_fetched=1
-        break 2
-      fi
-      sleep 10
-    done
+
+  local timeout_secs=1800
+  info "Waiting for VM install to finish and CA cert to appear (up to $((timeout_secs / 60)) min)..."
+  local deadline=$(( $(date +%s) + timeout_secs ))
+  while [[ $(date +%s) -lt $deadline ]]; do
+    # shellcheck disable=SC2086
+    if $scp_prefix scp $scp_opts -i "$key_path" \
+         "${ssh_user}@${public_ip}:/opt/runevault/certs/ca.pem" \
+         "${INSTALL_DIR_CSP}/certs/ca.pem" 2>/dev/null; then
+      success "CA certificate saved: ${INSTALL_DIR_CSP}/certs/ca.pem"
+      return 0
+    fi
+    sleep 15
   done
 
-  if [[ "$ca_fetched" -eq 0 ]]; then
-    warn "Could not fetch CA cert automatically. Fetch it manually:"
-    warn "  scp -i ${key_path} ubuntu@${public_ip}:/opt/runevault/certs/ca.pem ${INSTALL_DIR_CSP}/certs/ca.pem"
-  else
-    success "CA certificate saved: ${INSTALL_DIR_CSP}/certs/ca.pem"
-  fi
+  die "Timed out waiting for VM-side install. SSH in and check /var/log/runevault-install.log: ssh -i ${key_path} ${ssh_user}@${public_ip}"
 }
 
 csp_summary() {
@@ -531,7 +519,7 @@ csp_dispatch() {
   csp_copy_terraform_files "$csp"
   csp_render_tfvars "$csp"
   csp_run_terraform
-  csp_post_deploy
+  csp_post_deploy "$csp"
   csp_summary "$csp"
   exit 0
 }
@@ -841,6 +829,15 @@ _create_system_user() {
 
 _add_invoking_user_to_group() {
   local invoking_user="${SUDO_USER:-}"
+  if [[ -z "$invoking_user" && "$OS_SLUG" = linux ]]; then
+    local candidate
+    for candidate in ubuntu ec2-user debian opc; do
+      if id -u "$candidate" >/dev/null 2>&1; then
+        invoking_user="$candidate"
+        break
+      fi
+    done
+  fi
   [[ -z "$invoking_user" ]] && return 0
   if [[ "$OS_SLUG" = linux ]]; then
     usermod -aG "$SERVICE_USER" "$invoking_user"

From 11aea029edcbb67585f614ddea4056ecdc335234 Mon Sep 17 00:00:00 2001
From: Jeonghwan Lee <jhlee@cryptolab.co.kr>
Date: Mon, 27 Apr 2026 15:27:48 +0900
Subject: [PATCH 14/27] fix: add cloud default user to runevault group in
 cloud-init
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The VM-side install.sh runs as root via cloud-init, so SUDO_USER is
empty and _add_invoking_user_to_group is a no-op — the canonical SSH
user (ubuntu on all three CSPs) ends up outside the runevault group
and can't reach /opt/runevault/admin.sock or /opt/runevault/certs.

Add an explicit "usermod -aG runevault ubuntu" right after install.sh
in each cloud-init / startup-script. Drop the auto-detect fallback in
install.sh now that cloud-init owns this responsibility for cloud
deploys; local installs still pick up SUDO_USER as before.

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
---
 deployment/aws/cloud-init.yaml   | 1 +
 deployment/gcp/startup-script.sh | 2 ++
 deployment/oci/startup-script.sh | 2 ++
 install.sh                       | 9 ---------
 4 files changed, 5 insertions(+), 9 deletions(-)

diff --git a/deployment/aws/cloud-init.yaml b/deployment/aws/cloud-init.yaml
index bb71ab9..78e4643 100644
--- a/deployment/aws/cloud-init.yaml
+++ b/deployment/aws/cloud-init.yaml
@@ -24,4 +24,5 @@ runcmd:
         sleep $((i*10))
       done
       bash /tmp/install.sh --target local --non-interactive --version "${runevault_version}"
+  - usermod -aG runevault ubuntu
   - rm -f /etc/profile.d/runevault-installer-env.sh
diff --git a/deployment/gcp/startup-script.sh b/deployment/gcp/startup-script.sh
index 4b8419e..141fee4 100644
--- a/deployment/gcp/startup-script.sh
+++ b/deployment/gcp/startup-script.sh
@@ -28,5 +28,7 @@ done
 
 bash /tmp/install.sh --target local --non-interactive --version "${runevault_version}"
 
+usermod -aG runevault ubuntu
+
 rm -f /etc/profile.d/runevault-installer-env.sh
 echo "=== completed at $(date) ==="
diff --git a/deployment/oci/startup-script.sh b/deployment/oci/startup-script.sh
index 9deb2bd..78c881e 100644
--- a/deployment/oci/startup-script.sh
+++ b/deployment/oci/startup-script.sh
@@ -31,5 +31,7 @@ done
 
 bash /tmp/install.sh --target local --non-interactive --version "${runevault_version}"
 
+usermod -aG runevault ubuntu
+
 rm -f /etc/profile.d/runevault-installer-env.sh
 echo "=== completed at $(date) ==="
diff --git a/install.sh b/install.sh
index f48429f..eb5dfcf 100755
--- a/install.sh
+++ b/install.sh
@@ -829,15 +829,6 @@ _create_system_user() {
 
 _add_invoking_user_to_group() {
   local invoking_user="${SUDO_USER:-}"
-  if [[ -z "$invoking_user" && "$OS_SLUG" = linux ]]; then
-    local candidate
-    for candidate in ubuntu ec2-user debian opc; do
-      if id -u "$candidate" >/dev/null 2>&1; then
-        invoking_user="$candidate"
-        break
-      fi
-    done
-  fi
   [[ -z "$invoking_user" ]] && return 0
   if [[ "$OS_SLUG" = linux ]]; then
     usermod -aG "$SERVICE_USER" "$invoking_user"

From 28ea1a60b109b5d2727caa7aa69eebeca16a4606 Mon Sep 17 00:00:00 2001
From: Jeonghwan Lee <jhlee@cryptolab.co.kr>
Date: Mon, 27 Apr 2026 15:38:40 +0900
Subject: [PATCH 15/27] chore: replace team_secret retrieval with SSH-based
 Next steps in CSP summary

team_secret no longer surfaces in operator-facing output (auto-generated
on the VM, not relevant to share). Replace that section with a Next
steps block that SSHes into the VM and runs runevault commands there,
mirroring the local install's Next steps. Same block for all three
CSPs since AWS/GCP/OCI all use Ubuntu 22.04 + systemd.

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
---
 install.sh | 8 ++++++--
 1 file changed, 6 insertions(+), 2 deletions(-)

diff --git a/install.sh b/install.sh
index eb5dfcf..fe00a60 100755
--- a/install.sh
+++ b/install.sh
@@ -485,9 +485,13 @@ csp_summary() {
   printf 'Tear down:\n'
   printf '  cd %s && terraform destroy -auto-approve\n' "$tf_dir"
   printf '\n'
-  printf 'Retrieve team_secret from VM (share securely with team members):\n'
+  printf 'Next steps (SSH into the VM, then run on the VM):\n'
   printf '  ssh -i %s ubuntu@%s\n' "$key_path" "$public_ip"
-  printf '  sudo grep team_secret /opt/runevault/configs/runevault.conf\n'
+  printf '\n'
+  printf '  Issue a token:  runevault token issue --user <name> --role member\n'
+  printf '  Check status:   runevault status\n'
+  printf '  View logs:      journalctl -u runevault -f\n'
+  printf '  Manage daemon:  sudo systemctl start|stop|restart runevault\n'
   printf '\n'
   warn "BACKUP: Keep this safe — it cannot be recovered if lost:"
   warn "  Terraform state: ${tf_dir}/terraform.tfstate"

From d3ea1b12295a7938247f4e98a9c4d2ac5dec5883 Mon Sep 17 00:00:00 2001
From: Jeonghwan Lee <jhlee@cryptolab.co.kr>
Date: Mon, 27 Apr 2026 16:00:32 +0900
Subject: [PATCH 16/27] feat: tighten CSP preflight with CLI presence + auth
 checks

Terraform's default credential chain is satisfied by the cloud CLI's
auth artifacts in practice (~/.aws/credentials, gcloud ADC file,
~/.oci/config), so verifying the CLI is installed and authenticated
catches the most common "terraform apply silently fails" cause early.

Run "<cli> <non-destructive-auth-call>" as $SUDO_USER (the user that
csp_run_terraform will run terraform under) so the check matches the
actual credential resolution path:
  - aws sts get-caller-identity
  - gcloud auth application-default print-access-token
  - oci iam region list

Also point both local install and CSP summary to "runevault logs" for
the View logs hint, replacing the per-OS journalctl/tail snippets now
that the CLI provides a unified entrypoint.

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
---
 install.sh | 73 +++++++++++++++++++++++++++++++++++-------------------
 1 file changed, 48 insertions(+), 25 deletions(-)

diff --git a/install.sh b/install.sh
index fe00a60..256b983 100755
--- a/install.sh
+++ b/install.sh
@@ -229,33 +229,57 @@ csp_preflight() {
   local csp=$1
   info "Running CSP preflight checks for ${csp}..."
 
-  if command -v terraform >/dev/null 2>&1; then
-    success "CSP preflight passed."
-    return 0
+  if ! command -v terraform >/dev/null 2>&1; then
+    printf '\n'
+    warn "terraform is not installed."
+    printf '\n'
+    local answer=n
+    if [[ "$NON_INTERACTIVE" -eq 0 ]]; then
+      read -r -p "Install terraform automatically? [y/N] " answer
+    else
+      warn "Non-interactive mode: cannot auto-install terraform."
+    fi
+    case "$answer" in
+      [Yy]*) _install_tool terraform ;;
+      *)
+        printf 'Install it manually and re-run the installer:\n' >&2
+        case "$OS_SLUG" in
+          linux)  printf '  terraform: https://developer.hashicorp.com/terraform/install\n' >&2 ;;
+          darwin) printf '  terraform: brew install terraform\n' >&2 ;;
+        esac
+        exit 1
+        ;;
+    esac
   fi
 
-  printf '\n'
-  warn "terraform is not installed."
-  printf '\n'
+  local csp_cli auth_cmd auth_setup
+  case "$csp" in
+    aws)
+      csp_cli=aws
+      auth_cmd='aws sts get-caller-identity'
+      auth_setup='aws configure'
+      ;;
+    gcp)
+      csp_cli=gcloud
+      auth_cmd='gcloud auth application-default print-access-token'
+      auth_setup='gcloud auth application-default login'
+      ;;
+    oci)
+      csp_cli=oci
+      auth_cmd='oci iam region list'
+      auth_setup='oci setup config'
+      ;;
+  esac
 
-  local answer=n
-  if [[ "$NON_INTERACTIVE" -eq 0 ]]; then
-    read -r -p "Install terraform automatically? [y/N] " answer
-  else
-    warn "Non-interactive mode: cannot auto-install terraform."
+  local tf_user="${SUDO_USER:-$(id -un)}"
+
+  if ! sudo -u "$tf_user" -H bash -lc "command -v ${csp_cli}" >/dev/null 2>&1; then
+    die "'${csp_cli}' CLI not found in PATH for user '${tf_user}'. Install it and re-run."
   fi
 
-  case "$answer" in
-    [Yy]*) _install_tool terraform ;;
-    *)
-      printf 'Install it manually and re-run the installer:\n' >&2
-      case "$OS_SLUG" in
-        linux)  printf '  terraform: https://developer.hashicorp.com/terraform/install\n' >&2 ;;
-        darwin) printf '  terraform: brew install terraform\n' >&2 ;;
-      esac
-      exit 1
-      ;;
-  esac
+  if ! sudo -u "$tf_user" -H bash -lc "${auth_cmd}" >/dev/null 2>&1; then
+    die "'${csp_cli}' is not authenticated for user '${tf_user}'. Authenticate and re-run: ${auth_setup}"
+  fi
 
   success "CSP preflight passed."
 }
@@ -490,7 +514,7 @@ csp_summary() {
   printf '\n'
   printf '  Issue a token:  runevault token issue --user <name> --role member\n'
   printf '  Check status:   runevault status\n'
-  printf '  View logs:      journalctl -u runevault -f\n'
+  printf '  View logs:      runevault logs\n'
   printf '  Manage daemon:  sudo systemctl start|stop|restart runevault\n'
   printf '\n'
   warn "BACKUP: Keep this safe — it cannot be recovered if lost:"
@@ -1223,11 +1247,10 @@ post_install() {
   printf 'Next steps:\n'
   printf '  Issue a token:  runevault token issue --user <name> --role member\n'
   printf '  Check status:   runevault status\n'
+  printf '  View logs:      runevault logs\n'
   if [[ "$OS_SLUG" = linux ]]; then
-    printf '  View logs:      journalctl -u runevault -f\n'
     printf '  Manage daemon:  sudo systemctl start|stop|restart runevault\n'
   else
-    printf '  View logs:      tail -f %s/logs/runevault.stderr.log\n' "${INSTALL_PREFIX}"
     printf '  Manage daemon:  sudo launchctl bootout system/com.cryptolabinc.runevault\n'
     printf '                  sudo launchctl bootstrap system /Library/LaunchDaemons/com.cryptolabinc.runevault.plist\n'
   fi

From 8e8ce33d56ea8e6659a81352fa2239395892d168 Mon Sep 17 00:00:00 2001
From: Jeonghwan Lee <jhlee@cryptolab.co.kr>
Date: Mon, 27 Apr 2026 16:08:02 +0900
Subject: [PATCH 17/27] chore: bump cloud VM images to Ubuntu 24.04 LTS

Update AMI/image filters across all three CSPs:
- AWS: ubuntu-noble-24.04 on hvm-ssd-gp3
- GCP: ubuntu-2404-lts-amd64
- OCI: Canonical-Ubuntu-24.04-* filtered by VM.Standard.E5.Flex compatibility

The OCI bump also fixes the launch failure on ap-seoul-1 where the
22.04 image wasn't compatible with E5.Flex shape.

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
---
 deployment/aws/main.tf |  2 +-
 deployment/gcp/main.tf |  2 +-
 deployment/oci/main.tf | 12 +++++++-----
 3 files changed, 9 insertions(+), 7 deletions(-)

diff --git a/deployment/aws/main.tf b/deployment/aws/main.tf
index 4bea3b0..f9e3ef5 100644
--- a/deployment/aws/main.tf
+++ b/deployment/aws/main.tf
@@ -67,7 +67,7 @@ data "aws_ami" "ubuntu" {
 
   filter {
     name   = "name"
-    values = ["ubuntu/images/hvm-ssd/ubuntu-jammy-22.04-amd64-server-*"]
+    values = ["ubuntu/images/hvm-ssd-gp3/ubuntu-noble-24.04-amd64-server-*"]
   }
 
   filter {
diff --git a/deployment/gcp/main.tf b/deployment/gcp/main.tf
index 2268158..3a5d9f0 100644
--- a/deployment/gcp/main.tf
+++ b/deployment/gcp/main.tf
@@ -132,7 +132,7 @@ resource "google_compute_instance" "vault" {
 
   boot_disk {
     initialize_params {
-      image = "ubuntu-os-cloud/ubuntu-2204-lts"
+      image = "ubuntu-os-cloud/ubuntu-2404-lts-amd64"
       size  = 20
       type  = "pd-standard"
     }
diff --git a/deployment/oci/main.tf b/deployment/oci/main.tf
index 54daa39..39febaa 100644
--- a/deployment/oci/main.tf
+++ b/deployment/oci/main.tf
@@ -177,14 +177,16 @@ data "oci_identity_availability_domains" "ads" {
 }
 
 data "oci_core_images" "ubuntu_image" {
-  compartment_id   = var.compartment_id
-  operating_system = "Canonical Ubuntu"
-  sort_by          = "TIMECREATED"
-  sort_order       = "DESC"
+  compartment_id           = var.compartment_id
+  operating_system         = "Canonical Ubuntu"
+  operating_system_version = "24.04"
+  shape                    = "VM.Standard.E5.Flex"
+  sort_by                  = "TIMECREATED"
+  sort_order               = "DESC"
 
   filter {
     name   = "display_name"
-    values = ["^Canonical-Ubuntu-22.04-.*"]
+    values = ["^Canonical-Ubuntu-24.04-.*"]
     regex  = true
   }
 }

From 83ca17dbc3f3be1b63432321d67465643c87a6e8 Mon Sep 17 00:00:00 2001
From: Jeonghwan Lee <jhlee@cryptolab.co.kr>
Date: Mon, 27 Apr 2026 16:23:49 +0900
Subject: [PATCH 18/27] fix: use ubuntu as SCP user on OCI

OCI launches the Canonical Ubuntu cloud image, whose default SSH user
is 'ubuntu' (the 'opc' default belongs to Oracle Linux images, which
we don't deploy). The csp_post_deploy SCP polling loop was hard-coded
to opc for OCI, so it would loop forever connecting as a non-existent
user. Use 'ubuntu' for all three CSPs.

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
---
 install.sh | 6 +-----
 1 file changed, 1 insertion(+), 5 deletions(-)

diff --git a/install.sh b/install.sh
index 256b983..325abc3 100755
--- a/install.sh
+++ b/install.sh
@@ -463,11 +463,7 @@ csp_post_deploy() {
     || die "Could not read vault_public_ip from terraform output."
   CSP_PUBLIC_IP="$public_ip"
 
-  local ssh_user
-  case "$csp" in
-    oci) ssh_user=opc ;;
-    *)   ssh_user=ubuntu ;;
-  esac
+  local ssh_user=ubuntu
 
   mkdir -p "${INSTALL_DIR_CSP}/certs"
   [[ -n "${SUDO_USER:-}" ]] && chown "${SUDO_USER}" "${INSTALL_DIR_CSP}/certs"

From e125cd1ad370e1fb68ac2dcd3f26c5c78432f7dc Mon Sep 17 00:00:00 2001
From: Jeonghwan Lee <jhlee@cryptolab.co.kr>
Date: Thu, 30 Apr 2026 09:45:41 +0900
Subject: [PATCH 19/27] feat: add CSP uninstall flow that wraps terraform
 destroy
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

run_uninstall now dispatches by --target. Local keeps the existing
service + files + data flow; CSP targets call the new csp_uninstall,
which runs terraform destroy against the install dir's terraform.tfstate
and optionally removes the directory afterwards. Operators no longer
have to manually cd into the install dir to tear down cloud
infrastructure — --uninstall --target aws|gcp|oci is enough.

Also switches the interactive target prompt label between "installation"
and "uninstall" to match the active flow, and reorders main so target
is resolved before the uninstall dispatch.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 install.sh | 74 +++++++++++++++++++++++++++++++++++++++++++++++++++---
 1 file changed, 70 insertions(+), 4 deletions(-)

diff --git a/install.sh b/install.sh
index 325abc3..b11ef54 100755
--- a/install.sh
+++ b/install.sh
@@ -14,7 +14,9 @@
 #   --install-dir <path>          CSP install directory (default: $HOME/rune-vault-<csp>)
 #   --force                       Overwrite existing config and TLS certificates
 #   --non-interactive             Skip all prompts; supply secrets via env vars
-#   --uninstall                   Stop the service, remove files, optionally delete data
+#   --uninstall                   Tear down the install. Local: stop service + remove files
+#                                 (optionally delete data). CSP: run 'terraform destroy' and
+#                                 optionally remove the install directory.
 #
 # Non-interactive env vars (local install):
 #   RUNEVAULT_TEAM_NAME              keys.index_name (required)
@@ -111,7 +113,13 @@ esac
 # ── Uninstall flow ─────────────────────────────────────────────────────────────
 run_uninstall() {
   info "Uninstalling Rune-Vault..."
-  [[ "$(id -u)" -eq 0 ]] || die "Uninstall must be run as root (use sudo)."
+
+  if [[ "$TARGET" != "local" ]]; then
+    csp_uninstall "$TARGET"
+    return 0
+  fi
+
+  [[ "$(id -u)" -eq 0 ]] || die "Local uninstall must be run as root (use sudo)."
 
   if [[ "$OS_SLUG" = linux ]]; then
     if systemctl is-active --quiet runevault.service 2>/dev/null; then
@@ -204,8 +212,10 @@ resolve_target() {
     return 0
   fi
   if [[ "$NON_INTERACTIVE" -eq 0 && -t 0 ]]; then
+    local action="installation"
+    [[ "$UNINSTALL" -eq 1 ]] && action="uninstall"
     printf '\n'
-    printf '  Select installation target:\n'
+    printf '  Select %s target:\n' "$action"
     printf '    1) Local (this machine)\n'
     printf '    2) AWS\n'
     printf '    3) GCP\n'
@@ -517,6 +527,62 @@ csp_summary() {
   warn "  Terraform state: ${tf_dir}/terraform.tfstate"
 }
 
+csp_uninstall() {
+  local csp=$1
+  local user_home="${SUDO_USER:+$(eval echo ~"${SUDO_USER}")}"
+  user_home="${user_home:-$HOME}"
+  INSTALL_DIR_CSP="${INSTALL_DIR_CSP:-${user_home}/rune-vault-${csp}}"
+  local tf_dir="${INSTALL_DIR_CSP}/deployment"
+
+  if [[ ! -f "${tf_dir}/terraform.tfstate" ]]; then
+    warn "No terraform.tfstate found at ${tf_dir}/terraform.tfstate — nothing to destroy."
+    return 0
+  fi
+
+  command -v terraform >/dev/null 2>&1 \
+    || die "terraform is required to destroy CSP infrastructure. Install it: https://developer.hashicorp.com/terraform/install"
+
+  printf '\n'
+  warn "This will run 'terraform destroy' on the ${csp} infrastructure at:"
+  warn "  ${tf_dir}"
+  warn "All cloud resources (VM, network, etc.) will be removed permanently."
+  printf '\n'
+
+  if [[ "$NON_INTERACTIVE" -eq 0 ]]; then
+    local answer=n
+    read -r -p "Continue? [y/N] " answer
+    [[ "$answer" =~ ^[Yy] ]] || { info "Aborted."; exit 0; }
+  fi
+
+  local tf_user="${SUDO_USER:-$(id -un)}"
+  info "Running terraform destroy in ${tf_dir}..."
+  (cd "$tf_dir" && sudo -u "$tf_user" terraform destroy -auto-approve)
+  success "Cloud infrastructure destroyed."
+
+  printf '\n'
+  warn "The following directory contains terraform state, SSH keys, and CA cert:"
+  warn "  ${INSTALL_DIR_CSP}/"
+  printf '\n'
+
+  if [[ "$NON_INTERACTIVE" -eq 1 ]]; then
+    warn "Non-interactive mode: directory preserved. Remove manually: rm -rf ${INSTALL_DIR_CSP}"
+  else
+    local answer=n
+    read -r -p "Delete the entire directory? [y/N] " answer
+    case "$answer" in
+      [Yy]*)
+        rm -rf "${INSTALL_DIR_CSP}"
+        success "Directory removed: ${INSTALL_DIR_CSP}"
+        ;;
+      *)
+        info "Directory preserved: ${INSTALL_DIR_CSP}"
+        ;;
+    esac
+  fi
+
+  success "Rune-Vault ${csp} infrastructure uninstalled."
+}
+
 csp_dispatch() {
   local csp="$TARGET"
   local user_home="${SUDO_USER:+$(eval echo ~"${SUDO_USER}")}"
@@ -1262,8 +1328,8 @@ post_install() {
 }
 
 # ── Main ───────────────────────────────────────────────────────────────────────
-[[ "$UNINSTALL" -eq 1 ]] && { run_uninstall; exit 0; }
 resolve_target
+[[ "$UNINSTALL" -eq 1 ]] && { run_uninstall; exit 0; }
 [[ "$TARGET" != "local" ]] && csp_dispatch
 
 preflight

From c67f99fe52272191a1025d6ffb9f611fd305c5e2 Mon Sep 17 00:00:00 2001
From: Jeonghwan Lee <jhlee@cryptolab.co.kr>
Date: Thu, 30 Apr 2026 09:45:48 +0900
Subject: [PATCH 20/27] feat: round out dev installer with prompts, uninstall,
 and CSP variants

- install-dev.sh prompts for enVector endpoint and API key on
  interactive local installs (previously silently used placeholder
  defaults, producing a non-functional vault on every dev local run).
- install-dev.sh forwards --uninstall to install.sh for both local and
  CSP targets, skipping the dev preflight/build path. The CSP variant
  reuses install.sh's new csp_uninstall (terraform destroy) wrapper.
- Add dev cloud-init / startup-script variants that only install
  prereqs (cosign + apt packages); install.sh + the locally built
  binary are SCP'd in by install-dev.sh after cloud-init finishes.
  AWS variant escapes \${carch} as \$\${carch} so terraform's
  templatefile() leaves the shell expansion intact.
- Switch resolve_target label between "install" and "uninstall" to
  match the active flow.
- Default team_name changed from "dev-team" to "devteam" because
  vault index names cannot contain hyphens.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 deployment/aws/cloud-init-dev.yaml   |  10 +
 deployment/gcp/startup-script-dev.sh |  16 +
 deployment/oci/startup-script-dev.sh |  19 +
 scripts/install-dev.sh               | 691 +++++++++++++++++++++++++--
 4 files changed, 707 insertions(+), 29 deletions(-)
 create mode 100644 deployment/aws/cloud-init-dev.yaml
 create mode 100755 deployment/gcp/startup-script-dev.sh
 create mode 100755 deployment/oci/startup-script-dev.sh

diff --git a/deployment/aws/cloud-init-dev.yaml b/deployment/aws/cloud-init-dev.yaml
new file mode 100644
index 0000000..76dbf8a
--- /dev/null
+++ b/deployment/aws/cloud-init-dev.yaml
@@ -0,0 +1,10 @@
+#cloud-config
+# Dev mode: installs prereqs only. install.sh is injected via SCP by install-dev.sh.
+package_update: true
+packages: [ca-certificates, curl, openssl]
+
+runcmd:
+  - |
+      arch=$(dpkg --print-architecture); [ "$arch" = "amd64" ] && carch=amd64 || carch=arm64
+      curl -fsSL "https://github.com/sigstore/cosign/releases/latest/download/cosign-linux-$${carch}" -o /usr/local/bin/cosign
+      chmod 0755 /usr/local/bin/cosign
diff --git a/deployment/gcp/startup-script-dev.sh b/deployment/gcp/startup-script-dev.sh
new file mode 100755
index 0000000..26d08e3
--- /dev/null
+++ b/deployment/gcp/startup-script-dev.sh
@@ -0,0 +1,16 @@
+#!/bin/bash
+# Dev mode: installs prereqs only. install.sh + binary injected via SCP by install-dev.sh.
+set -euo pipefail
+exec > /var/log/runevault-install.log 2>&1
+echo "=== runevault dev startup at $(date) ==="
+
+for i in $(seq 1 30); do
+  apt-get update -q && apt-get install -y ca-certificates curl openssl && break
+  echo "apt retry $i..." && sleep 10
+done
+
+arch=$(dpkg --print-architecture); [ "$arch" = "amd64" ] && carch=amd64 || carch=arm64
+curl -fsSL "https://github.com/sigstore/cosign/releases/latest/download/cosign-linux-$${carch}" -o /usr/local/bin/cosign
+chmod 0755 /usr/local/bin/cosign
+
+echo "=== prereqs ready at $(date), waiting for install-dev.sh injection ==="
diff --git a/deployment/oci/startup-script-dev.sh b/deployment/oci/startup-script-dev.sh
new file mode 100755
index 0000000..e813044
--- /dev/null
+++ b/deployment/oci/startup-script-dev.sh
@@ -0,0 +1,19 @@
+#!/bin/bash
+# Dev mode: installs prereqs only. install.sh + binary injected via SCP by install-dev.sh.
+set -euo pipefail
+exec > /var/log/runevault-install.log 2>&1
+echo "=== runevault dev startup at $(date) ==="
+
+for i in $(seq 1 30); do
+  apt-get update -q \
+    && apt-get -y --fix-broken install \
+    && apt-get install -y ca-certificates curl openssl \
+    && break
+  echo "apt retry $i..." && sleep 10
+done
+
+arch=$(dpkg --print-architecture); [ "$arch" = "amd64" ] && carch=amd64 || carch=arm64
+curl -fsSL "https://github.com/sigstore/cosign/releases/latest/download/cosign-linux-$${carch}" -o /usr/local/bin/cosign
+chmod 0755 /usr/local/bin/cosign
+
+echo "=== prereqs ready at $(date), waiting for install-dev.sh injection ==="
diff --git a/scripts/install-dev.sh b/scripts/install-dev.sh
index 5dbbcdf..90336cf 100755
--- a/scripts/install-dev.sh
+++ b/scripts/install-dev.sh
@@ -1,49 +1,682 @@
 #!/usr/bin/env bash
 #
-# Local testing wrapper for install.sh.
+# Rune-Vault dev installer (sibling of install.sh).
 #
-# Uses the locally built binary instead of downloading from GitHub.
-# Skips cosign verification. Useful for testing the installer flow without
-# a published release.
+# Installs the runevault daemon from your local working tree — never from a
+# published release. Use this to verify in-progress source code on your local
+# machine or on a CSP VM (AWS, GCP, OCI) before cutting a release.
 #
 # Usage:
-#   mise run go:build                         # build the binary first
-#   sudo bash scripts/install-dev.sh          # full install to /opt/runevault
-#   bash scripts/install-dev.sh --prefix /tmp/vault-test  # rootless local test
+#   sudo bash scripts/install-dev.sh [options]
+#
+# Options:
+#   --target <local|aws|gcp|oci>  Install/uninstall target (default: prompt if TTY, else local)
+#   --install-dir <path>          CSP install dir (default: $HOME/rune-vault-<csp>)
+#   --prefix <dir>                Local-only: rootless test prefix
+#   --non-interactive             Skip all prompts; supply secrets via env vars
+#   --uninstall                   Forward uninstall to install.sh (local or CSP target)
+#   --force                       Forwarded to install.sh (local target only)
+#
+# Differences from install.sh:
+#   - Always installs from the local working tree (no GitHub release download).
+#   - For CSP targets, builds linux/amd64 in Docker (golang:1.25-bookworm) with
+#     --platform linux/amd64 — works on any host arch via qemu emulation.
+#   - cloud-init-dev / startup-script-dev only prepare the VM; install.sh runs
+#     over SSH after cloud-init finishes.
+#
+# Non-interactive env vars (CSP install — operator workstation):
+#   RUNEVAULT_ENVECTOR_ENDPOINT      enVector endpoint URL (required)
+#   RUNEVAULT_ENVECTOR_API_KEY       enVector API key (required)
+#   RUNEVAULT_TEAM_NAME              Team name (required)
+#   RUNEVAULT_TARGET                 Pre-select target without interactive menu
+#   RUNEVAULT_INSTALL_DIR            Pre-set CSP install directory
+#   RUNEVAULT_CSP_REGION             Cloud region
+#   RUNEVAULT_GCP_PROJECT_ID         GCP: project ID (required for GCP)
+#   RUNEVAULT_OCI_COMPARTMENT_ID     OCI: compartment OCID (required for OCI)
 
 set -euo pipefail
 
-REPO_ROOT=$(cd "$(dirname "$0")/.." && pwd)
-LOCAL_BINARY="${REPO_ROOT}/vault/bin/runevault"
+# ── Constants ──────────────────────────────────────────────────────────────────
+SCRIPT_DIR=$(cd "$(dirname "$0")" && pwd)
+REPO_ROOT=$(cd "${SCRIPT_DIR}/.." && pwd)
+LOCAL_BINARY_HOST="${REPO_ROOT}/vault/bin/runevault"
+TARGET_OS=linux
+TARGET_ARCH=amd64
+LINUX_BINARY="${REPO_ROOT}/vault/bin/runevault-${TARGET_OS}-${TARGET_ARCH}"
+BUILDER_IMAGE="golang:1.25-bookworm"
+GRPC_PORT=50051
 
-[[ -x "$LOCAL_BINARY" ]] || {
-  printf 'ERROR: Binary not found at %s\n' "$LOCAL_BINARY" >&2
-  printf '  Run: mise run go:build\n' >&2
-  exit 1
-}
+# Overridable by env (mirrors install.sh)
+TARGET="${RUNEVAULT_TARGET:-}"
+INSTALL_DIR_CSP="${RUNEVAULT_INSTALL_DIR:-}"
+CSP_PUBLIC_IP=""
+
+# CSP config (populated by dev_csp_prompt_config)
+TEAM_NAME=""
+ENVECTOR_ENDPOINT=""
+ENVECTOR_API_KEY=""
+CSP_REGION=""
+GCP_PROJECT_ID=""
+OCI_COMPARTMENT_ID=""
+
+# ── Color helpers (copied from install.sh) ─────────────────────────────────────
+if [[ -t 1 ]]; then
+  _RED='\033[0;31m' _GRN='\033[0;32m' _BLU='\033[0;34m' _YLW='\033[0;33m' _RST='\033[0m'
+else
+  _RED='' _GRN='' _BLU='' _YLW='' _RST=''
+fi
+die()     { printf "${_RED}ERROR:${_RST} %s\n" "$*" >&2; exit 1; }
+info()    { printf "${_BLU}==>${_RST} %s\n" "$*"; }
+success() { printf "${_GRN}✓${_RST} %s\n" "$*"; }
+warn()    { printf "${_YLW}WARNING:${_RST} %s\n" "$*" >&2; }
 
-# Parse --prefix for rootless local testing; pass all other args to install.sh
+# ── Argument parsing ───────────────────────────────────────────────────────────
 PREFIX=""
+NON_INTERACTIVE=0
+UNINSTALL=0
 PASSTHROUGH_ARGS=()
+
 while [[ $# -gt 0 ]]; do
   case $1 in
-    --prefix) PREFIX="$2"; shift 2 ;;
-    *)        PASSTHROUGH_ARGS+=("$1"); shift ;;
+    --target)          TARGET="$2"; shift 2 ;;
+    --install-dir)     INSTALL_DIR_CSP="$2"; shift 2 ;;
+    --prefix)          PREFIX="$2"; shift 2 ;;
+    --non-interactive) NON_INTERACTIVE=1; PASSTHROUGH_ARGS+=("$1"); shift ;;
+    --uninstall)       UNINSTALL=1; shift ;;
+    --force)           PASSTHROUGH_ARGS+=("$1"); shift ;;
+    *)                 PASSTHROUGH_ARGS+=("$1"); shift ;;
   esac
 done
 
-export RUNEVAULT_LOCAL_BINARY="$LOCAL_BINARY"
-export RUNEVAULT_SKIP_VERIFY=1
+# Auto-set non-interactive when stdin is not a TTY
+[[ -t 0 ]] || NON_INTERACTIVE=1
 
-if [[ -n "$PREFIX" ]]; then
-  export RUNEVAULT_INSTALL_PREFIX="$PREFIX"
-  export RUNEVAULT_BINARY_PATH="${PREFIX}/runevault"
-  export RUNEVAULT_SKIP_SERVICE=1
-fi
+# ── Platform detection ─────────────────────────────────────────────────────────
+case "$(uname -s)" in
+  Linux)  HOST_OS=linux ;;
+  Darwin) HOST_OS=darwin ;;
+  *)      die "Unsupported host OS: $(uname -s). Only Linux and macOS are supported." ;;
+esac
+case "$(uname -m)" in
+  x86_64|amd64)  HOST_ARCH=amd64 ;;
+  arm64|aarch64) HOST_ARCH=arm64 ;;
+  *)             die "Unsupported host architecture: $(uname -m)." ;;
+esac
+
+# ── Banner ─────────────────────────────────────────────────────────────────────
+print_banner() {
+  local commit
+  commit=$(cd "$REPO_ROOT" && git rev-parse --short HEAD 2>/dev/null || echo unknown)
+  printf '\n'
+  printf '  ╭───────────────────────────────────────────────────────────────────╮\n'
+  printf '  │  Rune-Vault dev installer                                         │\n'
+  printf '  │  Source: local working tree (not a published release)             │\n'
+  printf '  │  Commit: %-56s │\n' "$commit"
+  printf '  ╰───────────────────────────────────────────────────────────────────╯\n'
+  printf '\n'
+}
+
+# ── Helpers (mirror install.sh) ───────────────────────────────────────────────
+_prompt() {
+  local varname=$1 label=$2 default=${3:-}
+  [[ -n "${!varname:-}" ]] && return 0
+  local val
+  if [[ -n "$default" ]]; then
+    read -r -p "${label} [${default}]: " val
+    printf -v "$varname" '%s' "${val:-$default}"
+  else
+    read -r -p "${label}: " val
+    printf -v "$varname" '%s' "$val"
+  fi
+}
+
+# Escape for embedding inside a double-quoted Terraform string.
+escape_tf() { printf '%s' "$1" | sed 's/\\/\\\\/g; s/"/\\"/g'; }
+
+# Escape for embedding inside a single-quoted shell argument.
+# Replaces every ' with '\''.
+escape_single() {
+  local s=$1
+  printf '%s' "${s//\'/\'\\\'\'}"
+}
+
+# ── Target resolution (mirror install.sh:198–226) ─────────────────────────────
+resolve_target() {
+  if [[ -n "${TARGET:-}" ]]; then
+    case "$TARGET" in
+      local|aws|gcp|oci) ;;
+      *) die "Invalid --target value: ${TARGET}. Valid: local, aws, gcp, oci." ;;
+    esac
+    return 0
+  fi
+  if [[ "$NON_INTERACTIVE" -eq 0 && -t 0 ]]; then
+    local action="install"
+    [[ "$UNINSTALL" -eq 1 ]] && action="uninstall"
+    printf '  Select %s target:\n' "$action"
+    printf '    1) Local (this machine)\n'
+    printf '    2) AWS\n'
+    printf '    3) GCP\n'
+    printf '    4) OCI\n'
+    printf '\n'
+    local choice
+    read -r -p "  Choice [1]: " choice
+    case "${choice:-1}" in
+      1|local) TARGET=local ;;
+      2|aws)   TARGET=aws ;;
+      3|gcp)   TARGET=gcp ;;
+      4|oci)   TARGET=oci ;;
+      *) die "Invalid choice: ${choice}" ;;
+    esac
+  else
+    TARGET=local
+  fi
+}
+
+# ── Preflight ──────────────────────────────────────────────────────────────────
+dev_preflight() {
+  info "Running dev preflight checks..."
+
+  # Rootless local test (--prefix) is the one path that doesn't require sudo.
+  if [[ "$TARGET" != "local" || -z "$PREFIX" ]]; then
+    [[ "$(id -u)" -eq 0 ]] || die "This installer must be run as root (use sudo)."
+  fi
+
+  [[ -d "${REPO_ROOT}/vault" ]] \
+    || die "vault/ directory not found under ${REPO_ROOT}. Run from a clone of rune-admin."
+
+  local missing=()
+  for tool in git mise; do
+    command -v "$tool" >/dev/null 2>&1 || missing+=("$tool")
+  done
+  [[ ${#missing[@]} -gt 0 ]] && die "Missing required tools: ${missing[*]}"
+
+  if [[ "$TARGET" != "local" ]]; then
+    [[ -z "$PREFIX" ]] || die "--prefix is local-only."
+    dev_check_docker
+  fi
+
+  success "Preflight passed."
+}
+
+dev_check_docker() {
+  command -v docker >/dev/null 2>&1 \
+    || die "docker is required for CSP targets. Install Docker Desktop / Docker Engine and retry."
 
-# Dev defaults for non-interactive installs
-export RUNEVAULT_TEAM_NAME="${RUNEVAULT_TEAM_NAME:-dev-team}"
-export RUNEVAULT_ENVECTOR_ENDPOINT="${RUNEVAULT_ENVECTOR_ENDPOINT:-https://envector.example.com}"
-export RUNEVAULT_ENVECTOR_API_KEY="${RUNEVAULT_ENVECTOR_API_KEY:-dev-api-key-placeholder}"
+  local docker_user="${SUDO_USER:-$(id -un)}"
+  if ! sudo -u "$docker_user" -H bash -lc 'docker info' >/dev/null 2>&1; then
+    die "docker daemon is not reachable for user '${docker_user}'. Start Docker (Docker Desktop / 'colima start' / 'systemctl start docker') and retry."
+  fi
 
-exec bash "${REPO_ROOT}/install.sh" "${PASSTHROUGH_ARGS[@]+"${PASSTHROUGH_ARGS[@]}"}"
+  # Cross-arch builder probe — fails fast if binfmt handlers are missing.
+  if ! sudo -u "$docker_user" -H bash -lc \
+    "docker run --rm --platform ${TARGET_OS}/${TARGET_ARCH} alpine:latest true" >/dev/null 2>&1; then
+    die "docker cannot run ${TARGET_OS}/${TARGET_ARCH} images. Install qemu binfmt handlers:
+       docker run --rm --privileged tonistiigi/binfmt --install all"
+  fi
+}
+
+# ── Build ──────────────────────────────────────────────────────────────────────
+dev_build_local_binary() {
+  info "Building runevault for host (${HOST_OS}/${HOST_ARCH})..."
+  local build_user="${SUDO_USER:-$(id -un)}"
+  (cd "$REPO_ROOT" && sudo -u "$build_user" -H bash -lc 'mise run go:build')
+  [[ -x "$LOCAL_BINARY_HOST" ]] || die "Build did not produce ${LOCAL_BINARY_HOST}."
+  success "Built: ${LOCAL_BINARY_HOST}"
+}
+
+dev_build_linux_binary() {
+  info "Building runevault for ${TARGET_OS}/${TARGET_ARCH} via Docker (${BUILDER_IMAGE})..."
+  local build_user="${SUDO_USER:-$(id -un)}"
+  local user_home commit version date pkg
+  user_home="${SUDO_USER:+$(eval echo ~"${SUDO_USER}")}"
+  user_home="${user_home:-$HOME}"
+  commit=$(cd "$REPO_ROOT" && git rev-parse --short HEAD 2>/dev/null || echo none)
+  version=dev
+  date=$(date -u +%Y-%m-%dT%H:%M:%SZ)
+  pkg="github.com/CryptoLabInc/rune-admin/vault/internal/commands"
+
+  local ldflags="-X '${pkg}.buildVersion=${version}' -X '${pkg}.buildCommit=${commit}' -X '${pkg}.buildDate=${date}'"
+  local out_rel="bin/runevault-${TARGET_OS}-${TARGET_ARCH}"
+
+  mkdir -p "${user_home}/go/pkg/mod"
+  mkdir -p "${REPO_ROOT}/vault/bin"
+  [[ -n "${SUDO_USER:-}" ]] && chown "${SUDO_USER}" "${REPO_ROOT}/vault/bin"
+
+  # Run docker as the invoking user so written files are owned correctly and
+  # the user's go module cache is reused for speed.
+  sudo -u "$build_user" -H docker run --rm \
+    --platform "${TARGET_OS}/${TARGET_ARCH}" \
+    -v "${REPO_ROOT}/vault:/src" \
+    -v "${user_home}/go/pkg/mod:/go/pkg/mod" \
+    -w /src \
+    -e CGO_ENABLED=1 \
+    -e LDFLAGS="$ldflags" \
+    -e OUTPUT="$out_rel" \
+    "${BUILDER_IMAGE}" \
+    bash -c '
+      set -e
+      apt-get update -qq && apt-get install -y -qq libssl-dev >/dev/null
+      go build -ldflags "$LDFLAGS" -o "$OUTPUT" ./cmd
+    ' || die "Docker build failed."
+
+  [[ -x "$LINUX_BINARY" ]] || die "Build did not produce ${LINUX_BINARY}."
+  success "Built: ${LINUX_BINARY}"
+}
+
+# ── Local config prompts (mirror dev_csp_prompt_config) ───────────────────────
+dev_local_prompt_config() {
+  if [[ "$NON_INTERACTIVE" -eq 0 ]]; then
+    printf '\n'
+    printf '══════════════════════════════════════════════════════════\n'
+    printf '  Local install configuration (dev mode)\n'
+    printf '══════════════════════════════════════════════════════════\n'
+    printf '\n'
+
+    _prompt RUNEVAULT_TEAM_NAME         "Team name"         "devteam"
+    _prompt RUNEVAULT_ENVECTOR_ENDPOINT "enVector endpoint" ""
+    _prompt RUNEVAULT_ENVECTOR_API_KEY  "enVector API key"  ""
+    printf '\n'
+
+    [[ -n "${RUNEVAULT_ENVECTOR_ENDPOINT:-}" ]] || die "enVector endpoint is required."
+    [[ -n "${RUNEVAULT_ENVECTOR_API_KEY:-}" ]]  || die "enVector API key is required."
+  else
+    RUNEVAULT_TEAM_NAME="${RUNEVAULT_TEAM_NAME:-devteam}"
+    RUNEVAULT_ENVECTOR_ENDPOINT="${RUNEVAULT_ENVECTOR_ENDPOINT:-https://envector.example.com}"
+    RUNEVAULT_ENVECTOR_API_KEY="${RUNEVAULT_ENVECTOR_API_KEY:-dev-api-key-placeholder}"
+  fi
+}
+
+# ── Local install branch ──────────────────────────────────────────────────────
+dev_local_install() {
+  dev_build_local_binary
+  dev_local_prompt_config
+
+  export RUNEVAULT_LOCAL_BINARY="$LOCAL_BINARY_HOST"
+  export RUNEVAULT_SKIP_VERIFY=1
+  export RUNEVAULT_TEAM_NAME
+  export RUNEVAULT_ENVECTOR_ENDPOINT
+  export RUNEVAULT_ENVECTOR_API_KEY
+
+  if [[ -n "$PREFIX" ]]; then
+    export RUNEVAULT_INSTALL_PREFIX="$PREFIX"
+    export RUNEVAULT_BINARY_PATH="${PREFIX}/runevault"
+    export RUNEVAULT_SKIP_SERVICE=1
+  fi
+
+  exec bash "${REPO_ROOT}/install.sh" --target local "${PASSTHROUGH_ARGS[@]+"${PASSTHROUGH_ARGS[@]}"}"
+}
+
+# ── Uninstall forward ─────────────────────────────────────────────────────────
+# install-dev.sh defers all uninstall logic to install.sh. install.sh handles
+# both local (service + files) and CSP (terraform destroy + dir cleanup).
+dev_forward_uninstall() {
+  info "Forwarding uninstall to install.sh (target: ${TARGET})..."
+  local args=(--uninstall --target "$TARGET")
+  [[ -n "$INSTALL_DIR_CSP" ]] && args+=(--install-dir "$INSTALL_DIR_CSP")
+  [[ "$NON_INTERACTIVE" -eq 1 ]] && args+=(--non-interactive)
+
+  if [[ "$TARGET" = "local" && -n "$PREFIX" ]]; then
+    export RUNEVAULT_INSTALL_PREFIX="$PREFIX"
+    export RUNEVAULT_BINARY_PATH="${PREFIX}/runevault"
+  fi
+
+  exec bash "${REPO_ROOT}/install.sh" "${args[@]}"
+}
+
+# ── CSP preflight (mirror install.sh:228–285) ─────────────────────────────────
+dev_csp_preflight() {
+  local csp=$1
+  info "Running CSP preflight checks for ${csp}..."
+
+  command -v terraform >/dev/null 2>&1 \
+    || die "terraform is not installed. Install it (https://developer.hashicorp.com/terraform/install) and retry."
+
+  local csp_cli auth_cmd auth_setup
+  case "$csp" in
+    aws)
+      csp_cli=aws
+      auth_cmd='aws sts get-caller-identity'
+      auth_setup='aws configure'
+      ;;
+    gcp)
+      csp_cli=gcloud
+      auth_cmd='gcloud auth application-default print-access-token'
+      auth_setup='gcloud auth application-default login'
+      ;;
+    oci)
+      csp_cli=oci
+      auth_cmd='oci iam region list'
+      auth_setup='oci setup config'
+      ;;
+  esac
+
+  local tf_user="${SUDO_USER:-$(id -un)}"
+
+  if ! sudo -u "$tf_user" -H bash -lc "command -v ${csp_cli}" >/dev/null 2>&1; then
+    die "'${csp_cli}' CLI not found in PATH for user '${tf_user}'. Install it and re-run."
+  fi
+
+  if ! sudo -u "$tf_user" -H bash -lc "${auth_cmd}" >/dev/null 2>&1; then
+    die "'${csp_cli}' is not authenticated for user '${tf_user}'. Authenticate and re-run: ${auth_setup}"
+  fi
+
+  success "CSP preflight passed."
+}
+
+# ── CSP config prompts (mirror install.sh:287–347) ────────────────────────────
+dev_csp_prompt_config() {
+  local csp=$1
+
+  if [[ "$NON_INTERACTIVE" -eq 0 ]]; then
+    printf '\n'
+    printf '══════════════════════════════════════════════════════════\n'
+    printf '  Cloud deployment configuration (dev mode)\n'
+    printf '══════════════════════════════════════════════════════════\n'
+    printf '\n'
+
+    _prompt TEAM_NAME          "Team name"          "devteam"
+    _prompt ENVECTOR_ENDPOINT  "enVector endpoint"  ""
+    _prompt ENVECTOR_API_KEY   "enVector API key"   ""
+
+    case "$csp" in
+      aws) _prompt CSP_REGION "AWS region"   "us-east-1"   ;;
+      gcp)
+        _prompt CSP_REGION    "GCP region"   "us-central1"
+        _prompt GCP_PROJECT_ID "GCP project ID" ""
+        ;;
+      oci)
+        _prompt CSP_REGION         "OCI region"          "us-ashburn-1"
+        _prompt OCI_COMPARTMENT_ID "OCI compartment OCID" ""
+        ;;
+    esac
+    printf '\n'
+  else
+    TEAM_NAME="${RUNEVAULT_TEAM_NAME:-}"
+    ENVECTOR_ENDPOINT="${RUNEVAULT_ENVECTOR_ENDPOINT:-}"
+    ENVECTOR_API_KEY="${RUNEVAULT_ENVECTOR_API_KEY:-}"
+    CSP_REGION="${RUNEVAULT_CSP_REGION:-}"
+    GCP_PROJECT_ID="${RUNEVAULT_GCP_PROJECT_ID:-}"
+    OCI_COMPARTMENT_ID="${RUNEVAULT_OCI_COMPARTMENT_ID:-}"
+
+    local missing=()
+    [[ -z "$TEAM_NAME" ]]         && missing+=("RUNEVAULT_TEAM_NAME")
+    [[ -z "$ENVECTOR_ENDPOINT" ]] && missing+=("RUNEVAULT_ENVECTOR_ENDPOINT")
+    [[ -z "$ENVECTOR_API_KEY" ]]  && missing+=("RUNEVAULT_ENVECTOR_API_KEY")
+    [[ "$csp" = gcp && -z "$GCP_PROJECT_ID" ]]      && missing+=("RUNEVAULT_GCP_PROJECT_ID")
+    [[ "$csp" = oci && -z "$OCI_COMPARTMENT_ID" ]]  && missing+=("RUNEVAULT_OCI_COMPARTMENT_ID")
+    if [[ ${#missing[@]} -gt 0 ]]; then
+      printf 'ERROR: Missing required env vars:\n' >&2
+      for v in "${missing[@]}"; do printf '  %s\n' "$v" >&2; done
+      exit 1
+    fi
+  fi
+
+  [[ -n "$TEAM_NAME" ]]          || die "Team name is required."
+  [[ -n "$ENVECTOR_ENDPOINT" ]]  || die "enVector endpoint is required."
+  [[ -n "$ENVECTOR_API_KEY" ]]   || die "enVector API key is required."
+  if [[ "$csp" = gcp ]]; then
+    [[ -n "$GCP_PROJECT_ID" ]]     || die "GCP project ID is required."
+  fi
+  if [[ "$csp" = oci ]]; then
+    [[ -n "$OCI_COMPARTMENT_ID" ]] || die "OCI compartment OCID is required."
+  fi
+}
+
+# ── SSH key (identical to install.sh:349–361) ─────────────────────────────────
+dev_csp_generate_ssh_key() {
+  local key_path="${INSTALL_DIR_CSP}/ssh_key"
+  if [[ -f "$key_path" ]]; then
+    info "SSH key already exists: ${key_path}"
+    return 0
+  fi
+  ssh-keygen -t ed25519 -N '' -f "$key_path" -q
+  chmod 0600 "$key_path"
+  chmod 0644 "${key_path}.pub"
+  [[ -n "${SUDO_USER:-}" ]] \
+    && chown "${SUDO_USER}" "$key_path" "${key_path}.pub"
+  success "SSH key generated: ${key_path}"
+}
+
+# ── Terraform files (mirror install.sh:373–399, swap to *-dev variants) ──────
+dev_csp_copy_terraform_files() {
+  local csp=$1
+  local tf_src="${REPO_ROOT}/deployment/${csp}"
+  local tf_dest="${INSTALL_DIR_CSP}/deployment"
+  mkdir -p "$tf_dest"
+
+  cp "${tf_src}/main.tf" "${tf_dest}/main.tf"
+
+  # Use the *-dev variant of cloud-init / startup-script, but rename to the
+  # canonical filename so main.tf's templatefile() reference keeps working
+  # without Terraform changes.
+  case "$csp" in
+    aws)
+      [[ -f "${tf_src}/cloud-init-dev.yaml" ]] \
+        || die "Missing ${tf_src}/cloud-init-dev.yaml."
+      cp "${tf_src}/cloud-init-dev.yaml" "${tf_dest}/cloud-init.yaml"
+      ;;
+    gcp|oci)
+      [[ -f "${tf_src}/startup-script-dev.sh" ]] \
+        || die "Missing ${tf_src}/startup-script-dev.sh."
+      cp "${tf_src}/startup-script-dev.sh" "${tf_dest}/startup-script.sh"
+      ;;
+  esac
+
+  printf '*.tfvars\nterraform.tfstate*\n.terraform/\n' > "${INSTALL_DIR_CSP}/.gitignore"
+  [[ -n "${SUDO_USER:-}" ]] && chown -R "${SUDO_USER}" "$tf_dest" "${INSTALL_DIR_CSP}/.gitignore"
+  success "Terraform files (dev variant) ready: ${tf_dest}"
+}
+
+# ── tfvars (mirror install.sh:403–439) ────────────────────────────────────────
+dev_csp_render_tfvars() {
+  local csp=$1
+  local tf_dir="${INSTALL_DIR_CSP}/deployment"
+  local tfvars="${tf_dir}/terraform.tfvars"
+  local public_key=""
+
+  if [[ -f "${tf_dir}/terraform.tfstate" ]]; then
+    if [[ "$NON_INTERACTIVE" -eq 0 ]]; then
+      local answer=n
+      read -r -p "terraform.tfstate already exists in ${tf_dir}. Re-apply? [y/N] " answer
+      [[ "$answer" =~ ^[Yy] ]] || { info "Aborted."; exit 0; }
+    else
+      warn "terraform.tfstate exists — re-applying (idempotent)."
+    fi
+  fi
+
+  [[ -f "${INSTALL_DIR_CSP}/ssh_key.pub" ]] \
+    && public_key=$(cat "${INSTALL_DIR_CSP}/ssh_key.pub")
+
+  {
+    printf 'team_name          = "%s"\n' "$(escape_tf "${TEAM_NAME:-default}")"
+    printf 'tls_mode           = "self-signed"\n'
+    printf 'envector_endpoint  = "%s"\n' "$(escape_tf "${ENVECTOR_ENDPOINT}")"
+    printf 'envector_api_key   = "%s"\n' "$(escape_tf "${ENVECTOR_API_KEY}")"
+    printf 'runevault_version  = "dev"\n'
+    printf 'public_key         = "%s"\n' "$(escape_tf "${public_key}")"
+    printf 'region             = "%s"\n' "$(escape_tf "${CSP_REGION}")"
+    case "$csp" in
+      gcp) printf 'project_id         = "%s"\n' "$(escape_tf "${GCP_PROJECT_ID}")" ;;
+      oci) printf 'compartment_id     = "%s"\n' "$(escape_tf "${OCI_COMPARTMENT_ID}")" ;;
+    esac
+  } > "$tfvars"
+
+  chmod 0600 "$tfvars"
+  [[ -n "${SUDO_USER:-}" ]] && chown "${SUDO_USER}" "$tfvars"
+  success "terraform.tfvars written: ${tfvars}"
+}
+
+# ── Terraform apply (mirror install.sh:441–453) ───────────────────────────────
+dev_csp_run_terraform() {
+  local tf_dir="${INSTALL_DIR_CSP}/deployment"
+  local tf_user="${SUDO_USER:-$(id -un)}"
+
+  info "Running terraform init..."
+  (cd "$tf_dir" && sudo -u "$tf_user" terraform init -input=false)
+  info "Running terraform apply..."
+  (cd "$tf_dir" && sudo -u "$tf_user" terraform apply -auto-approve -input=false)
+
+  chmod 0600 "${tf_dir}/terraform.tfstate" 2>/dev/null || true
+  chmod 0600 "${tf_dir}/terraform.tfstate.backup" 2>/dev/null || true
+  success "Terraform apply complete."
+}
+
+# ── Upload + remote install (replaces csp_post_deploy for dev mode) ───────────
+dev_csp_upload_and_install() {
+  local csp=$1
+  local tf_dir="${INSTALL_DIR_CSP}/deployment"
+  local tf_user="${SUDO_USER:-$(id -un)}"
+  local key_path="${INSTALL_DIR_CSP}/ssh_key"
+  local ssh_user=ubuntu
+
+  local public_ip
+  public_ip=$(cd "$tf_dir" && sudo -u "$tf_user" terraform output -raw vault_public_ip 2>/dev/null) \
+    || die "Could not read vault_public_ip from terraform output."
+  CSP_PUBLIC_IP="$public_ip"
+
+  local ssh_opts="-o BatchMode=yes -o StrictHostKeyChecking=no -o ConnectTimeout=15"
+  local ssh_prefix="sudo -u ${tf_user}"
+
+  # 1. Wait for SSH on the VM.
+  info "Waiting for SSH on ${ssh_user}@${public_ip} (up to 30 min)..."
+  local timeout_secs=1800
+  local deadline=$(( $(date +%s) + timeout_secs ))
+  local ssh_ready=0
+  while [[ $(date +%s) -lt $deadline ]]; do
+    # shellcheck disable=SC2086
+    if $ssh_prefix ssh $ssh_opts -i "$key_path" "${ssh_user}@${public_ip}" true 2>/dev/null; then
+      ssh_ready=1
+      break
+    fi
+    sleep 15
+  done
+  [[ "$ssh_ready" -eq 1 ]] \
+    || die "Timed out waiting for SSH. ssh -i ${key_path} ${ssh_user}@${public_ip}"
+  success "SSH reachable."
+
+  # 2. Wait for cloud-init-dev to finish (cosign is the last thing it installs).
+  info "Waiting for cloud-init-dev to finish (cosign + apt prereqs)..."
+  deadline=$(( $(date +%s) + 600 ))
+  local prereqs_ready=0
+  while [[ $(date +%s) -lt $deadline ]]; do
+    # shellcheck disable=SC2086
+    if $ssh_prefix ssh $ssh_opts -i "$key_path" "${ssh_user}@${public_ip}" \
+         "test -x /usr/local/bin/cosign && test -x /usr/bin/openssl" 2>/dev/null; then
+      prereqs_ready=1
+      break
+    fi
+    sleep 10
+  done
+  [[ "$prereqs_ready" -eq 1 ]] \
+    || die "Timed out waiting for cloud-init-dev. SSH in to debug: ssh -i ${key_path} ${ssh_user}@${public_ip}"
+  success "Cloud-init-dev complete."
+
+  # 3. SCP install.sh + linux/amd64 binary to /tmp.
+  info "Uploading install.sh and runevault binary to ${public_ip}..."
+  # shellcheck disable=SC2086
+  $ssh_prefix scp $ssh_opts -i "$key_path" \
+    "${REPO_ROOT}/install.sh" \
+    "${LINUX_BINARY}" \
+    "${ssh_user}@${public_ip}:/tmp/" \
+    || die "SCP upload failed."
+  success "Artifacts uploaded."
+
+  # 4. Run install.sh on the VM with dev hooks.
+  info "Running install.sh on the VM..."
+  local tn ee ek
+  tn=$(escape_single "$TEAM_NAME")
+  ee=$(escape_single "$ENVECTOR_ENDPOINT")
+  ek=$(escape_single "$ENVECTOR_API_KEY")
+  local remote_cmd
+  remote_cmd="sudo \
+    RUNEVAULT_LOCAL_BINARY=/tmp/runevault-${TARGET_OS}-${TARGET_ARCH} \
+    RUNEVAULT_SKIP_VERIFY=1 \
+    RUNEVAULT_TEAM_NAME='${tn}' \
+    RUNEVAULT_ENVECTOR_ENDPOINT='${ee}' \
+    RUNEVAULT_ENVECTOR_API_KEY='${ek}' \
+    bash /tmp/install.sh --target local --non-interactive --version dev"
+
+  # shellcheck disable=SC2086
+  $ssh_prefix ssh $ssh_opts -i "$key_path" "${ssh_user}@${public_ip}" "$remote_cmd" \
+    || die "Remote install.sh failed. SSH in to debug: ssh -i ${key_path} ${ssh_user}@${public_ip}"
+  success "Remote install complete."
+
+  # 5. Pull CA cert back to the operator workstation.
+  info "Fetching CA certificate..."
+  mkdir -p "${INSTALL_DIR_CSP}/certs"
+  [[ -n "${SUDO_USER:-}" ]] && chown "${SUDO_USER}" "${INSTALL_DIR_CSP}/certs"
+  # shellcheck disable=SC2086
+  $ssh_prefix scp $ssh_opts -i "$key_path" \
+    "${ssh_user}@${public_ip}:/opt/runevault/certs/ca.pem" \
+    "${INSTALL_DIR_CSP}/certs/ca.pem" \
+    || die "CA cert fetch failed."
+  success "CA certificate saved: ${INSTALL_DIR_CSP}/certs/ca.pem"
+}
+
+# ── Summary (mirror install.sh:491–518 + dev banner) ──────────────────────────
+dev_csp_summary() {
+  local csp=$1
+  local tf_dir="${INSTALL_DIR_CSP}/deployment"
+  local key_path="${INSTALL_DIR_CSP}/ssh_key"
+  local public_ip="${CSP_PUBLIC_IP:-<unknown>}"
+  local commit
+  commit=$(cd "$REPO_ROOT" && git rev-parse --short HEAD 2>/dev/null || echo unknown)
+
+  printf '\n'
+  success "Rune-Vault deployed to $(printf '%s' "$csp" | tr 'a-z' 'A-Z') (dev mode)."
+  printf '\n'
+  printf '  Endpoint:  %s:%s\n' "$public_ip" "$GRPC_PORT"
+  printf '  CA cert:   %s\n'    "${INSTALL_DIR_CSP}/certs/ca.pem"
+  printf '  SSH:       ssh -i %s ubuntu@%s\n' "$key_path" "$public_ip"
+  printf '  Terraform: %s\n'    "$tf_dir"
+  printf '  Source:    local working tree (commit %s)\n' "$commit"
+  printf '\n'
+  printf 'Tear down:\n'
+  printf '  cd %s && terraform destroy -auto-approve\n' "$tf_dir"
+  printf '\n'
+  printf 'Next steps (SSH into the VM, then run on the VM):\n'
+  printf '  ssh -i %s ubuntu@%s\n' "$key_path" "$public_ip"
+  printf '\n'
+  printf '  Issue a token:  runevault token issue --user <name> --role member\n'
+  printf '  Check status:   runevault status\n'
+  printf '  View logs:      runevault logs\n'
+  printf '  Manage daemon:  sudo systemctl start|stop|restart runevault\n'
+  printf '\n'
+  warn "BACKUP: Keep this safe — it cannot be recovered if lost:"
+  warn "  Terraform state: ${tf_dir}/terraform.tfstate"
+}
+
+# ── CSP dispatch (mirror install.sh:520–549) ──────────────────────────────────
+dev_csp_dispatch() {
+  local csp="$TARGET"
+  local user_home="${SUDO_USER:+$(eval echo ~"${SUDO_USER}")}"
+  user_home="${user_home:-$HOME}"
+  INSTALL_DIR_CSP="${INSTALL_DIR_CSP:-${user_home}/rune-vault-${csp}}"
+  mkdir -p "$INSTALL_DIR_CSP"
+  [[ -n "${SUDO_USER:-}" ]] && chown "${SUDO_USER}" "$INSTALL_DIR_CSP"
+
+  dev_csp_preflight "$csp"
+  dev_csp_prompt_config "$csp"
+  dev_csp_generate_ssh_key
+  dev_build_linux_binary
+  dev_csp_copy_terraform_files "$csp"
+  dev_csp_render_tfvars "$csp"
+  dev_csp_run_terraform
+  dev_csp_upload_and_install "$csp"
+  dev_csp_summary "$csp"
+  exit 0
+}
+
+# ── Main ───────────────────────────────────────────────────────────────────────
+print_banner
+resolve_target
+
+[[ "$UNINSTALL" -eq 1 ]] && dev_forward_uninstall
+
+dev_preflight
+
+if [[ "$TARGET" = "local" ]]; then
+  dev_local_install
+else
+  dev_csp_dispatch
+fi

From c5c09ed93645b3e1b3c8a3b47aedc3509d43acfc Mon Sep 17 00:00:00 2001
From: Jeonghwan Lee <jhlee@cryptolab.co.kr>
Date: Thu, 30 Apr 2026 10:24:16 +0900
Subject: [PATCH 21/27] docs: refresh markdown docs for Go migration and CSP
 installer

Realign README, CONTRIBUTING, ARCHITECTURE, AGENTS, and tests/FIXTURES
with the actual state of epic/go-migration: single-binary `runevault`
daemon, native systemd/launchd service, admin Unix domain socket,
YAML-only config (`runevault.conf`), install.sh with --target
local|aws|gcp|oci, scripts/install-dev.sh sibling, Sigstore-signed
release pipeline, and Ubuntu 24.04 cloud images. Drop stale references
to Python modules, Docker Compose / GHCR, port-8081 HTTP admin,
env-var fallback, and aspirational HA / restore-from-backup terraform
variables that don't exist. Add an [Unreleased] CHANGELOG section
capturing the BREAKING Go rewrite plus the installer, CSP, and release
pipeline work landed on this branch.
---
 AGENTS.md            |   9 +-
 CHANGELOG.md         |  31 +++++
 CONTRIBUTING.md      |  75 +++++++----
 README.md            | 159 ++++++++++++++--------
 docs/ARCHITECTURE.md | 310 +++++++++++++++++++++----------------------
 tests/FIXTURES.md    |   2 +-
 6 files changed, 337 insertions(+), 249 deletions(-)

diff --git a/AGENTS.md b/AGENTS.md
index c86beb2..82f38bd 100644
--- a/AGENTS.md
+++ b/AGENTS.md
@@ -16,10 +16,11 @@ Do NOT run go, gofmt, or buf directly.
 | Command | Description |
 |---------|-------------|
 | `mise run setup` | Bootstrap (Go modules + proto stubs) |
-| `mise run check` | All checks: gofmt + go vet + go test (race) |
-| `mise run go:build` | Build the runevault binary |
-| `mise run go:test` | Run Go unit + integration tests with race detector |
-| `mise run go:test:unit` | Run Go unit tests only (skip CLI smoke E2E) |
+| `mise run check` | All checks: gofmt + go vet + unit tests (race) |
+| `mise run go:build` | Build the runevault binary to `vault/bin/runevault` |
+| `mise run go:test` | Run all tests including E2E (requires `RUNEVAULT_TEST_BINARY`) |
+| `mise run go:test:unit` | Run unit tests only (E2E excluded by build tag) |
+| `mise run go:test:e2e` | Run E2E tests against pre-built binary (run `go:build` first) |
 | `mise run go:vet` | Run go vet on all Go packages |
 | `mise run go:fmt` | Format Go source files |
 | `mise run go:fmt:check` | Check Go formatting without modifying |
diff --git a/CHANGELOG.md b/CHANGELOG.md
index 46e6b53..e155a8b 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -5,6 +5,37 @@ All notable changes to Rune-Vault will be documented in this file.
 The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.0.0/),
 and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0.html).
 
+## [Unreleased]
+
+### ⚠ BREAKING CHANGES
+
+- **Vault rewritten in Go as the single binary `runevault`** (#61). YAML config (`runevault.conf`) is now the only configuration source — env-var fallback removed, no migration helper, no deprecation banners. Existing Python-based deployments must be reinstalled via `install.sh`.
+
+### Added
+
+- Production installer `install.sh` with `--target local|aws|gcp|oci`, Sigstore signature verification, systemd/launchd service registration, and `--uninstall` flow
+- Dev installer `scripts/install-dev.sh` (structural sibling of `install.sh`) for local/CSP testing without GitHub releases
+- CSP provisioning via Terraform for AWS, GCP, and OCI: preflight CLI/auth checks, cloud-init bootstrap, CA-cert SCP polling
+- CSP uninstall flow that wraps `terraform destroy`
+- `runevault status` (daemon + admin-socket health) and `runevault logs` (audit log tail) subcommands
+- `runevault` group lets members run the CLI without `sudo`
+- Multi-platform release pipeline (linux/darwin × amd64/arm64) with `SHA256SUMS` + Sigstore keyless signing
+- `EnsureVault` startup hook to activate keys and ensure index on first run
+
+### Changed
+
+- Cloud VM images bumped to Ubuntu 24.04 LTS
+- OCI SCP user is now `ubuntu`
+- Daemon lifecycle delegated to the OS service manager (systemd / launchd) instead of Docker
+- Admin transport: HTTP on `127.0.0.1:8081` → Unix domain socket at `/opt/runevault/admin.sock` (mode 0600)
+- Token / role storage: standalone `vault-tokens.yml` / `vault-roles.yml` → fields under `runevault.conf` with `*_file` indirection support
+
+### Removed
+
+- Python sources, `docker-compose.yml`, `Dockerfile`, GHCR-published Docker image
+- `pyenvector` runtime dependency
+- Env-var configuration fallback (`VAULT_TLS_DISABLE`, `VAULT_TEAM_SECRET`, `VAULT_AUDIT_LOG`, etc.)
+
 ## [0.3.0] - 2026-04-07
 
 ### ⚠ BREAKING CHANGES
diff --git a/CONTRIBUTING.md b/CONTRIBUTING.md
index 209b466..4b5aa7c 100644
--- a/CONTRIBUTING.md
+++ b/CONTRIBUTING.md
@@ -36,8 +36,8 @@ Feature requests should include:
 - [mise](https://mise.jdx.dev): `curl https://mise.jdx.dev/install.sh | sh`
 
 **CSP deployment only:**
-- Access to cloud provider (OCI/AWS/GCP)
-- GitHub CLI (`gh`) with GHCR push access to the CryptoLabInc organization
+- Access to a cloud provider (AWS, GCP, or OCI) and the matching CLI authenticated locally
+- Docker (used by `scripts/install-dev.sh` to cross-compile a Linux/amd64 binary for cloud VMs)
 
 ### Local Setup
 
@@ -55,7 +55,7 @@ Feature requests should include:
 
 3. **Verify setup**
    ```bash
-   mise run test:unit  # Run unit tests to verify
+   mise run go:test:unit  # Run unit tests to verify
    ```
 
 4. **(Optional) Activate mise in your shell**
@@ -69,7 +69,7 @@ Feature requests should include:
 
 All commands **must** be run via `mise run` to ensure correct tool versions.
 
-See [CLAUDE.md](CLAUDE.md#commands) for the complete task table.
+See [CLAUDE.md](CLAUDE.md#commands) (or [AGENTS.md](AGENTS.md#commands)) for the complete task table.
 
 ## Testing
 
@@ -79,22 +79,23 @@ See [CLAUDE.md](CLAUDE.md#commands) for the complete task table.
 vault/internal/
 ├── tokens/        # Token store + role/rate-limit unit tests
 ├── crypto/        # HKDF + AES-CTR + envector-go-sdk wrappers
-├── server/        # gRPC handlers, interceptors, audit, admin UDS, pidfile
+├── server/        # gRPC handlers, interceptors, audit, admin UDS, config
 ├── commands/      # CLI subcommands + admin client
-├── integration/   # E2E: decrypt pipeline (fixture-based) + CLI smoke
-└── testutil/      # Fixture path resolver
+└── tests/         # E2E (build tag `e2e`): decrypt pipeline (fixture-based) + CLI smoke
 ```
 
 ### Running Tests
 
 ```bash
-mise run go:test          # All tests with race detector
-mise run go:test:unit     # Skip CLI smoke E2E (faster)
+mise run go:test:unit     # Unit tests only (E2E excluded by build tag)
+mise run go:build         # Build vault/bin/runevault first…
+mise run go:test:e2e      # …then run E2E against the built binary
+mise run go:test          # All tests including E2E (requires RUNEVAULT_TEST_BINARY)
 ```
 
 ### Test Fixtures
 
-Integration tests use GPG-encrypted fixtures containing FHE keys and ciphertext blobs. See [tests/FIXTURES.md](tests/FIXTURES.md) for the full update procedure, including passphrase rotation and re-encryption steps. The fixture-based decrypt-pipeline test under `vault/internal/integration/` skips automatically when `tests/fixtures/` is not decrypted.
+Integration tests use GPG-encrypted fixtures containing FHE keys and ciphertext blobs. See [tests/FIXTURES.md](tests/FIXTURES.md) for the full update procedure, including passphrase rotation and re-encryption steps. The fixture-based decrypt-pipeline test under `vault/internal/tests/` skips automatically when `tests/fixtures/` is not decrypted.
 
 ### Test Requirements
 
@@ -145,22 +146,29 @@ Integration tests use GPG-encrypted fixtures containing FHE keys and ciphertext
 ### Local Testing
 
 ```bash
-mise run dev    # Start local Vault via Docker Compose
-mise run build  # Build Docker image locally
+mise run dev         # Run runevault daemon in foreground (uses vault/dev/runevault.conf)
+mise run go:build    # Build runevault binary to vault/bin/runevault
 ```
 
 ### Testing the Installer Locally
 
-Use `scripts/install-dev.sh` to test the full installation flow using local working tree files instead of downloading from GitHub.
+`scripts/install-dev.sh` is a structural sibling of `install.sh` that
+exercises the full install flow against a locally built binary instead
+of a published GitHub release.
 
 ```bash
-sudo bash scripts/install-dev.sh
+# Local install into a rootless prefix (no service registration)
+RUNEVAULT_SKIP_SERVICE=1 \
+  bash scripts/install-dev.sh --target local --prefix "$HOME/runevault-test"
+
+# Cloud install: cross-compiles linux/amd64 in golang:1.25-bookworm,
+# uploads via SCP, and runs install.sh on the remote VM.
+bash scripts/install-dev.sh --target oci --install-dir "$HOME/rune-vault-oci"
 ```
 
-This script behaves identically to `install.sh` but:
-- Copies `docker-compose.yml`, TLS scripts, and Terraform configs from the local repo
-- Uses a locally built Docker image (`mise run build`) instead of pulling from GHCR
-- Requires no network access to GitHub
+Flags mirror `install.sh`: `--target`, `--install-dir`, `--prefix`,
+`--non-interactive`, `--uninstall`, `--force`. Uninstall is delegated to
+`install.sh --uninstall`.
 
 ## Submitting Changes
 
@@ -233,12 +241,23 @@ Closes #123
 
 ```
 rune-admin/
-├── vault/                  # Rune-Vault gRPC server (see [Architecture](docs/ARCHITECTURE.md))
-├── deployment/            # Terraform configs (OCI, AWS, GCP) + monitoring
+├── vault/
+│   ├── cmd/                       # runevault binary entry point
+│   ├── internal/                  # commands, server, tokens, crypto, tests
+│   ├── pkg/vaultpb/               # generated gRPC stubs
+│   ├── proto/                     # .proto source
+│   └── dev/                       # local dev config (gitignored)
+├── deployment/
+│   ├── aws/  gcp/  oci/           # Terraform per CSP
+│   ├── systemd/runevault.service  # Linux service unit
+│   └── launchd/com.cryptolabinc.runevault.plist  # macOS service
 ├── scripts/
-├── tests/                 # Unit, integration tests
-├── docs/                  # Architecture docs
-└── install.sh             # Interactive installer
+│   ├── install-dev.sh             # Dev sibling of install.sh
+│   ├── generate-certs.sh          # Self-signed TLS certs for dev
+│   └── generate-test-fixtures.py  # Generates GPG-encrypted test fixtures
+├── tests/                         # Encrypted fixture archive (see FIXTURES.md)
+├── docs/ARCHITECTURE.md           # Architecture & data flow
+└── install.sh                     # Production installer (Sigstore-verified)
 ```
 
 ## Vault Architecture
@@ -247,11 +266,11 @@ Core server code is in `vault/`. See [docs/ARCHITECTURE.md](docs/ARCHITECTURE.md
 
 ## Security Considerations
 
-- Secret key (`vault_keys/`) must never be logged, returned in API responses, or leave the server process
-- Admin server binds to `127.0.0.1` only — never expose externally
-- Never commit private keys (SecKey.json)
-- Token secrets must come from environment variables, never hardcoded
-- TLS is required for all cloud deployments
+- Secret key (`vault-keys/<key-id>/SecKey.json`) must never be logged, returned in API responses, or leave the server process
+- Admin transport is a Unix domain socket (mode 0600, vault-user owned) — never expose externally
+- Never commit private keys (`SecKey.json`) or filled-in `runevault.conf` files
+- Token secrets and FHE keys live in `runevault.conf` (mode 0600); secret YAML fields support `*_file` indirection for KMS-backed deployments
+- TLS is required for all cloud deployments (`server.grpc.tls.disable: true` is dev-only)
 - Review security implications of changes
 - Test authentication and authorization
 
diff --git a/README.md b/README.md
index a125008..14bb58f 100644
--- a/README.md
+++ b/README.md
@@ -19,14 +19,14 @@ For system architecture and data flow details, see [docs/ARCHITECTURE.md](docs/A
 
 ### Platform
 
-- **macOS** or **Linux** (Windows is not supported — pyenvector requires Unix)
+- **macOS** or **Linux** (Windows is not supported — `runevault` registers a systemd or launchd service)
 
 ### For Administrators
 
 1. **enVector Cloud account** at [https://envector.io](https://envector.io) — Cluster Endpoint and API Key
-2. **Cloud provider account** (OCI, AWS, or GCP) — only needed for cloud deployment
+2. **Cloud provider account** (AWS, GCP, or OCI) — only needed for cloud deployment
 
-The [installer](#quick-start) will automatically check and install required tools (Docker, Terraform, etc.).
+The [installer](#quick-start) auto-checks for the tools it needs (`cosign` for signature verification, plus `terraform` and the relevant cloud CLI when targeting a CSP).
 
 ### For Team Members
 
@@ -38,50 +38,46 @@ Team members install [Rune](https://github.com/CryptoLabInc/rune) from Claude Ma
 
 ## Quick Start
 
-### 1. Build and run Rune-Vault
+### 1. Install Rune-Vault
 
-Phase 1 of the Go runtime migration ships the daemon as a single binary
-`runevault`. The cloud installer (binary distribution + Terraform) lands
-in Phase 3 (issue #64); until then, build from source:
+The interactive installer downloads a Sigstore-signed `runevault` binary,
+verifies the signature, renders `runevault.conf`, generates TLS certs,
+and registers a `runevault` service (systemd on Linux, launchd on macOS):
 
 ```bash
-git clone https://github.com/CryptoLabInc/rune-admin.git
-cd rune-admin/vault
-go build -o /usr/local/bin/runevault ./cmd/runevault
-```
+# Local install
+curl -fsSL https://raw.githubusercontent.com/CryptoLabInc/rune-admin/main/install.sh \
+  | sudo bash -s -- --target local
 
-Render `runevault.conf` from the template (paths, TLS cert/key, envector
-credentials, team secret) and place it at
-`/opt/rune-vault/configs/runevault.conf`:
-
-```bash
-# Template
-cat vault/internal/server/testdata/runevault.conf.example
-# (then write your filled-in copy)
-sudo install -m 0600 -o "$(id -un)" runevault.conf /opt/rune-vault/configs/runevault.conf
+# Cloud install (provisions a VM + bootstraps it via Terraform)
+curl -fsSL https://raw.githubusercontent.com/CryptoLabInc/rune-admin/main/install.sh \
+  | sudo bash -s -- --target aws    # or gcp, oci
 ```
 
-Generate self-signed TLS certs (or supply your own) and start the daemon:
+The installer prompts for team name, enVector endpoint, and CSP-specific
+inputs (region, GCP project ID, OCI compartment OCID). Use `--non-interactive`
+plus the `RUNEVAULT_*` env vars listed in [`install.sh`](install.sh) for CI.
 
-```bash
-mise run certs                       # writes certs/server.{pem,key}
-runevault daemon start               # foreground; Ctrl+C or `runevault daemon stop` to exit
-```
+For tighter supply-chain assurance, download `install.sh` first and verify
+its signature before running it — see [Release Signature Verification](#release-signature-verification).
 
 ### 2. Verify Deployment
 
 ```bash
 # gRPC health check (requires grpcurl: brew install grpcurl)
-grpcurl -cacert ca.pem <your-vault-host>:50051 grpc.health.v1.Health/Check
+grpcurl -cacert /opt/runevault/certs/ca.pem <your-vault-host>:50051 grpc.health.v1.Health/Check
 
 # Expected: { "status": "SERVING" }
+
+# Or use the runevault CLI to query daemon status via the admin socket
+runevault status
 ```
 
 ### 3. Onboard Team Members
 
 ```bash
-# Issue a per-user token
-runevault token issue --user alice --role member
+# Issue a per-user token (90-day expiry)
+sudo runevault token issue --user alice --role member --expires 90d
 
 # Share via secure channel (1Password, Signal, etc.):
 #   - Vault Endpoint
@@ -90,20 +86,54 @@ runevault token issue --user alice --role member
 #   - enVector API Key
 ```
 
+Members of the `runevault` group can run the CLI without `sudo`.
+
 Team members install [Rune](https://github.com/CryptoLabInc/rune) and configure with the provided credentials.
 
+### From Source (development)
+
+```bash
+git clone https://github.com/CryptoLabInc/rune-admin.git
+cd rune-admin
+mise install            # Go 1.25, buf, terraform, cloud CLIs
+mise run setup          # Resolve Go modules + generate proto stubs
+mise run go:build       # Builds vault/bin/runevault
+# Copy + edit a dev config (the vault/dev/ tree is gitignored):
+cp vault/internal/server/testdata/runevault.conf.example vault/dev/runevault.conf
+mise run dev            # Run the daemon in the foreground (uses vault/dev/runevault.conf)
+```
+
 ## Admin Workflows
 
-### Rotate Token
+All admin commands talk to the daemon over a Unix domain socket
+(`/opt/runevault/admin.sock`). Members of the `runevault` group can run
+them without `sudo`.
+
+### Manage Tokens
 
 ```bash
-# Rotate a single user's token
-runevault token rotate --user alice
+runevault token issue   --user alice --role member --expires 90d
+runevault token list
+runevault token rotate  --user alice         # or --all
+runevault token revoke  --user alice
+```
 
-# Rotate all tokens
-runevault token rotate --all
+### Manage Roles
 
-# Distribute new tokens to team members via secure channel
+```bash
+runevault role list
+runevault role create --name <name> --scope a,b,c --top-k 10 --rate-limit 30/60s
+runevault role update --name <name> [--scope ...] [--top-k ...] [--rate-limit ...]
+runevault role delete --name <name>
+```
+
+### Daemon Health & Logs
+
+```bash
+runevault status                              # health + socket liveness
+runevault logs                                # tail audit log
+sudo systemctl restart runevault              # Linux
+sudo launchctl kickstart -k system/com.cryptolabinc.runevault   # macOS
 ```
 
 ## Security
@@ -149,13 +179,27 @@ pass verification.
 
 ## Deployment Targets
 
-Cloud deployment automation (Terraform modules under `deployment/`) is
-on hold during the Phase 1 → Phase 3 transition. Deploy the binary
-directly to your VM of choice for now.
+`install.sh --target <provider>` provisions a VM via Terraform and
+bootstraps `runevault` on it end-to-end. Each target lives under
+`deployment/`:
 
-- **OCI** (Oracle Cloud Infrastructure): `deployment/oci/` (Phase 3)
-- **AWS** (Amazon Web Services): `deployment/aws/` (Phase 3)
-- **GCP** (Google Cloud Platform): `deployment/gcp/` (Phase 3)
+- **AWS** (Amazon Web Services): `deployment/aws/`
+- **GCP** (Google Cloud Platform): `deployment/gcp/`
+- **OCI** (Oracle Cloud Infrastructure): `deployment/oci/`
+
+Service files for native installs are under `deployment/systemd/` and
+`deployment/launchd/`.
+
+## Uninstall
+
+```bash
+# Local: stops the service and removes /opt/runevault (prompts to keep data)
+sudo bash install.sh --uninstall --target local
+
+# Cloud: runs `terraform destroy` against the install dir created earlier
+sudo bash install.sh --uninstall --target aws \
+  --install-dir "$HOME/rune-vault-aws"
+```
 
 ## Development
 
@@ -167,39 +211,42 @@ See [CONTRIBUTING.md](CONTRIBUTING.md) for development setup, commands, and guid
 
 ```bash
 # Check Vault is reachable
-grpcurl -cacert ca.pem vault-yourteam.oci.envector.io:50051 grpc.health.v1.Health/Check
+grpcurl -cacert /opt/runevault/certs/ca.pem <vault-host>:50051 grpc.health.v1.Health/Check
 
-# Check firewall rules (port 50051 must be open)
-cd deployment/oci
-terraform state show oci_core_security_list.vault
+# Inspect the security group / firewall rule (port 50051 must be open)
+cd "$HOME/rune-vault-<csp>"
+terraform show | grep -A5 -E 'security_(group|list)'
 
-# Verify token — have team member re-enter carefully
+# Verify the token — have the team member re-enter it carefully
 ```
 
 ### Issue: Slow decryption
 
 ```bash
-# Check Vault CPU usage — increase instance resources if >80%
-ssh admin@vault-yourteam.oci.envector.io
+# Check Vault CPU usage — re-provision with a larger VM if >80%
+ssh ubuntu@<vault-host>     # or ec2-user@... / opc@... depending on CSP
 top
 
-# Check audit log for latency (mounted to host ./logs/)
-tail -20 /opt/rune/logs/audit.log
+# Tail audit log for latency
+sudo tail -20 /opt/runevault/logs/audit.log
+# Or via the CLI:
+runevault logs
 ```
 
 ### Issue: Vault crashed
 
 ```bash
-# Check logs
-docker logs rune-vault --tail 100
+# Inspect logs
+sudo journalctl -u runevault -n 100        # Linux
+sudo log show --predicate 'process == "runevault"' --last 10m   # macOS
 
 # Restart
-docker restart rune-vault
+sudo systemctl restart runevault           # Linux
+sudo launchctl kickstart -k system/com.cryptolabinc.runevault   # macOS
 
-# If persistent, redeploy
-cd deployment/oci
-terraform destroy
-terraform apply
+# If persistent, re-provision the VM:
+sudo bash install.sh --uninstall --target <csp> --install-dir "$HOME/rune-vault-<csp>"
+sudo bash install.sh --target <csp>
 ```
 
 ## Documentation
diff --git a/docs/ARCHITECTURE.md b/docs/ARCHITECTURE.md
index 2e0d154..f78565a 100644
--- a/docs/ARCHITECTURE.md
+++ b/docs/ARCHITECTURE.md
@@ -73,10 +73,10 @@ Rune-Vault is the **infrastructure backbone** for team-shared FHE-encrypted orga
 
 ## Port Summary
 
-| Port | Protocol | Purpose | Exposure |
-|------|----------|---------|----------|
-| 50051 | gRPC + TLS | Vault service, health check, reflection | Public (team members) |
-| 8081 | HTTP | Admin token/role CRUD + health check | Container-internal only |
+| Endpoint | Protocol | Purpose | Exposure |
+|----------|----------|---------|----------|
+| `:50051` | gRPC + TLS | Vault service, health check, reflection | Public (team members) |
+| `/opt/runevault/admin.sock` | Unix domain socket (mode 0600) | Admin token/role CRUD + status | Local only — `runevault` CLI |
 
 ## Component Details
 
@@ -91,20 +91,21 @@ Rune-Vault is the **infrastructure backbone** for team-shared FHE-encrypted orga
 - **On-Premise** (Self-hosted)
 
 **Runtime**:
-- Python 3.12 gRPC server
+- Single-binary Go gRPC daemon (`runevault`) — no runtime dependencies beyond TLS
 - gRPC server on port 50051 (used by envector-mcp-server)
 - gRPC health check via `grpc.health.v1` protocol
-- Internal admin HTTP API on port 8081 (container-local only)
+- Admin Unix domain socket at `/opt/runevault/admin.sock` (mode 0600, vault-user owned)
+- Registered as a native systemd unit (`runevault.service`) on Linux or a launchd job (`com.cryptolabinc.runevault`) on macOS
 
-**Key Storage** (`vault_keys/vault-key/`):
+**Key Storage** (`/opt/runevault/vault-keys/<key-id>/`, default `<key-id>` = `vault-key`):
 ```
-vault_keys/vault-key/
+/opt/runevault/vault-keys/vault-key/
 ├── EncKey.json      # Public encryption key (distributed to agents)
 ├── EvalKey.json     # Public evaluation key (for FHE operations)
 └── SecKey.json      # Secret decryption key (NEVER leaves Vault)
 ```
 
-Keys are auto-generated on first startup via `ensure_vault()`.
+Keys are auto-generated on first startup by `EnsureVault` (in `vault/internal/server/ensure_vault.go`).
 
 **Security Properties**:
 - Secret key stored encrypted at rest (filesystem encryption)
@@ -119,11 +120,10 @@ Defined in `proto/vault_service.proto` (`rune.vault.v1.VaultService`).
 
 **Server Configuration**:
 - Max message size: 256 MB (for EvalKey transfer)
-- Thread pool: 4 workers
-- Interceptor chain: `ValidationInterceptor` (protovalidate + runtime checks)
+- Interceptor chain: validation (protovalidate + runtime checks) → auth/RBAC → audit
 - gRPC reflection enabled (for grpcurl discovery)
 - gRPC health checking (`grpc.health.v1`) enabled
-- TLS required by default (disable via `VAULT_TLS_DISABLE=true`)
+- TLS required by default (`server.grpc.tls.disable: true` is dev only — never in production)
 
 **`GetPublicKey()`**
 - Returns: JSON bundle containing EncKey, EvalKey, index_name, key_id, agent_id, agent_dek (per-user derived encryption key)
@@ -146,15 +146,15 @@ Defined in `proto/vault_service.proto` (`rune.vault.v1.VaultService`).
 
 ### 3. Authentication & Access Control
 
-**Token Format**: `evt_` prefix + 32 hex characters (total 36 chars), generated via `secrets.token_hex(16)`.
+**Token Format**: `evt_` prefix + 32 hex characters (total 36 chars), generated from `crypto/rand`.
 - Example: `evt_a1b2c3d4e5f6a7b8c9d0e1f2a3b4c5d6`
 - Proto-level validation enforces exactly 36 characters.
 
-**Per-User RBAC** (managed by `TokenStore`):
+**Per-User RBAC** (managed by the `tokens` package):
 - Each user gets their own token assigned to a role.
-- `validate()` returns `(username, Role)` tuple.
+- Validation returns the matched user and role.
 - Checks: token existence, expiration, rate limit (per-user sliding window).
-- Scope checked separately per gRPC method.
+- Scope is checked separately per gRPC method.
 
 **Default Roles:**
 
@@ -163,42 +163,47 @@ Defined in `proto/vault_service.proto` (`rune.vault.v1.VaultService`).
 | admin | get_public_key, decrypt_scores, decrypt_metadata, manage_tokens | 50 | 150/60s |
 | member | get_public_key, decrypt_scores, decrypt_metadata | 10 | 30/60s |
 
-Custom roles can be created via the Admin API or CLI.
+Custom roles can be created via `runevault role create`.
 
 **Token Lifecycle:**
 - Issue: `runevault token issue --user alice --role member --expires 90d`
-- Rotate: `runevault token rotate --user alice` (atomic revoke + reissue)
+- Rotate: `runevault token rotate --user alice` (atomic revoke + reissue) or `--all`
 - Revoke: `runevault token revoke --user alice`
-- Persistence: async YAML writes to `vault-tokens.yml` / `vault-roles.yml` (atomic via temp file + `os.replace`)
-
-**Configuration Priority** (at startup):
-1. YAML config files (`vault-roles.yml`, `vault-tokens.yml`)
-2. Legacy env var (`VAULT_TOKENS`)
-3. Demo mode (auto-generated demo token)
-
-### 4. Admin Server & CLI
-
-**Admin Server** (`admin_server.py`):
-- HTTP on `127.0.0.1:8081` (not exposed via Docker; access via `docker exec`)
-- No authentication (protected by container isolation)
-- REST API for token and role CRUD operations
-
-| Method | Path | Purpose |
-|--------|------|---------|
-| GET | /health | Health check (queries gRPC health servicer) |
-| GET | /tokens | List all tokens |
-| POST | /tokens | Issue new token |
-| DELETE | /tokens/{user} | Revoke token |
-| POST | /tokens/{user}/rotate | Rotate single token |
-| POST | /tokens/_rotate_all | Rotate all tokens |
-| GET | /roles | List all roles |
-| POST | /roles | Create role |
-| PUT | /roles/{name} | Update role |
-| DELETE | /roles/{name} | Delete role |
-
-**CLI** (`vault_admin_cli.py` / `runevault`):
-- Wraps the Admin HTTP API for operator convenience
-- Available inside the container
+- Persistence: atomic YAML writes to the files referenced by `tokens.tokens_file` and `tokens.roles_file` in `runevault.conf` (defaults: `/opt/runevault/configs/{tokens,roles}.yml`).
+
+**Configuration Source**: `runevault.conf` (YAML) is the single source of truth — no env-var fallback or migration helper. Lookup order:
+1. `--config <path>` CLI flag
+2. `/opt/runevault/configs/runevault.conf`
+3. `./runevault.conf` (cwd, dev only)
+
+Secret YAML fields (`tokens.team_secret`, `envector.api_key`) accept a sibling `*_file` key for KMS-backed deployments.
+
+### 4. Admin Socket & CLI
+
+**Admin Socket** (`vault/internal/server/admin.go`):
+- Unix domain socket at `/opt/runevault/admin.sock` (mode 0600, vault-user owned)
+- Filesystem permissions are the only authorization gate; never expose externally
+- Used by the `runevault` CLI and by the daemon's lifecycle hooks (e.g. `ErrRestartRequested` after token rotation)
+
+**CLI** (`runevault`):
+
+| Command | Purpose |
+|---------|---------|
+| `runevault status` | Daemon health and socket liveness |
+| `runevault logs` | Tail audit log output |
+| `runevault token issue --user <name> --role <role> [--expires 90d]` | Issue a new per-user token |
+| `runevault token list` | List issued tokens |
+| `runevault token rotate --user <name>` / `--all` | Atomic revoke + reissue |
+| `runevault token revoke --user <name>` | Revoke a token |
+| `runevault role list` | List configured roles |
+| `runevault role create --name <name> --scope a,b,c --top-k N --rate-limit N/Ts` | Create a custom role |
+| `runevault role update --name <name> [--scope] [--top-k] [--rate-limit]` | Update an existing role |
+| `runevault role delete --name <name>` | Delete a role |
+| `runevault version` | Print build version (works without daemon or socket) |
+
+The `daemon start` subcommand is invoked by systemd / launchd; operators
+control lifecycle via `systemctl … runevault` (Linux) or
+`launchctl … system/com.cryptolabinc.runevault` (macOS) rather than directly.
 
 ### 5. Input Validation
 
@@ -214,7 +219,7 @@ Non-Vault methods (health check, reflection) pass through untouched.
 Each agent gets a unique 32-byte AES-256 DEK (Data Encryption Key):
 
 ```
-DEK = HKDF-SHA256(key=VAULT_TEAM_SECRET, info=agent_id)
+DEK = HKDF-SHA256(key=tokens.team_secret, info=agent_id)
 agent_id = SHA256(token)[:32]
 ```
 
@@ -225,20 +230,19 @@ agent_id = SHA256(token)[:32]
 
 ### 7. Audit Logging
 
-Structured JSON logging for all gRPC operations (`audit.py`):
+Structured JSON logging for all gRPC operations (`vault/internal/server/audit.go`):
 
 - One JSON line per request: timestamp, user_id, method, top_k, result_count, status, source_ip, latency_ms, error
-- Source IP extracted from gRPC `context.peer()`
+- Source IP extracted from the gRPC peer context
+- File output uses `lumberjack` for size-based rotation
 
-**Configuration** (via `VAULT_AUDIT_LOG` env var):
+**Configuration** in `runevault.conf`:
 
-| Value | Behavior |
-|-------|----------|
-| *(empty)* | Disabled |
-| `file` | `/var/log/rune-vault/audit.log` (daily rotation, 30-day retention) |
-| `file:/path` | Custom file path |
-| `stdout` | JSON lines to stdout (for cloud log aggregators) |
-| `file+stdout` | Both |
+```yaml
+audit:
+  mode: file+stdout         # one of: "" (disabled), file, stdout, file+stdout
+  path: /opt/runevault/logs/audit.log
+```
 
 ## Data Flow
 
@@ -377,90 +381,80 @@ EvalKey: Distributed to all team members (safe to share, FHE operations)
 
 ### Cloud Deployment (Terraform)
 
+`install.sh --target <aws|gcp|oci>` wraps Terraform end-to-end:
+preflight checks → `terraform apply` → cloud-init bootstrap → CA-cert SCP
+poll → remote `install.sh` execution.
+
 ```
 Terraform Configuration
     │
-    ├── deployment/oci/main.tf    # Oracle Cloud
     ├── deployment/aws/main.tf    # Amazon Web Services
-    └── deployment/gcp/main.tf    # Google Cloud Platform
+    ├── deployment/gcp/main.tf    # Google Cloud Platform
+    └── deployment/oci/main.tf    # Oracle Cloud Infrastructure
         │
         ▼
 Cloud Resources Created
     │
     ├── Compute Instance (VM)
-    │   ├── OS: Ubuntu 22.04 LTS
-    │   ├── Shape: 2 OCPU, 8GB RAM, 50GB disk
-    │   └── Software:
-    │       ├── Python 3.12
-    │       └── pyenvector (FHE SDK)
+    │   ├── OS: Ubuntu 24.04 LTS
+    │   └── Software (installed via cloud-init startup script):
+    │       ├── runevault binary (Sigstore-verified)
+    │       └── runevault.service (systemd) registered
     │
     ├── Networking
     │   ├── Public IP address
-    │   ├── Security group (allow 50051/gRPC)
-    │   └── DNS: vault-{team}.oci.envector.io
+    │   └── Security group / list / firewall rule (allow 50051/gRPC)
     │
     ├── Storage
-    │   ├── /vault_keys/ (encrypted volume)
-    │   └── Backup to cloud storage (optional)
+    │   └── /opt/runevault/vault-keys/<key-id>/  (FHE keys)
     │
     └── Audit Logging
-        └── /var/log/rune-vault/audit.log
+        └── /opt/runevault/logs/audit.log
 ```
 
-### High Availability (Optional)
-
-```
-Load Balancer (HTTPS)
-    │
-    ├── Vault Instance 1 (Primary)
-    ├── Vault Instance 2 (Standby)
-    └── Vault Instance N (Standby)
-        │
-        └── Shared Storage (NFS/EFS)
-            └── /vault_keys/ (same keys across instances)
-```
-
-**Setup**:
-```bash
-cd deployment/oci
-terraform apply -var="ha_enabled=true" \
-                -var="instance_count=3"
-```
+Common Terraform variables across all CSPs: `team_name`, `tls_mode`,
+`envector_endpoint`, `envector_api_key`, `runevault_version`,
+`public_key`, `region`. CSP-specific: `instance_type` (AWS),
+`project_id` / `zone` / `machine_type` (GCP), `oci_profile` /
+`compartment_id` (OCI). Output: `vault_public_ip`.
 
-**Failover**:
-- Health checks every 10s
-- Auto-failover <30s
-- Shared keys (no key synchronization needed)
+Horizontal scaling and multi-instance HA are not currently supported.
+For higher capacity, re-provision with a larger VM shape via your cloud
+provider.
 
 ## Operational Considerations
 
 ### Backup & Recovery
 
 **Critical Assets**:
-- `/vault_keys/vault-key/SecKey.json` - **MUST backup** (cannot regenerate)
-- `VAULT_TEAM_SECRET` - **MUST backup** (needed for DEK re-derivation)
-- Vault token - Rotatable via CLI
+- `/opt/runevault/vault-keys/<key-id>/SecKey.json` — **MUST backup** (cannot regenerate)
+- `tokens.team_secret` from `runevault.conf` — **MUST backup** (needed for DEK re-derivation)
+- Per-user tokens — rotatable via `runevault token rotate`
 
 **Backup Strategy**:
 ```bash
-# Manually back up vault keys
-tar czf vault_keys_backup_$(date +%Y-%m-%d).tar.gz vault/vault_keys/
+# Manually back up vault keys (run on the VM)
+sudo tar czf vault-keys_backup_$(date +%Y-%m-%d).tar.gz -C /opt/runevault vault-keys/
 
-# Store in:
-# 1. Offline (USB drive in safe)
-# 2. Cloud (different provider, encrypted)
-# 3. Password manager (1Password secure notes)
+# Also archive runevault.conf or at minimum the tokens.team_secret value
+# Store in: offline media, a different cloud provider, or a password manager
 ```
 
 **Recovery Procedure**:
 ```bash
-# If Vault VM fails
-cd deployment/oci
-terraform apply -var="restore_from_backup=true" \
-                -var="backup_path=/path/to/backup.tar.gz.enc"
+# 1. Re-provision a fresh VM via the installer
+sudo bash install.sh --target <aws|gcp|oci>
+
+# 2. Stop the daemon before restoring keys
+sudo systemctl stop runevault
+
+# 3. Restore vault-keys and team_secret
+sudo tar xzf vault-keys_backup_YYYY-MM-DD.tar.gz -C /opt/runevault
+# Edit /opt/runevault/configs/runevault.conf and restore tokens.team_secret
 
-# Vault restarts with same keys
-# Team members continue without reconfiguration
+# 4. Bring the daemon back up
+sudo systemctl start runevault
+# Team members continue without reconfiguration.
 ```
 
 ### Token Rotation
@@ -472,61 +466,54 @@ runevault token rotate --user alice
 # Rotate all tokens
 runevault token rotate --all
 
-# Distribute new tokens to team members via secure channel
+# Distribute new tokens to team members via a secure channel
 ```
 
-### Scaling Strategies
+### Scaling Strategy
 
-**Vertical Scaling** (increase VM size):
-```bash
-terraform apply -var="instance_shape=VM.Standard.E4.Flex" \
-                -var="instance_ocpu=4" \
-                -var="instance_memory_gb=16"
-```
+Re-provision with a larger VM shape via your cloud provider's console or
+by editing the relevant `instance_type` (AWS) / `machine_type` (GCP) /
+shape configuration (OCI) and re-running `terraform apply` from your
+install directory.
 
-**Horizontal Scaling** (add more instances):
-```bash
-terraform apply -var="ha_enabled=true" \
-                -var="instance_count=3"
-```
-
-**When to Scale**:
-- CPU >80% sustained → Add OCPU or scale out
-- Latency P95 >200ms → Add instances
-- Error rate >1% → Investigate (likely config issue, not scale)
+When to scale:
+- CPU >80% sustained
+- Latency P95 >200ms
+- Error rate >1% (investigate first — usually a config issue, not scale)
 
 ## Module Reference
 
-| Module | Purpose |
-|--------|---------|
-| `vault_core.py` | Core business logic: key management, decryption, DEK derivation |
-| `vault_grpc_server.py` | gRPC server, TLS, entrypoint, orchestrates all subsystems |
-| `token_store.py` | Per-user RBAC: Token/Role dataclasses, validation, rate limiting, YAML persistence |
-| `admin_server.py` | Internal HTTP admin API for token/role CRUD |
-| `validation_interceptor.py` | gRPC interceptor: protovalidate + runtime input checks |
-| `request_validator.py` | Runtime validation rules (control chars, whitespace) |
-| `audit.py` | Structured JSON audit logging with file rotation |
-| `vault_admin_cli.py` | CLI for token/role management (`runevault` command) |
+| Package | Purpose |
+|---------|---------|
+| `vault/cmd` | Binary entry point — wires Cobra root command and runs `Execute()` |
+| `vault/internal/commands` | CLI subcommands (`daemon`, `token`, `role`, `status`, `logs`, `version`) and admin-socket client |
+| `vault/internal/server` | gRPC server, config loader, audit logger, admin UDS, `EnsureVault` startup hook, interceptors |
+| `vault/internal/tokens` | Per-user RBAC store: tokens, roles, validation, rate limiting, YAML persistence |
+| `vault/internal/crypto` | FHE key management + HKDF/AES wrappers around `envector-go-sdk` |
+| `vault/internal/tests` | E2E tests gated by build tag `e2e` (decrypt pipeline + CLI smoke) |
+| `vault/pkg/vaultpb` | Generated gRPC stubs from `vault/proto/*.proto` |
 
 ## Troubleshooting
 
 ### Issue: High Latency
 
-**Symptoms**: decrypt_scores() taking >200ms
+**Symptoms**: `DecryptScores` taking >200ms
 
 **Diagnosis**:
 ```bash
 # Check Vault CPU on the server
-ssh admin@vault-yourteam.oci.envector.io
+ssh ubuntu@<vault-host>     # or ec2-user@... / opc@... depending on CSP
 top
 
-# Check audit log for latency
-docker exec rune-vault tail -20 /var/log/rune-vault/audit.log
+# Tail the audit log for latency
+sudo tail -20 /opt/runevault/logs/audit.log
+# Or use the CLI from the host:
+runevault logs
 ```
 
 **Solutions**:
-- CPU bottleneck → Scale up (add OCPU)
-- Large Top-K → Reduce max results
+- CPU bottleneck → Re-provision with a larger VM shape
+- Large Top-K → Reduce max results (or tighten role `top_k`)
 - High dimension → Acceptable (dim=1024 is standard)
 
 ### Issue: Authentication Failures
@@ -535,37 +522,40 @@ docker exec rune-vault tail -20 /var/log/rune-vault/audit.log
 
 **Diagnosis**:
 ```bash
-# Check token is correct
-echo $RUNEVAULT_TOKEN
+# Verify the daemon is up
+runevault status
 
-# Verify Vault sees requests
-ssh admin@vault-yourteam.oci.envector.io
-sudo journalctl -u vault | grep "denied"
+# Inspect server logs for denied requests
+sudo journalctl -u runevault | grep -i "denied\|unauthenticated"
 ```
 
 **Solutions**:
-- Wrong token → Re-share correct token
-- Token rotated → Distribute new token to all team members
-- Token expired → Issue new token via `runevault token issue`
-- Rate limited → Wait for window reset or adjust role rate_limit
-- Firewall → Check security group allows 50051 from team IPs
+- Wrong token → Re-share the correct token
+- Token rotated → Distribute the new token to all team members
+- Token expired → Issue a fresh token via `runevault token issue`
+- Rate limited → Wait for the window to reset, or adjust the role's `rate_limit`
+- Firewall → Check the security group allows 50051 from team IPs
 
 ### Issue: Vault Crashed
 
-**Symptoms**: Health check fails, 503 Service Unavailable
+**Symptoms**: Health check fails, daemon not responsive
 
 **Diagnosis**:
 ```bash
-ssh admin@vault-yourteam.oci.envector.io
-sudo systemctl status vault
-sudo journalctl -u vault -n 100
+# Linux
+sudo systemctl status runevault
+sudo journalctl -u runevault -n 100
+
+# macOS
+sudo launchctl print system/com.cryptolabinc.runevault
+sudo log show --predicate 'process == "runevault"' --last 10m
 ```
 
 **Solutions**:
 - OOM killer → Increase VM memory
-- Disk full → Rotate logs (`logrotate`)
-- Crashed process → Restart (`systemctl restart vault`)
-- Persistent crash → Redeploy with backup keys
+- Disk full → Rotate logs (`lumberjack` handles size-based rotation, but free disk first)
+- Crashed process → `sudo systemctl restart runevault` (Linux) / `sudo launchctl kickstart -k system/com.cryptolabinc.runevault` (macOS)
+- Persistent crash → Re-provision with `install.sh --uninstall` then `install.sh --target <provider>`, restoring `vault-keys/` from backup before first start
 
 ## Next Steps
 
diff --git a/tests/FIXTURES.md b/tests/FIXTURES.md
index a7ce2d2..7549fe1 100644
--- a/tests/FIXTURES.md
+++ b/tests/FIXTURES.md
@@ -104,7 +104,7 @@ To run integration tests locally, you need the current passphrase:
 ```bash
 export FIXTURES_GPG_PASSPHRASE="<current passphrase>"
 mise run fixtures:decrypt
-mise run test
+mise run go:test:unit
 ```
 
 ## Fixture Contents

From 3260d7649b3c27052db9eef4ea5e72049a1c7255 Mon Sep 17 00:00:00 2001
From: Jeonghwan Lee <jhlee@cryptolab.co.kr>
Date: Thu, 30 Apr 2026 10:51:55 +0900
Subject: [PATCH 22/27] =?UTF-8?q?chore:=20drop=20cosign/Sigstore=20?=
 =?UTF-8?q?=E2=80=94=20keep=20SHA256SUMS-only=20release=20verification?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Per prior decision that cosign-based hashsum verification was operationally
heavy, remove every cosign/Sigstore dependency:

- install.sh: drop cosign from preflight tools, _install_tool case, and
  Phase 2/3 verify-blob block. Stop downloading SHA256SUMS.{sig,pem}.
  RUNEVAULT_SKIP_VERIFY now toggles the SHA256SUMS check.
- release.yaml: drop sigstore/cosign-installer step and cosign sign-blob
  step. Release artifacts are now <archive> + SHA256SUMS only.
- deployment/{aws,gcp,oci}/cloud-init.yaml + startup-script.sh: drop the
  cosign download (no longer needed since install.sh doesn't use it).
- deployment/{aws,gcp,oci}/cloud-init-dev.yaml + startup-script-dev.sh:
  replace the cosign-as-sentinel pattern with a plain
  /var/run/runevault-dev-ready file. install-dev.sh polls the new sentinel.
- install-dev.sh: drop RUNEVAULT_SKIP_VERIFY=1 (LOCAL_BINARY already
  short-circuits download_and_verify so verification never runs in dev).
- README, CONTRIBUTING, CHANGELOG, ARCHITECTURE: replace
  Sigstore/signature-verification language with checksum verification.

SHA256SUMS integrity now relies on GitHub HTTPS for the release-page download.
---
 .github/workflows/release.yaml       | 17 +---------
 CHANGELOG.md                         |  4 +--
 CONTRIBUTING.md                      |  2 +-
 README.md                            | 32 ++++++++-----------
 deployment/aws/cloud-init-dev.yaml   |  5 +--
 deployment/aws/cloud-init.yaml       |  4 ---
 deployment/gcp/startup-script-dev.sh |  5 +--
 deployment/gcp/startup-script.sh     |  4 ---
 deployment/oci/startup-script-dev.sh |  5 +--
 deployment/oci/startup-script.sh     |  4 ---
 docs/ARCHITECTURE.md                 |  2 +-
 install.sh                           | 46 +++++-----------------------
 scripts/install-dev.sh               |  8 ++---
 13 files changed, 31 insertions(+), 107 deletions(-)

diff --git a/.github/workflows/release.yaml b/.github/workflows/release.yaml
index 7a9c452..ad4b1b1 100644
--- a/.github/workflows/release.yaml
+++ b/.github/workflows/release.yaml
@@ -110,12 +110,11 @@ jobs:
           retention-days: 7
 
   publish:
-    name: Sign and publish
+    name: Publish
     runs-on: ubuntu-latest
     needs: build
     permissions:
       contents: write
-      id-token: write
 
     steps:
       - uses: actions/checkout@v4
@@ -126,9 +125,6 @@ jobs:
           path: dist/
           merge-multiple: true
 
-      - name: Install cosign
-        uses: sigstore/cosign-installer@v3
-
       - name: Resolve version
         id: meta
         run: |
@@ -142,15 +138,6 @@ jobs:
         working-directory: dist/
         run: sha256sum *.tar.gz > SHA256SUMS
 
-      - name: Sign SHA256SUMS
-        working-directory: dist/
-        run: |
-          cosign sign-blob \
-            --yes \
-            --output-signature SHA256SUMS.sig \
-            --output-certificate SHA256SUMS.pem \
-            SHA256SUMS
-
       - name: Upload to GitHub Release
         if: github.event_name == 'release'
         working-directory: dist/
@@ -160,6 +147,4 @@ jobs:
           gh release upload "${{ github.event.release.tag_name }}" \
             *.tar.gz \
             SHA256SUMS \
-            SHA256SUMS.sig \
-            SHA256SUMS.pem \
             --repo "${{ github.repository }}"
diff --git a/CHANGELOG.md b/CHANGELOG.md
index e155a8b..3d4563e 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -13,13 +13,13 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
 
 ### Added
 
-- Production installer `install.sh` with `--target local|aws|gcp|oci`, Sigstore signature verification, systemd/launchd service registration, and `--uninstall` flow
+- Production installer `install.sh` with `--target local|aws|gcp|oci`, SHA256SUMS checksum verification, systemd/launchd service registration, and `--uninstall` flow
 - Dev installer `scripts/install-dev.sh` (structural sibling of `install.sh`) for local/CSP testing without GitHub releases
 - CSP provisioning via Terraform for AWS, GCP, and OCI: preflight CLI/auth checks, cloud-init bootstrap, CA-cert SCP polling
 - CSP uninstall flow that wraps `terraform destroy`
 - `runevault status` (daemon + admin-socket health) and `runevault logs` (audit log tail) subcommands
 - `runevault` group lets members run the CLI without `sudo`
-- Multi-platform release pipeline (linux/darwin × amd64/arm64) with `SHA256SUMS` + Sigstore keyless signing
+- Multi-platform release pipeline (linux/darwin × amd64/arm64) with `SHA256SUMS` checksum manifest
 - `EnsureVault` startup hook to activate keys and ensure index on first run
 
 ### Changed
diff --git a/CONTRIBUTING.md b/CONTRIBUTING.md
index 4b5aa7c..2065723 100644
--- a/CONTRIBUTING.md
+++ b/CONTRIBUTING.md
@@ -257,7 +257,7 @@ rune-admin/
 │   └── generate-test-fixtures.py  # Generates GPG-encrypted test fixtures
 ├── tests/                         # Encrypted fixture archive (see FIXTURES.md)
 ├── docs/ARCHITECTURE.md           # Architecture & data flow
-└── install.sh                     # Production installer (Sigstore-verified)
+└── install.sh                     # Production installer (SHA256SUMS-verified)
 ```
 
 ## Vault Architecture
diff --git a/README.md b/README.md
index 14bb58f..a32d06a 100644
--- a/README.md
+++ b/README.md
@@ -26,7 +26,7 @@ For system architecture and data flow details, see [docs/ARCHITECTURE.md](docs/A
 1. **enVector Cloud account** at [https://envector.io](https://envector.io) — Cluster Endpoint and API Key
 2. **Cloud provider account** (AWS, GCP, or OCI) — only needed for cloud deployment
 
-The [installer](#quick-start) auto-checks for the tools it needs (`cosign` for signature verification, plus `terraform` and the relevant cloud CLI when targeting a CSP).
+The [installer](#quick-start) auto-checks for the tools it needs (`terraform` and the relevant cloud CLI when targeting a CSP).
 
 ### For Team Members
 
@@ -40,8 +40,8 @@ Team members install [Rune](https://github.com/CryptoLabInc/rune) from Claude Ma
 
 ### 1. Install Rune-Vault
 
-The interactive installer downloads a Sigstore-signed `runevault` binary,
-verifies the signature, renders `runevault.conf`, generates TLS certs,
+The interactive installer downloads the `runevault` binary, verifies its
+`SHA256SUMS` checksum, renders `runevault.conf`, generates TLS certs,
 and registers a `runevault` service (systemd on Linux, launchd on macOS):
 
 ```bash
@@ -58,8 +58,9 @@ The installer prompts for team name, enVector endpoint, and CSP-specific
 inputs (region, GCP project ID, OCI compartment OCID). Use `--non-interactive`
 plus the `RUNEVAULT_*` env vars listed in [`install.sh`](install.sh) for CI.
 
-For tighter supply-chain assurance, download `install.sh` first and verify
-its signature before running it — see [Release Signature Verification](#release-signature-verification).
+If you'd rather inspect the script before running it, download `install.sh`
+and the `SHA256SUMS` file from the release page first, then run `install.sh`
+with the binary it pulls down — see [Release Checksum Verification](#release-checksum-verification).
 
 ### 2. Verify Deployment
 
@@ -155,27 +156,18 @@ Vault communications MUST use TLS. The installer automatically configures TLS ce
 - **EncKey/EvalKey**: Safe to distribute (public keys)
 - Per-agent metadata encryption uses HKDF-derived DEKs (no separate key file)
 
-### Release Signature Verification
+### Release Checksum Verification
 
-Every GitHub release ships `SHA256SUMS`, `SHA256SUMS.sig`, and `SHA256SUMS.pem`.
-The checksum file is signed keylessly via [Sigstore](https://sigstore.dev) from the
-`release.yaml` workflow. Verify before installing:
+Every GitHub release ships a `SHA256SUMS` file alongside the binaries.
+`install.sh` downloads it and runs `sha256sum --check` automatically. To
+verify by hand:
 
 ```bash
-cosign verify-blob \
-  --signature SHA256SUMS.sig \
-  --certificate SHA256SUMS.pem \
-  --certificate-oidc-issuer https://token.actions.githubusercontent.com \
-  --certificate-identity-regexp "^https://github.com/CryptoLabInc/rune-admin/.github/workflows/release.yaml@" \
-  SHA256SUMS
-
 sha256sum --check --ignore-missing SHA256SUMS
 ```
 
-The `--certificate-oidc-issuer` and `--certificate-identity-regexp` flags are
-required to pin the signature to this repository's workflow — without them,
-any Fulcio-issued certificate (including one from a different repository) would
-pass verification.
+Trust in the `SHA256SUMS` file itself relies on GitHub's HTTPS download
+of the release page.
 
 ## Deployment Targets
 
diff --git a/deployment/aws/cloud-init-dev.yaml b/deployment/aws/cloud-init-dev.yaml
index 76dbf8a..d6424ae 100644
--- a/deployment/aws/cloud-init-dev.yaml
+++ b/deployment/aws/cloud-init-dev.yaml
@@ -4,7 +4,4 @@ package_update: true
 packages: [ca-certificates, curl, openssl]
 
 runcmd:
-  - |
-      arch=$(dpkg --print-architecture); [ "$arch" = "amd64" ] && carch=amd64 || carch=arm64
-      curl -fsSL "https://github.com/sigstore/cosign/releases/latest/download/cosign-linux-$${carch}" -o /usr/local/bin/cosign
-      chmod 0755 /usr/local/bin/cosign
+  - touch /var/run/runevault-dev-ready
diff --git a/deployment/aws/cloud-init.yaml b/deployment/aws/cloud-init.yaml
index 78e4643..54bdacd 100644
--- a/deployment/aws/cloud-init.yaml
+++ b/deployment/aws/cloud-init.yaml
@@ -12,10 +12,6 @@ write_files:
 
 runcmd:
   - exec > /var/log/runevault-install.log 2>&1
-  - |
-      arch=$(dpkg --print-architecture); [ "$arch" = "amd64" ] && carch=amd64 || carch=arm64
-      curl -fsSL "https://github.com/sigstore/cosign/releases/latest/download/cosign-linux-$${carch}" -o /usr/local/bin/cosign
-      chmod 0755 /usr/local/bin/cosign
   - set -a; . /etc/profile.d/runevault-installer-env.sh; set +a
   - |
       INSTALL_URL="https://raw.githubusercontent.com/CryptoLabInc/rune-admin/${runevault_version}/install.sh"
diff --git a/deployment/gcp/startup-script-dev.sh b/deployment/gcp/startup-script-dev.sh
index 26d08e3..55dea6f 100755
--- a/deployment/gcp/startup-script-dev.sh
+++ b/deployment/gcp/startup-script-dev.sh
@@ -9,8 +9,5 @@ for i in $(seq 1 30); do
   echo "apt retry $i..." && sleep 10
 done
 
-arch=$(dpkg --print-architecture); [ "$arch" = "amd64" ] && carch=amd64 || carch=arm64
-curl -fsSL "https://github.com/sigstore/cosign/releases/latest/download/cosign-linux-$${carch}" -o /usr/local/bin/cosign
-chmod 0755 /usr/local/bin/cosign
-
+touch /var/run/runevault-dev-ready
 echo "=== prereqs ready at $(date), waiting for install-dev.sh injection ==="
diff --git a/deployment/gcp/startup-script.sh b/deployment/gcp/startup-script.sh
index 141fee4..217f7a6 100644
--- a/deployment/gcp/startup-script.sh
+++ b/deployment/gcp/startup-script.sh
@@ -8,10 +8,6 @@ for i in $(seq 1 30); do
   echo "apt retry $i..." && sleep 10
 done
 
-arch=$(dpkg --print-architecture); [ "$arch" = "amd64" ] && carch=amd64 || carch=arm64
-curl -fsSL "https://github.com/sigstore/cosign/releases/latest/download/cosign-linux-$${carch}" -o /usr/local/bin/cosign
-chmod 0755 /usr/local/bin/cosign
-
 cat > /etc/profile.d/runevault-installer-env.sh <<'ENVFILE'
 export RUNEVAULT_TEAM_NAME='${team_name}'
 export RUNEVAULT_ENVECTOR_ENDPOINT='${envector_endpoint}'
diff --git a/deployment/oci/startup-script-dev.sh b/deployment/oci/startup-script-dev.sh
index e813044..ea13143 100755
--- a/deployment/oci/startup-script-dev.sh
+++ b/deployment/oci/startup-script-dev.sh
@@ -12,8 +12,5 @@ for i in $(seq 1 30); do
   echo "apt retry $i..." && sleep 10
 done
 
-arch=$(dpkg --print-architecture); [ "$arch" = "amd64" ] && carch=amd64 || carch=arm64
-curl -fsSL "https://github.com/sigstore/cosign/releases/latest/download/cosign-linux-$${carch}" -o /usr/local/bin/cosign
-chmod 0755 /usr/local/bin/cosign
-
+touch /var/run/runevault-dev-ready
 echo "=== prereqs ready at $(date), waiting for install-dev.sh injection ==="
diff --git a/deployment/oci/startup-script.sh b/deployment/oci/startup-script.sh
index 78c881e..6ecfaea 100644
--- a/deployment/oci/startup-script.sh
+++ b/deployment/oci/startup-script.sh
@@ -11,10 +11,6 @@ for i in $(seq 1 30); do
   echo "apt retry $i..." && sleep 10
 done
 
-arch=$(dpkg --print-architecture); [ "$arch" = "amd64" ] && carch=amd64 || carch=arm64
-curl -fsSL "https://github.com/sigstore/cosign/releases/latest/download/cosign-linux-$${carch}" -o /usr/local/bin/cosign
-chmod 0755 /usr/local/bin/cosign
-
 cat > /etc/profile.d/runevault-installer-env.sh <<'ENVFILE'
 export RUNEVAULT_TEAM_NAME='${team_name}'
 export RUNEVAULT_ENVECTOR_ENDPOINT='${envector_endpoint}'
diff --git a/docs/ARCHITECTURE.md b/docs/ARCHITECTURE.md
index f78565a..355be82 100644
--- a/docs/ARCHITECTURE.md
+++ b/docs/ARCHITECTURE.md
@@ -398,7 +398,7 @@ Cloud Resources Created
     ├── Compute Instance (VM)
     │   ├── OS: Ubuntu 24.04 LTS
     │   └── Software (installed via cloud-init startup script):
-    │       ├── runevault binary (Sigstore-verified)
+    │       ├── runevault binary (SHA256SUMS-verified)
     │       └── runevault.service (systemd) registered
     │
     ├── Networking
diff --git a/install.sh b/install.sh
index b11ef54..4833620 100755
--- a/install.sh
+++ b/install.sh
@@ -37,8 +37,8 @@
 #   RUNEVAULT_OCI_COMPARTMENT_ID     OCI: compartment OCID (required for OCI)
 #
 # Dev/testing env vars (set by scripts/install-dev.sh):
-#   RUNEVAULT_LOCAL_BINARY    Path to local binary; skips download + verification
-#   RUNEVAULT_SKIP_VERIFY     Set to 1 to skip cosign verification
+#   RUNEVAULT_LOCAL_BINARY    Path to local binary; skips download + checksum verify
+#   RUNEVAULT_SKIP_VERIFY     Set to 1 to skip checksum verification (dev only)
 #   RUNEVAULT_INSTALL_PREFIX  Override /opt/runevault (default)
 #   RUNEVAULT_BINARY_PATH     Override /usr/local/bin/runevault (default)
 #   RUNEVAULT_SKIP_SERVICE    Set to 1 to skip systemd/launchd installation
@@ -47,8 +47,6 @@ set -euo pipefail
 
 # ── Constants ──────────────────────────────────────────────────────────────────
 REPO=CryptoLabInc/rune-admin
-OIDC_ISSUER=https://token.actions.githubusercontent.com
-CERT_REGEXP="^https://github.com/CryptoLabInc/rune-admin/.github/workflows/release.yaml@"
 SERVICE_USER=runevault
 GRPC_PORT=50051
 
@@ -635,15 +633,6 @@ _install_tool() {
   local tool=$1
   info "Installing ${tool}..."
   case "$OS_SLUG:$tool" in
-    linux:cosign)
-      # Download pre-built binary from sigstore releases (no apt repo needed)
-      local arch_suffix=amd64
-      [[ "$ARCH_SLUG" = arm64 ]] && arch_suffix=arm64
-      curl -fsSL \
-        "https://github.com/sigstore/cosign/releases/latest/download/cosign-linux-${arch_suffix}" \
-        -o /usr/local/bin/cosign
-      chmod 0755 /usr/local/bin/cosign
-      ;;
     linux:openssl)  _pkg_install openssl ;;
     linux:sha256sum) _pkg_install coreutils ;;
     linux:terraform)
@@ -663,7 +652,6 @@ _install_tool() {
       install -m 0755 "${tmpdir}/terraform" /usr/local/bin/terraform
       rm -rf "${tmpdir}"
       ;;
-    darwin:cosign)  _brew install cosign ;;
     darwin:openssl) _brew install openssl ;;
     darwin:terraform) _brew install terraform ;;
     darwin:shasum)
@@ -685,7 +673,6 @@ preflight() {
   [[ "$(id -u)" -eq 0 ]] || die "This installer must be run as root (use sudo)."
 
   local tools=(curl)
-  [[ "$SKIP_VERIFY" -eq 0 && -z "$LOCAL_BINARY" ]] && tools+=(cosign)
   if [[ "$OS_SLUG" = linux ]]; then
     tools+=(sha256sum systemctl)
   else
@@ -728,10 +715,8 @@ preflight() {
         printf 'Install them manually and re-run the installer:\n' >&2
         for tool in "${missing[@]}"; do
           case "$OS_SLUG:$tool" in
-            linux:cosign)   printf '  cosign:    https://docs.sigstore.dev/cosign/system_config/installation/\n' >&2 ;;
             linux:openssl)  printf '  openssl:   apt install openssl\n' >&2 ;;
             linux:sha256sum) printf '  sha256sum: apt install coreutils\n' >&2 ;;
-            darwin:cosign)  printf '  cosign:    brew install cosign\n' >&2 ;;
             darwin:openssl) printf '  openssl:   brew install openssl\n' >&2 ;;
           esac
         done
@@ -826,32 +811,17 @@ download_and_verify() {
   local base_url="https://github.com/${REPO}/releases/download/${VERSION}"
 
   info "Downloading ${archive}..."
-  _curl_retry "${base_url}/${archive}"         "$SCRATCH/${archive}"
-  _curl_retry "${base_url}/SHA256SUMS"         "$SCRATCH/SHA256SUMS"
-  _curl_retry "${base_url}/SHA256SUMS.sig"     "$SCRATCH/SHA256SUMS.sig"
-  _curl_retry "${base_url}/SHA256SUMS.pem"     "$SCRATCH/SHA256SUMS.pem"
+  _curl_retry "${base_url}/${archive}"  "$SCRATCH/${archive}"
+  _curl_retry "${base_url}/SHA256SUMS"  "$SCRATCH/SHA256SUMS"
 
   if [[ "$SKIP_VERIFY" -eq 1 ]]; then
-    warn "SKIP_VERIFY=1: skipping cosign verification (development only)."
+    warn "SKIP_VERIFY=1: skipping checksum verification (development only)."
   else
-    info "Verifying release signature..."
-    local cosign_err
-    cosign_err=$(mktemp)
-    cosign verify-blob \
-      --signature   "$SCRATCH/SHA256SUMS.sig" \
-      --certificate "$SCRATCH/SHA256SUMS.pem" \
-      --certificate-oidc-issuer "$OIDC_ISSUER" \
-      --certificate-identity-regexp "$CERT_REGEXP" \
-      "$SCRATCH/SHA256SUMS" 2>"$cosign_err" \
-      || { cat "$cosign_err" >&2
-           die "Signature verification failed — aborting before any installation."; }
-    success "Signature verified."
+    info "Verifying checksum..."
+    _checksum_verify "$SCRATCH/SHA256SUMS" "$SCRATCH/${archive}"
+    success "Checksum verified."
   fi
 
-  info "Verifying checksum..."
-  _checksum_verify "$SCRATCH/SHA256SUMS" "$SCRATCH/${archive}"
-  success "Checksum verified."
-
   info "Extracting binary..."
   tar -xzf "$SCRATCH/${archive}" -C "$SCRATCH" ./runevault
   "$SCRATCH/runevault" version >/dev/null 2>&1 \
diff --git a/scripts/install-dev.sh b/scripts/install-dev.sh
index 90336cf..48c4c68 100755
--- a/scripts/install-dev.sh
+++ b/scripts/install-dev.sh
@@ -292,7 +292,6 @@ dev_local_install() {
   dev_local_prompt_config
 
   export RUNEVAULT_LOCAL_BINARY="$LOCAL_BINARY_HOST"
-  export RUNEVAULT_SKIP_VERIFY=1
   export RUNEVAULT_TEAM_NAME
   export RUNEVAULT_ENVECTOR_ENDPOINT
   export RUNEVAULT_ENVECTOR_API_KEY
@@ -554,14 +553,14 @@ dev_csp_upload_and_install() {
     || die "Timed out waiting for SSH. ssh -i ${key_path} ${ssh_user}@${public_ip}"
   success "SSH reachable."
 
-  # 2. Wait for cloud-init-dev to finish (cosign is the last thing it installs).
-  info "Waiting for cloud-init-dev to finish (cosign + apt prereqs)..."
+  # 2. Wait for cloud-init-dev to finish — sentinel file is touched at end of runcmd.
+  info "Waiting for cloud-init-dev to finish (apt prereqs + sentinel)..."
   deadline=$(( $(date +%s) + 600 ))
   local prereqs_ready=0
   while [[ $(date +%s) -lt $deadline ]]; do
     # shellcheck disable=SC2086
     if $ssh_prefix ssh $ssh_opts -i "$key_path" "${ssh_user}@${public_ip}" \
-         "test -x /usr/local/bin/cosign && test -x /usr/bin/openssl" 2>/dev/null; then
+         "test -e /var/run/runevault-dev-ready" 2>/dev/null; then
       prereqs_ready=1
       break
     fi
@@ -590,7 +589,6 @@ dev_csp_upload_and_install() {
   local remote_cmd
   remote_cmd="sudo \
     RUNEVAULT_LOCAL_BINARY=/tmp/runevault-${TARGET_OS}-${TARGET_ARCH} \
-    RUNEVAULT_SKIP_VERIFY=1 \
     RUNEVAULT_TEAM_NAME='${tn}' \
     RUNEVAULT_ENVECTOR_ENDPOINT='${ee}' \
     RUNEVAULT_ENVECTOR_API_KEY='${ek}' \

From 24bdd3da430fb7dca7179ed8d8a2f9d7e2720b7a Mon Sep 17 00:00:00 2001
From: Jeonghwan Lee <jhlee@cryptolab.co.kr>
Date: Thu, 30 Apr 2026 14:38:02 +0900
Subject: [PATCH 23/27] docs: remove stale pyenvector compatibility notes and
 add GCM TODO

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
---
 vault/internal/crypto/metadata.go | 14 ++++++++------
 1 file changed, 8 insertions(+), 6 deletions(-)

diff --git a/vault/internal/crypto/metadata.go b/vault/internal/crypto/metadata.go
index eb880d0..b7bb685 100644
--- a/vault/internal/crypto/metadata.go
+++ b/vault/internal/crypto/metadata.go
@@ -1,13 +1,16 @@
 // Package crypto provides metadata key derivation, AES-256-CTR metadata
-// encryption (wire-compatible with pyenvector.utils.aes), and FHE key
-// lifecycle wrappers around envector-go-sdk.
+// encryption, and FHE key lifecycle wrappers around envector-go-sdk.
 //
-// Wire format for metadata ciphertext (mirrors pyenvector.utils.aes.AESHelper):
+// Wire format for metadata ciphertext:
 //
 //	base64( IV (16 bytes) || ciphertext (variable) )
 //
 // AES-256-CTR is unauthenticated; integrity is enforced by upstream JSON
 // envelopes and HKDF-derived per-agent keys.
+//
+// TODO: migrate to AES-256-GCM (AEAD) — keys are issued directly between
+// rune and rune-vault so there is no external wire-format compatibility
+// constraint. Requires coordinated update of the rune-side encryption path.
 package crypto
 
 import (
@@ -56,9 +59,8 @@ func AgentIDFromToken(token string) string {
 	return hex.EncodeToString(sum[:])[:32]
 }
 
-// EncryptMetadata produces a base64-encoded ciphertext compatible with
-// pyenvector.utils.aes.encrypt_metadata: AES-256-CTR with a random 16-byte
-// IV prefixed to the ciphertext.
+// EncryptMetadata produces a base64-encoded AES-256-CTR ciphertext with a
+// random 16-byte IV prefixed to the ciphertext.
 func EncryptMetadata(plaintext, key []byte) (string, error) {
 	if len(key) != dekLen {
 		return "", ErrInvalidKey

From f36a6a0a975ff856ab7ecc1992832f82528edae2 Mon Sep 17 00:00:00 2001
From: Jeonghwan Lee <jhlee@cryptolab.co.kr>
Date: Thu, 30 Apr 2026 15:01:32 +0900
Subject: [PATCH 24/27] fix: reject permissive secret file modes at config load

checkSecretMode was warning-only, which let runevault.conf, api_key_file,
and team_secret_file slip through with world-readable bits set. Convert
the helper to return an error and propagate it through LoadConfig and
readSecretFile so the daemon refuses to start when any secret file is
looser than 0640. Tests cover both the main config and the
team_secret_file indirection paths.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 vault/internal/server/config.go      | 32 +++++++++++++------------
 vault/internal/server/config_test.go | 36 ++++++++++++++++++++++++++++
 2 files changed, 53 insertions(+), 15 deletions(-)

diff --git a/vault/internal/server/config.go b/vault/internal/server/config.go
index 1ddaeb3..8f0d036 100644
--- a/vault/internal/server/config.go
+++ b/vault/internal/server/config.go
@@ -7,7 +7,6 @@ import (
 	"errors"
 	"fmt"
 	"io/fs"
-	"log/slog"
 	"os"
 	"path/filepath"
 	"strings"
@@ -116,7 +115,9 @@ func LoadConfig(override string) (*Config, error) {
 	}
 	cfg.Source = path
 
-	checkSecretMode(path, "runevault.conf")
+	if err := checkSecretMode(path, "runevault.conf"); err != nil {
+		return nil, err
+	}
 
 	if err := cfg.Resolve(); err != nil {
 		return nil, fmt.Errorf("resolve config %s: %w", path, err)
@@ -145,8 +146,9 @@ func resolveConfigPath(override string) (path string, searched []string, err err
 	return "", searched, fmt.Errorf("config file not found (searched: %s)", strings.Join(searched, ", "))
 }
 
-// Resolve materialises *_file indirections into their inline equivalents
-// and warns about any non-0600 secret files. Idempotent.
+// Resolve materialises *_file indirections into their inline equivalents.
+// Returns an error if any referenced secret file has a permissive mode
+// (anything looser than 0o640). Idempotent.
 func (c *Config) Resolve() error {
 	if c.Envector.APIKeyFile != "" {
 		val, err := readSecretFile(c.Envector.APIKeyFile, "envector.api_key_file")
@@ -168,7 +170,9 @@ func (c *Config) Resolve() error {
 }
 
 func readSecretFile(path, label string) (string, error) {
-	checkSecretMode(path, label)
+	if err := checkSecretMode(path, label); err != nil {
+		return "", err
+	}
 	b, err := os.ReadFile(path)
 	if err != nil {
 		return "", fmt.Errorf("read %s %s: %w", label, path, err)
@@ -176,22 +180,20 @@ func readSecretFile(path, label string) (string, error) {
 	return strings.TrimRight(string(b), "\n"), nil
 }
 
-// checkSecretMode emits a warning (does not fail) if the file mode is
-// less restrictive than 0600. The warning is only written for non-empty
-// paths that exist; missing files are surfaced by the caller's read.
-func checkSecretMode(path, label string) {
+// checkSecretMode returns an error if the file's mode permits any access
+// beyond owner read/write and group read (i.e., any bit outside 0o640).
+// A missing file is treated as "not our problem" — the caller's subsequent
+// read surfaces the not-found error with the right context.
+func checkSecretMode(path, label string) error {
 	info, err := os.Stat(path)
 	if err != nil {
-		return
+		return nil
 	}
 	mode := info.Mode().Perm()
 	if mode&^expectedSecretMode != 0 {
-		slog.Warn("config: secret file mode is too permissive",
-			"label", label,
-			"path", path,
-			"mode", fmt.Sprintf("%04o", mode),
-			"expected", "0640")
+		return fmt.Errorf("config: %s %s mode %04o is too permissive (expected at most 0640)", label, path, mode)
 	}
+	return nil
 }
 
 // Redact returns a copy of c with secret fields replaced by sentinel
diff --git a/vault/internal/server/config_test.go b/vault/internal/server/config_test.go
index c791341..85d8f60 100644
--- a/vault/internal/server/config_test.go
+++ b/vault/internal/server/config_test.go
@@ -150,6 +150,42 @@ func TestLoadConfigTeamSecretFileIndirection(t *testing.T) {
 	}
 }
 
+func TestLoadConfigRejectsWorldReadableConfig(t *testing.T) {
+	path := writeConfig(t, minimalValidConfig(t))
+	if err := os.Chmod(path, 0o644); err != nil {
+		t.Fatal(err)
+	}
+	_, err := LoadConfig(path)
+	if err == nil {
+		t.Fatal("expected error for world-readable config, got nil")
+	}
+	if !strings.Contains(err.Error(), "too permissive") {
+		t.Errorf("err missing 'too permissive': %v", err)
+	}
+}
+
+func TestLoadConfigRejectsWorldReadableSecretFile(t *testing.T) {
+	dir := t.TempDir()
+	secretFile := filepath.Join(dir, "team.secret")
+	if err := os.WriteFile(secretFile, []byte("file-team-secret"), 0o644); err != nil {
+		t.Fatal(err)
+	}
+	body := strings.Replace(
+		minimalValidConfig(t),
+		"  team_secret: inline-team-secret-deadbeef",
+		"  team_secret_file: "+secretFile,
+		1,
+	)
+	path := writeConfig(t, body)
+	_, err := LoadConfig(path)
+	if err == nil {
+		t.Fatal("expected error for world-readable team_secret_file, got nil")
+	}
+	if !strings.Contains(err.Error(), "too permissive") {
+		t.Errorf("err missing 'too permissive': %v", err)
+	}
+}
+
 func TestLoadConfigSecretFileMissing(t *testing.T) {
 	body := strings.Replace(
 		minimalValidConfig(t),

From c526b26a9d9c0b4ecf9c7019a3dd173823bf93bf Mon Sep 17 00:00:00 2001
From: Jeonghwan Lee <jhlee@cryptolab.co.kr>
Date: Thu, 30 Apr 2026 15:02:06 +0900
Subject: [PATCH 25/27] fix: return gRPC status errors from Decrypt handlers

DecryptScores and DecryptMetadata previously returned the in-band
.Error field but a nil gRPC status on five paths (base64 decode, FHE
decrypt, JSON envelope decode, DEK derivation, metadata decrypt, and
the missing-team-secret guard). Clients that key on standard gRPC
codes silently missed those failures. Map each path to InvalidArgument
or Internal so the wire-level status is consistent with the rest of
the handler set.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 vault/internal/server/grpc.go      | 12 ++++++------
 vault/internal/server/grpc_test.go |  4 ++--
 2 files changed, 8 insertions(+), 8 deletions(-)

diff --git a/vault/internal/server/grpc.go b/vault/internal/server/grpc.go
index 8625f69..aff2758 100644
--- a/vault/internal/server/grpc.go
+++ b/vault/internal/server/grpc.go
@@ -208,7 +208,7 @@ func (s *VaultGRPC) DecryptScores(ctx context.Context, req *pb.DecryptScoresRequ
 		statusStr = "error"
 		msg := fmt.Sprintf("Deserialization failed: %s", err.Error())
 		errDetail = &msg
-		return &pb.DecryptScoresResponse{Error: msg}, nil
+		return &pb.DecryptScoresResponse{Error: msg}, status.Error(codes.InvalidArgument, msg)
 	}
 	if s.v.keys == nil {
 		statusStr = "error"
@@ -221,7 +221,7 @@ func (s *VaultGRPC) DecryptScores(ctx context.Context, req *pb.DecryptScoresRequ
 		statusStr = "error"
 		msg := err.Error()
 		errDetail = &msg
-		return &pb.DecryptScoresResponse{Error: msg}, nil
+		return &pb.DecryptScoresResponse{Error: msg}, status.Error(codes.Internal, msg)
 	}
 	entries := topK_FromShards(scores2D, shardIdx, int(topK))
 	resultCount = len(entries)
@@ -300,7 +300,7 @@ func (s *VaultGRPC) DecryptMetadata(ctx context.Context, req *pb.DecryptMetadata
 		statusStr = "error"
 		msg := "VAULT_TEAM_SECRET not configured"
 		errDetail = &msg
-		return &pb.DecryptMetadataResponse{Error: msg}, nil
+		return &pb.DecryptMetadataResponse{Error: msg}, status.Error(codes.Internal, msg)
 	}
 
 	out := make([]string, 0, len(req.GetEncryptedMetadataList()))
@@ -310,21 +310,21 @@ func (s *VaultGRPC) DecryptMetadata(ctx context.Context, req *pb.DecryptMetadata
 			statusStr = "error"
 			msg := fmt.Sprintf("Metadata decryption failed: %s", err.Error())
 			errDetail = &msg
-			return &pb.DecryptMetadataResponse{Error: msg}, nil
+			return &pb.DecryptMetadataResponse{Error: msg}, status.Error(codes.InvalidArgument, msg)
 		}
 		dek, err := crypto.DeriveAgentKey(s.v.cfg.Tokens.TeamSecret, env.AgentID)
 		if err != nil {
 			statusStr = "error"
 			msg := fmt.Sprintf("Metadata decryption failed: %s", err.Error())
 			errDetail = &msg
-			return &pb.DecryptMetadataResponse{Error: msg}, nil
+			return &pb.DecryptMetadataResponse{Error: msg}, status.Error(codes.Internal, msg)
 		}
 		pt, err := crypto.DecryptMetadata(env.Cipher, dek)
 		if err != nil {
 			statusStr = "error"
 			msg := fmt.Sprintf("Metadata decryption failed: %s", err.Error())
 			errDetail = &msg
-			return &pb.DecryptMetadataResponse{Error: msg}, nil
+			return &pb.DecryptMetadataResponse{Error: msg}, status.Error(codes.Internal, msg)
 		}
 		out = append(out, string(pt))
 	}
diff --git a/vault/internal/server/grpc_test.go b/vault/internal/server/grpc_test.go
index 391b266..f9ca24b 100644
--- a/vault/internal/server/grpc_test.go
+++ b/vault/internal/server/grpc_test.go
@@ -166,8 +166,8 @@ func TestDecryptMetadataMalformedEnvelope(t *testing.T) {
 		Token:                 tokens.DemoToken,
 		EncryptedMetadataList: []string{"not-json"},
 	})
-	if err != nil {
-		t.Fatalf("unexpected err: %v", err)
+	if status.Code(err) != codes.InvalidArgument {
+		t.Errorf("code = %v, want InvalidArgument", status.Code(err))
 	}
 	if !strings.Contains(resp.GetError(), "Metadata decryption failed") {
 		t.Errorf("error = %q, want 'Metadata decryption failed'", resp.GetError())

From 9888411ff252224fd7d8b86d34492b1cbb1c4811 Mon Sep 17 00:00:00 2001
From: Jeonghwan Lee <jhlee@cryptolab.co.kr>
Date: Thu, 30 Apr 2026 15:02:43 +0900
Subject: [PATCH 26/27] refactor: drop admin /shutdown and /restart endpoints
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Daemon lifecycle belongs to the OS service manager (systemd / launchd),
not to the admin socket. The endpoints duplicated systemctl and
launchctl, and the runevault-group permission model meant any group
member could trigger a process kill — too broad for a control plane.

Remove POST /shutdown and POST /restart from buildAdminMux, drop the
matching onShutdown plumbing in AdminFromConfig, delete
Vault.RequestRestart / RestartRequested, ErrRestartRequested, and the
restart-aware exit branch in main. Operators stop and restart via
systemctl / launchctl, which the install scripts already document.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
---
 vault/cmd/main.go                   |  9 +-------
 vault/internal/server/admin.go      | 32 ++++-------------------------
 vault/internal/server/admin_test.go |  2 +-
 vault/internal/server/grpc.go       | 13 ------------
 vault/internal/server/serve.go      |  9 --------
 5 files changed, 6 insertions(+), 59 deletions(-)

diff --git a/vault/cmd/main.go b/vault/cmd/main.go
index bd1b0be..0850431 100644
--- a/vault/cmd/main.go
+++ b/vault/cmd/main.go
@@ -1,22 +1,15 @@
 package main
 
 import (
-	"errors"
 	"fmt"
 	"os"
 
 	"github.com/CryptoLabInc/rune-admin/vault/internal/commands"
-	"github.com/CryptoLabInc/rune-admin/vault/internal/server"
 )
 
 func main() {
 	if err := commands.Execute(); err != nil {
-		// ErrRestartRequested is intentional: exit 1 silently so the service
-		// manager (systemd Restart=on-failure / launchd KeepAlive) restarts
-		// the process without noisy stderr output.
-		if !errors.Is(err, server.ErrRestartRequested) {
-			fmt.Fprintln(os.Stderr, err)
-		}
+		fmt.Fprintln(os.Stderr, err)
 		os.Exit(1)
 	}
 }
diff --git a/vault/internal/server/admin.go b/vault/internal/server/admin.go
index a04ea15..ca74b78 100644
--- a/vault/internal/server/admin.go
+++ b/vault/internal/server/admin.go
@@ -53,13 +53,7 @@ func AdminFromConfig(ctx context.Context, v *Vault) (func(context.Context) error
 		return nil, fmt.Errorf("admin: chmod socket: %w", err)
 	}
 
-	onShutdown := func() {
-		go func() {
-			time.Sleep(100 * time.Millisecond) // let response flush
-			_ = syscall.Kill(os.Getpid(), syscall.SIGTERM)
-		}()
-	}
-	mux := buildAdminMux(v, onShutdown)
+	mux := buildAdminMux(v)
 	srv := &http.Server{
 		Handler:           mux,
 		ReadHeaderTimeout: 5 * time.Second,
@@ -83,33 +77,15 @@ func AdminFromConfig(ctx context.Context, v *Vault) (func(context.Context) error
 }
 
 // buildAdminMux wires the admin route table. Exposed for tests.
-// onShutdown is called (in a goroutine, after response) when POST /shutdown is
-// received; pass nil to disable the endpoint (tests).
-func buildAdminMux(v *Vault, onShutdown func()) http.Handler {
+// Daemon lifecycle (start/stop/restart) is owned by the OS service manager
+// (systemd / launchd) and is intentionally not exposed over the admin socket.
+func buildAdminMux(v *Vault) http.Handler {
 	mux := http.NewServeMux()
 
 	mux.HandleFunc("GET /health", func(w http.ResponseWriter, r *http.Request) {
 		writeJSON(w, http.StatusOK, map[string]string{"status": "ok"})
 	})
 
-	mux.HandleFunc("POST /shutdown", func(w http.ResponseWriter, r *http.Request) {
-		if onShutdown == nil {
-			writeError(w, http.StatusNotImplemented, "shutdown not enabled")
-			return
-		}
-		writeJSON(w, http.StatusOK, map[string]string{"message": "shutdown initiated"})
-		onShutdown()
-	})
-
-	mux.HandleFunc("POST /restart", func(w http.ResponseWriter, r *http.Request) {
-		if onShutdown == nil {
-			writeError(w, http.StatusNotImplemented, "restart not enabled")
-			return
-		}
-		writeJSON(w, http.StatusOK, map[string]string{"message": "restart initiated"})
-		v.RequestRestart()
-		onShutdown()
-	})
 	mux.HandleFunc("GET /tokens", func(w http.ResponseWriter, r *http.Request) {
 		writeJSON(w, http.StatusOK, map[string]any{"tokens": v.Tokens().ListTokens()})
 	})
diff --git a/vault/internal/server/admin_test.go b/vault/internal/server/admin_test.go
index e84d55b..a1a7726 100644
--- a/vault/internal/server/admin_test.go
+++ b/vault/internal/server/admin_test.go
@@ -32,7 +32,7 @@ func newAdminTestVault(t *testing.T) *Vault {
 func adminTestServer(t *testing.T) (*httptest.Server, *Vault) {
 	t.Helper()
 	v := newAdminTestVault(t)
-	ts := httptest.NewServer(buildAdminMux(v, nil))
+	ts := httptest.NewServer(buildAdminMux(v))
 	t.Cleanup(ts.Close)
 	return ts, v
 }
diff --git a/vault/internal/server/grpc.go b/vault/internal/server/grpc.go
index aff2758..cb05a13 100644
--- a/vault/internal/server/grpc.go
+++ b/vault/internal/server/grpc.go
@@ -7,7 +7,6 @@ import (
 	"errors"
 	"fmt"
 	"sort"
-	"sync/atomic"
 	"time"
 
 	"google.golang.org/grpc/codes"
@@ -34,11 +33,6 @@ type Vault struct {
 	// Cached bundle pieces from disk. Re-read on demand to pick up
 	// rotated keys without restarting; kept here for zero-copy reuse.
 	bundleParams crypto.KeysParams
-
-	// restartRequested is set by the admin /restart endpoint so that
-	// Serve can return ErrRestartRequested and the process exits with
-	// code 1, triggering service-manager (systemd/launchd) restart.
-	restartRequested atomic.Bool
 }
 
 // NewVault wires all subsystems together. Caller is responsible for Close.
@@ -65,13 +59,6 @@ func defaultKeyID(_ *Config) string {
 // Tokens exposes the token store for the admin UDS server.
 func (v *Vault) Tokens() *tokens.Store { return v.tokens }
 
-// RequestRestart marks the vault for restart. Serve returns ErrRestartRequested
-// after the current shutdown sequence completes.
-func (v *Vault) RequestRestart() { v.restartRequested.Store(true) }
-
-// RestartRequested reports whether RequestRestart was called.
-func (v *Vault) RestartRequested() bool { return v.restartRequested.Load() }
-
 // Config exposes the resolved config (e.g., for status reporting).
 func (v *Vault) Config() *Config { return v.cfg }
 
diff --git a/vault/internal/server/serve.go b/vault/internal/server/serve.go
index 7e02e94..97def9e 100644
--- a/vault/internal/server/serve.go
+++ b/vault/internal/server/serve.go
@@ -21,12 +21,6 @@ import (
 	pb "github.com/CryptoLabInc/rune-admin/vault/pkg/vaultpb"
 )
 
-// ErrRestartRequested is returned by Serve when the admin POST /restart
-// endpoint was called. The caller (daemon start) should propagate this as a
-// non-zero exit so the service manager (systemd Restart=on-failure / launchd
-// KeepAlive) restarts the process.
-var ErrRestartRequested = errors.New("restart requested by admin socket")
-
 // Serve starts the gRPC + admin UDS listeners with the given Vault and
 // blocks until ctx is cancelled or a SIGTERM/SIGINT is received. The
 // admin listener is constructed by AdminFactory; passing nil disables the
@@ -121,9 +115,6 @@ func Serve(ctx context.Context, v *Vault, adminFactory AdminFactory) error {
 		defer cancel()
 		_ = adminShutdown(shCtx)
 	}
-	if v.RestartRequested() {
-		return ErrRestartRequested
-	}
 	return nil
 }
 

From ad52b6bd549daab869b67fceff6d1a47ce35682e Mon Sep 17 00:00:00 2001
From: Jeonghwan Lee <jhlee@cryptolab.co.kr>
Date: Wed, 6 May 2026 14:50:25 +0900
Subject: [PATCH 27/27] refactor: rename GetPublicKey to GetAgentManifest, drop
 EvalKey from manifest
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

- Proto: GetPublicKey → GetAgentManifest, key_bundle_json → manifest_json
- crypto: ReadPublicKeyBundle → ReadEncKey (string return, no EvalKey read)
- buildBundle: remove EvalKey.json field; avoid unnecessary multi-MB disk read
- Update interceptor method map, type switch, and all tests
---
 vault/internal/crypto/keys.go              | 24 ++-----
 vault/internal/crypto/keys_test.go         |  6 +-
 vault/internal/server/grpc.go              | 27 ++++----
 vault/internal/server/grpc_test.go         |  4 +-
 vault/internal/server/interceptors.go      |  8 +--
 vault/internal/server/interceptors_test.go | 14 ++--
 vault/pkg/vaultpb/vault_service.pb.go      | 78 +++++++++++-----------
 vault/pkg/vaultpb/vault_service_grpc.pb.go | 38 +++++------
 vault/proto/vault_service.proto            | 14 ++--
 9 files changed, 100 insertions(+), 113 deletions(-)

diff --git a/vault/internal/crypto/keys.go b/vault/internal/crypto/keys.go
index bfa74ce..0374e62 100644
--- a/vault/internal/crypto/keys.go
+++ b/vault/internal/crypto/keys.go
@@ -86,26 +86,14 @@ func (f *EnvectorKeys) Decrypt(blob []byte) (scores [][]float64, shardIdx []int3
 	return f.keys.Decrypt(blob)
 }
 
-// PublicKeyBundle reads EncKey.json and EvalKey.json file contents from
-// disk. The strings are returned verbatim for inclusion in the GetPublicKey
-// gRPC response — clients re-parse them with their own SDK.
-type PublicKeyBundle struct {
-	EncKey  string
-	EvalKey string
-}
-
-func ReadPublicKeyBundle(p KeysParams) (*PublicKeyBundle, error) {
-	encPath := filepath.Join(p.keyDir(), "EncKey.json")
-	evalPath := filepath.Join(p.keyDir(), "EvalKey.json")
-	enc, err := os.ReadFile(encPath)
-	if err != nil {
-		return nil, fmt.Errorf("crypto: read EncKey.json: %w", err)
-	}
-	eval, err := os.ReadFile(evalPath)
+// ReadEncKey reads EncKey.json from disk and returns its contents verbatim
+// for inclusion in the GetAgentManifest gRPC response.
+func ReadEncKey(p KeysParams) (string, error) {
+	enc, err := os.ReadFile(filepath.Join(p.keyDir(), "EncKey.json"))
 	if err != nil {
-		return nil, fmt.Errorf("crypto: read EvalKey.json: %w", err)
+		return "", fmt.Errorf("crypto: read EncKey.json: %w", err)
 	}
-	return &PublicKeyBundle{EncKey: string(enc), EvalKey: string(eval)}, nil
+	return string(enc), nil
 }
 
 func (f *EnvectorKeys) Close() error {
diff --git a/vault/internal/crypto/keys_test.go b/vault/internal/crypto/keys_test.go
index fdbaebd..ce36329 100644
--- a/vault/internal/crypto/keys_test.go
+++ b/vault/internal/crypto/keys_test.go
@@ -27,10 +27,10 @@ func TestOpenSecretKeyMissingReturnsError(t *testing.T) {
 	}
 }
 
-func TestReadPublicKeyBundleMissingReturnsError(t *testing.T) {
+func TestReadEncKeyMissingReturnsError(t *testing.T) {
 	p := KeysParams{Root: t.TempDir(), KeyID: "vault-key", Dim: 1024}
-	if _, err := ReadPublicKeyBundle(p); err == nil {
-		t.Error("ReadPublicKeyBundle on missing keys returned nil error")
+	if _, err := ReadEncKey(p); err == nil {
+		t.Error("ReadEncKey on missing keys returned nil error")
 	}
 }
 
diff --git a/vault/internal/server/grpc.go b/vault/internal/server/grpc.go
index cb05a13..582724b 100644
--- a/vault/internal/server/grpc.go
+++ b/vault/internal/server/grpc.go
@@ -18,7 +18,7 @@ import (
 	pb "github.com/CryptoLabInc/rune-admin/vault/pkg/vaultpb"
 )
 
-// MaxMessageSize bounds gRPC frames. EvalKey alone can be tens of MB.
+// MaxMessageSize bounds gRPC frames.
 const MaxMessageSize = 256 * 1024 * 1024
 
 // Vault is the runtime container shared by all RPC handlers and the
@@ -79,9 +79,9 @@ type VaultGRPC struct {
 
 func NewVaultGRPC(v *Vault) *VaultGRPC { return &VaultGRPC{v: v} }
 
-// ── GetPublicKey ──────────────────────────────────────────────────
+// ── GetAgentManifest ─────────────────────────────────────────────
 
-func (s *VaultGRPC) GetPublicKey(ctx context.Context, req *pb.GetPublicKeyRequest) (*pb.GetPublicKeyResponse, error) {
+func (s *VaultGRPC) GetAgentManifest(ctx context.Context, req *pb.GetAgentManifestRequest) (*pb.GetAgentManifestResponse, error) {
 	start := time.Now()
 	user := s.v.tokens.GetUsername(req.GetToken())
 	if user == "" {
@@ -91,21 +91,21 @@ func (s *VaultGRPC) GetPublicKey(ctx context.Context, req *pb.GetPublicKeyReques
 	statusStr := "success"
 	var errDetail *string
 	defer func() {
-		s.emit(ctx, "get_public_key", user, nil, resultCount, statusStr, errDetail, time.Since(start))
+		s.emit(ctx, "get_agent_manifest", user, nil, resultCount, statusStr, errDetail, time.Since(start))
 	}()
 
 	username, role, err := s.v.tokens.Validate(req.GetToken())
 	if err != nil {
 		st, msg := mapTokenError(err)
 		statusStr, errDetail = errStatus(err)
-		return &pb.GetPublicKeyResponse{Error: msg}, status.Error(st, msg)
+		return &pb.GetAgentManifestResponse{Error: msg}, status.Error(st, msg)
 	}
 	user = username
 	if err := role.CheckScope("get_public_key"); err != nil {
 		statusStr = "denied"
 		ed := err.Error()
 		errDetail = &ed
-		return &pb.GetPublicKeyResponse{Error: err.Error()}, status.Error(codes.PermissionDenied, err.Error())
+		return &pb.GetAgentManifestResponse{Error: err.Error()}, status.Error(codes.PermissionDenied, err.Error())
 	}
 
 	bundle, err := s.v.buildBundle(req.GetToken())
@@ -113,30 +113,29 @@ func (s *VaultGRPC) GetPublicKey(ctx context.Context, req *pb.GetPublicKeyReques
 		statusStr = "error"
 		ed := err.Error()
 		errDetail = &ed
-		return &pb.GetPublicKeyResponse{Error: err.Error()}, status.Error(codes.Internal, err.Error())
+		return &pb.GetAgentManifestResponse{Error: err.Error()}, status.Error(codes.Internal, err.Error())
 	}
 	js, err := json.Marshal(bundle)
 	if err != nil {
 		statusStr = "error"
 		ed := err.Error()
 		errDetail = &ed
-		return &pb.GetPublicKeyResponse{Error: err.Error()}, status.Error(codes.Internal, err.Error())
+		return &pb.GetAgentManifestResponse{Error: err.Error()}, status.Error(codes.Internal, err.Error())
 	}
 	resultCount = 1
-	return &pb.GetPublicKeyResponse{KeyBundleJson: string(js)}, nil
+	return &pb.GetAgentManifestResponse{ManifestJson: string(js)}, nil
 }
 
-// buildBundle assembles the per-token JSON bundle returned by GetPublicKey.
+// buildBundle assembles the per-token JSON manifest returned by GetAgentManifest.
 // Order of keys is irrelevant — clients parse by name.
 func (s *Vault) buildBundle(token string) (map[string]any, error) {
-	pub, err := crypto.ReadPublicKeyBundle(s.bundleParams)
+	encKey, err := crypto.ReadEncKey(s.bundleParams)
 	if err != nil {
 		return nil, err
 	}
 	bundle := map[string]any{
-		"EncKey.json":  pub.EncKey,
-		"EvalKey.json": pub.EvalKey,
-		"key_id":       s.bundleParams.KeyID,
+		"EncKey.json": encKey,
+		"key_id":      s.bundleParams.KeyID,
 	}
 	if s.cfg.Keys.IndexName != "" {
 		bundle["index_name"] = s.cfg.Keys.IndexName
diff --git a/vault/internal/server/grpc_test.go b/vault/internal/server/grpc_test.go
index f9ca24b..8b913c9 100644
--- a/vault/internal/server/grpc_test.go
+++ b/vault/internal/server/grpc_test.go
@@ -103,10 +103,10 @@ func newTestVault(t *testing.T) *Vault {
 	return NewVault(cfg, store, nil, audit)
 }
 
-func TestGetPublicKeyInvalidToken(t *testing.T) {
+func TestGetAgentManifestInvalidToken(t *testing.T) {
 	v := newTestVault(t)
 	srv := NewVaultGRPC(v)
-	resp, err := srv.GetPublicKey(context.Background(), &pb.GetPublicKeyRequest{
+	resp, err := srv.GetAgentManifest(context.Background(), &pb.GetAgentManifestRequest{
 		Token: "evt_ffffffffffffffffffffffffffffffff",
 	})
 	if status.Code(err) != codes.Unauthenticated {
diff --git a/vault/internal/server/interceptors.go b/vault/internal/server/interceptors.go
index eea9c7c..6de1fd8 100644
--- a/vault/internal/server/interceptors.go
+++ b/vault/internal/server/interceptors.go
@@ -19,9 +19,9 @@ import (
 // vaultMethods enumerates the gRPC method paths owned by VaultService.
 // Other services routed through the same gRPC server bypass runtime checks.
 var vaultMethods = map[string]bool{
-	"/rune.vault.v1.VaultService/GetPublicKey":    true,
-	"/rune.vault.v1.VaultService/DecryptScores":   true,
-	"/rune.vault.v1.VaultService/DecryptMetadata": true,
+	"/rune.vault.v1.VaultService/GetAgentManifest": true,
+	"/rune.vault.v1.VaultService/DecryptScores":    true,
+	"/rune.vault.v1.VaultService/DecryptMetadata":  true,
 }
 
 // NewValidationInterceptor returns a unary server interceptor that runs
@@ -55,7 +55,7 @@ func NewValidationInterceptor() (grpc.UnaryServerInterceptor, error) {
 func runtimeCheckToken(req any) error {
 	var token string
 	switch r := req.(type) {
-	case *pb.GetPublicKeyRequest:
+	case *pb.GetAgentManifestRequest:
 		token = r.GetToken()
 	case *pb.DecryptScoresRequest:
 		token = r.GetToken()
diff --git a/vault/internal/server/interceptors_test.go b/vault/internal/server/interceptors_test.go
index 4d66d66..f30021a 100644
--- a/vault/internal/server/interceptors_test.go
+++ b/vault/internal/server/interceptors_test.go
@@ -52,8 +52,8 @@ func vaultMethodInfo(name string) *grpc.UnaryServerInfo {
 
 func TestInterceptorPassesValidRequest(t *testing.T) {
 	ic := mustInterceptor(t)
-	req := &pb.GetPublicKeyRequest{Token: "evt_0123456789abcdef0123456789abcdef"}
-	out, err := ic(context.Background(), req, vaultMethodInfo("GetPublicKey"), noopHandler)
+	req := &pb.GetAgentManifestRequest{Token: "evt_0123456789abcdef0123456789abcdef"}
+	out, err := ic(context.Background(), req, vaultMethodInfo("GetAgentManifest"), noopHandler)
 	if err != nil {
 		t.Fatalf("err = %v, want nil", err)
 	}
@@ -65,8 +65,8 @@ func TestInterceptorPassesValidRequest(t *testing.T) {
 func TestInterceptorRejectsBadProtovalidate(t *testing.T) {
 	ic := mustInterceptor(t)
 	// Token shorter than 36 fails the proto-level constraint.
-	req := &pb.GetPublicKeyRequest{Token: "too_short"}
-	_, err := ic(context.Background(), req, vaultMethodInfo("GetPublicKey"), noopHandler)
+	req := &pb.GetAgentManifestRequest{Token: "too_short"}
+	_, err := ic(context.Background(), req, vaultMethodInfo("GetAgentManifest"), noopHandler)
 	if err == nil {
 		t.Fatal("err = nil, want validation error")
 	}
@@ -79,11 +79,11 @@ func TestInterceptorRejectsControlCharToken(t *testing.T) {
 	ic := mustInterceptor(t)
 	// 36-char token containing a control byte (\x00) inside.
 	// protovalidate only checks length, so the runtime layer catches this.
-	req := &pb.GetPublicKeyRequest{Token: "evt_0123456789abcdef0123456789abc\x00ef"}
+	req := &pb.GetAgentManifestRequest{Token: "evt_0123456789abcdef0123456789abc\x00ef"}
 	if len(req.Token) != 36 {
 		t.Fatalf("test setup: token length = %d, want 36", len(req.Token))
 	}
-	_, err := ic(context.Background(), req, vaultMethodInfo("GetPublicKey"), noopHandler)
+	_, err := ic(context.Background(), req, vaultMethodInfo("GetAgentManifest"), noopHandler)
 	if err == nil {
 		t.Fatal("err = nil, want runtime error")
 	}
@@ -97,7 +97,7 @@ func TestInterceptorAllowsNonVaultMethod(t *testing.T) {
 	// Whitespace-around token would normally fail runtime check, but
 	// non-Vault methods skip runtime checks (and the proto for this
 	// dummy message doesn't apply).
-	req := &pb.GetPublicKeyRequest{Token: "evt_0123456789abcdef0123456789abcdef"}
+	req := &pb.GetAgentManifestRequest{Token: "evt_0123456789abcdef0123456789abcdef"}
 	info := &grpc.UnaryServerInfo{FullMethod: "/grpc.health.v1.Health/Check"}
 	if _, err := ic(context.Background(), req, info, noopHandler); err != nil {
 		t.Errorf("non-vault method blocked: %v", err)
diff --git a/vault/pkg/vaultpb/vault_service.pb.go b/vault/pkg/vaultpb/vault_service.pb.go
index e2ba23d..0ecb708 100644
--- a/vault/pkg/vaultpb/vault_service.pb.go
+++ b/vault/pkg/vaultpb/vault_service.pb.go
@@ -22,7 +22,7 @@ const (
 	_ = protoimpl.EnforceVersion(protoimpl.MaxVersion - 20)
 )
 
-type GetPublicKeyRequest struct {
+type GetAgentManifestRequest struct {
 	state protoimpl.MessageState `protogen:"open.v1"`
 	// Auth token. Required, Fixed 36 chars (evt_ + 32 hex).
 	Token         string `protobuf:"bytes,1,opt,name=token,proto3" json:"token,omitempty"`
@@ -30,20 +30,20 @@ type GetPublicKeyRequest struct {
 	sizeCache     protoimpl.SizeCache
 }
 
-func (x *GetPublicKeyRequest) Reset() {
-	*x = GetPublicKeyRequest{}
+func (x *GetAgentManifestRequest) Reset() {
+	*x = GetAgentManifestRequest{}
 	mi := &file_vault_service_proto_msgTypes[0]
 	ms := protoimpl.X.MessageStateOf(protoimpl.Pointer(x))
 	ms.StoreMessageInfo(mi)
 }
 
-func (x *GetPublicKeyRequest) String() string {
+func (x *GetAgentManifestRequest) String() string {
 	return protoimpl.X.MessageStringOf(x)
 }
 
-func (*GetPublicKeyRequest) ProtoMessage() {}
+func (*GetAgentManifestRequest) ProtoMessage() {}
 
-func (x *GetPublicKeyRequest) ProtoReflect() protoreflect.Message {
+func (x *GetAgentManifestRequest) ProtoReflect() protoreflect.Message {
 	mi := &file_vault_service_proto_msgTypes[0]
 	if x != nil {
 		ms := protoimpl.X.MessageStateOf(protoimpl.Pointer(x))
@@ -55,41 +55,41 @@ func (x *GetPublicKeyRequest) ProtoReflect() protoreflect.Message {
 	return mi.MessageOf(x)
 }
 
-// Deprecated: Use GetPublicKeyRequest.ProtoReflect.Descriptor instead.
-func (*GetPublicKeyRequest) Descriptor() ([]byte, []int) {
+// Deprecated: Use GetAgentManifestRequest.ProtoReflect.Descriptor instead.
+func (*GetAgentManifestRequest) Descriptor() ([]byte, []int) {
 	return file_vault_service_proto_rawDescGZIP(), []int{0}
 }
 
-func (x *GetPublicKeyRequest) GetToken() string {
+func (x *GetAgentManifestRequest) GetToken() string {
 	if x != nil {
 		return x.Token
 	}
 	return ""
 }
 
-type GetPublicKeyResponse struct {
+type GetAgentManifestResponse struct {
 	state protoimpl.MessageState `protogen:"open.v1"`
-	// JSON string: {"EncKey.json": "...", "EvalKey.json": "...", "index_name": "..."}
-	KeyBundleJson string `protobuf:"bytes,1,opt,name=key_bundle_json,json=keyBundleJson,proto3" json:"key_bundle_json,omitempty"`
+	// JSON string: {"EncKey.json": "...", "index_name": "...", "agent_id": "...", ...}
+	ManifestJson  string `protobuf:"bytes,1,opt,name=manifest_json,json=manifestJson,proto3" json:"manifest_json,omitempty"`
 	Error         string `protobuf:"bytes,2,opt,name=error,proto3" json:"error,omitempty"` // Non-empty on error
 	unknownFields protoimpl.UnknownFields
 	sizeCache     protoimpl.SizeCache
 }
 
-func (x *GetPublicKeyResponse) Reset() {
-	*x = GetPublicKeyResponse{}
+func (x *GetAgentManifestResponse) Reset() {
+	*x = GetAgentManifestResponse{}
 	mi := &file_vault_service_proto_msgTypes[1]
 	ms := protoimpl.X.MessageStateOf(protoimpl.Pointer(x))
 	ms.StoreMessageInfo(mi)
 }
 
-func (x *GetPublicKeyResponse) String() string {
+func (x *GetAgentManifestResponse) String() string {
 	return protoimpl.X.MessageStringOf(x)
 }
 
-func (*GetPublicKeyResponse) ProtoMessage() {}
+func (*GetAgentManifestResponse) ProtoMessage() {}
 
-func (x *GetPublicKeyResponse) ProtoReflect() protoreflect.Message {
+func (x *GetAgentManifestResponse) ProtoReflect() protoreflect.Message {
 	mi := &file_vault_service_proto_msgTypes[1]
 	if x != nil {
 		ms := protoimpl.X.MessageStateOf(protoimpl.Pointer(x))
@@ -101,19 +101,19 @@ func (x *GetPublicKeyResponse) ProtoReflect() protoreflect.Message {
 	return mi.MessageOf(x)
 }
 
-// Deprecated: Use GetPublicKeyResponse.ProtoReflect.Descriptor instead.
-func (*GetPublicKeyResponse) Descriptor() ([]byte, []int) {
+// Deprecated: Use GetAgentManifestResponse.ProtoReflect.Descriptor instead.
+func (*GetAgentManifestResponse) Descriptor() ([]byte, []int) {
 	return file_vault_service_proto_rawDescGZIP(), []int{1}
 }
 
-func (x *GetPublicKeyResponse) GetKeyBundleJson() string {
+func (x *GetAgentManifestResponse) GetManifestJson() string {
 	if x != nil {
-		return x.KeyBundleJson
+		return x.ManifestJson
 	}
 	return ""
 }
 
-func (x *GetPublicKeyResponse) GetError() string {
+func (x *GetAgentManifestResponse) GetError() string {
 	if x != nil {
 		return x.Error
 	}
@@ -407,11 +407,11 @@ var File_vault_service_proto protoreflect.FileDescriptor
 
 const file_vault_service_proto_rawDesc = "" +
 	"\n" +
-	"\x13vault_service.proto\x12\rrune.vault.v1\x1a\x1bbuf/validate/validate.proto\"6\n" +
-	"\x13GetPublicKeyRequest\x12\x1f\n" +
-	"\x05token\x18\x01 \x01(\tB\t\xbaH\x06r\x04\x10$\x18$R\x05token\"T\n" +
-	"\x14GetPublicKeyResponse\x12&\n" +
-	"\x0fkey_bundle_json\x18\x01 \x01(\tR\rkeyBundleJson\x12\x14\n" +
+	"\x13vault_service.proto\x12\rrune.vault.v1\x1a\x1bbuf/validate/validate.proto\":\n" +
+	"\x17GetAgentManifestRequest\x12\x1f\n" +
+	"\x05token\x18\x01 \x01(\tB\t\xbaH\x06r\x04\x10$\x18$R\x05token\"U\n" +
+	"\x18GetAgentManifestResponse\x12#\n" +
+	"\rmanifest_json\x18\x01 \x01(\tR\fmanifestJson\x12\x14\n" +
 	"\x05error\x18\x02 \x01(\tR\x05error\"\x8f\x01\n" +
 	"\x14DecryptScoresRequest\x12\x1f\n" +
 	"\x05token\x18\x01 \x01(\tB\t\xbaH\x06r\x04\x10$\x18$R\x05token\x125\n" +
@@ -431,9 +431,9 @@ const file_vault_service_proto_rawDesc = "" +
 	"\x17encrypted_metadata_list\x18\x02 \x03(\tB\x11\xbaH\x0e\x92\x01\v\b\x01\x10\xe8\a\"\x04r\x02\x10\x01R\x15encryptedMetadataList\"^\n" +
 	"\x17DecryptMetadataResponse\x12-\n" +
 	"\x12decrypted_metadata\x18\x01 \x03(\tR\x11decryptedMetadata\x12\x14\n" +
-	"\x05error\x18\x02 \x01(\tR\x05error2\xa5\x02\n" +
-	"\fVaultService\x12W\n" +
-	"\fGetPublicKey\x12\".rune.vault.v1.GetPublicKeyRequest\x1a#.rune.vault.v1.GetPublicKeyResponse\x12Z\n" +
+	"\x05error\x18\x02 \x01(\tR\x05error2\xb1\x02\n" +
+	"\fVaultService\x12c\n" +
+	"\x10GetAgentManifest\x12&.rune.vault.v1.GetAgentManifestRequest\x1a'.rune.vault.v1.GetAgentManifestResponse\x12Z\n" +
 	"\rDecryptScores\x12#.rune.vault.v1.DecryptScoresRequest\x1a$.rune.vault.v1.DecryptScoresResponse\x12`\n" +
 	"\x0fDecryptMetadata\x12%.rune.vault.v1.DecryptMetadataRequest\x1a&.rune.vault.v1.DecryptMetadataResponseb\x06proto3"
 
@@ -451,20 +451,20 @@ func file_vault_service_proto_rawDescGZIP() []byte {
 
 var file_vault_service_proto_msgTypes = make([]protoimpl.MessageInfo, 7)
 var file_vault_service_proto_goTypes = []any{
-	(*GetPublicKeyRequest)(nil),     // 0: rune.vault.v1.GetPublicKeyRequest
-	(*GetPublicKeyResponse)(nil),    // 1: rune.vault.v1.GetPublicKeyResponse
-	(*DecryptScoresRequest)(nil),    // 2: rune.vault.v1.DecryptScoresRequest
-	(*ScoreEntry)(nil),              // 3: rune.vault.v1.ScoreEntry
-	(*DecryptScoresResponse)(nil),   // 4: rune.vault.v1.DecryptScoresResponse
-	(*DecryptMetadataRequest)(nil),  // 5: rune.vault.v1.DecryptMetadataRequest
-	(*DecryptMetadataResponse)(nil), // 6: rune.vault.v1.DecryptMetadataResponse
+	(*GetAgentManifestRequest)(nil),  // 0: rune.vault.v1.GetAgentManifestRequest
+	(*GetAgentManifestResponse)(nil), // 1: rune.vault.v1.GetAgentManifestResponse
+	(*DecryptScoresRequest)(nil),     // 2: rune.vault.v1.DecryptScoresRequest
+	(*ScoreEntry)(nil),               // 3: rune.vault.v1.ScoreEntry
+	(*DecryptScoresResponse)(nil),    // 4: rune.vault.v1.DecryptScoresResponse
+	(*DecryptMetadataRequest)(nil),   // 5: rune.vault.v1.DecryptMetadataRequest
+	(*DecryptMetadataResponse)(nil),  // 6: rune.vault.v1.DecryptMetadataResponse
 }
 var file_vault_service_proto_depIdxs = []int32{
 	3, // 0: rune.vault.v1.DecryptScoresResponse.results:type_name -> rune.vault.v1.ScoreEntry
-	0, // 1: rune.vault.v1.VaultService.GetPublicKey:input_type -> rune.vault.v1.GetPublicKeyRequest
+	0, // 1: rune.vault.v1.VaultService.GetAgentManifest:input_type -> rune.vault.v1.GetAgentManifestRequest
 	2, // 2: rune.vault.v1.VaultService.DecryptScores:input_type -> rune.vault.v1.DecryptScoresRequest
 	5, // 3: rune.vault.v1.VaultService.DecryptMetadata:input_type -> rune.vault.v1.DecryptMetadataRequest
-	1, // 4: rune.vault.v1.VaultService.GetPublicKey:output_type -> rune.vault.v1.GetPublicKeyResponse
+	1, // 4: rune.vault.v1.VaultService.GetAgentManifest:output_type -> rune.vault.v1.GetAgentManifestResponse
 	4, // 5: rune.vault.v1.VaultService.DecryptScores:output_type -> rune.vault.v1.DecryptScoresResponse
 	6, // 6: rune.vault.v1.VaultService.DecryptMetadata:output_type -> rune.vault.v1.DecryptMetadataResponse
 	4, // [4:7] is the sub-list for method output_type
diff --git a/vault/pkg/vaultpb/vault_service_grpc.pb.go b/vault/pkg/vaultpb/vault_service_grpc.pb.go
index 7108750..8d48049 100644
--- a/vault/pkg/vaultpb/vault_service_grpc.pb.go
+++ b/vault/pkg/vaultpb/vault_service_grpc.pb.go
@@ -19,9 +19,9 @@ import (
 const _ = grpc.SupportPackageIsVersion9
 
 const (
-	VaultService_GetPublicKey_FullMethodName    = "/rune.vault.v1.VaultService/GetPublicKey"
-	VaultService_DecryptScores_FullMethodName   = "/rune.vault.v1.VaultService/DecryptScores"
-	VaultService_DecryptMetadata_FullMethodName = "/rune.vault.v1.VaultService/DecryptMetadata"
+	VaultService_GetAgentManifest_FullMethodName = "/rune.vault.v1.VaultService/GetAgentManifest"
+	VaultService_DecryptScores_FullMethodName    = "/rune.vault.v1.VaultService/DecryptScores"
+	VaultService_DecryptMetadata_FullMethodName  = "/rune.vault.v1.VaultService/DecryptMetadata"
 )
 
 // VaultServiceClient is the client API for VaultService service.
@@ -31,8 +31,8 @@ const (
 // Rune-Vault gRPC service.
 // Holds the FHE secret key and performs all decryption operations.
 type VaultServiceClient interface {
-	// Returns the public key bundle (EncKey, EvalKey, optional team index name).
-	GetPublicKey(ctx context.Context, in *GetPublicKeyRequest, opts ...grpc.CallOption) (*GetPublicKeyResponse, error)
+	// Returns the agent manifest (EncKey, agent credentials, optional team index name).
+	GetAgentManifest(ctx context.Context, in *GetAgentManifestRequest, opts ...grpc.CallOption) (*GetAgentManifestResponse, error)
 	// Decrypts FHE-encrypted similarity scores and applies Top-K filtering.
 	DecryptScores(ctx context.Context, in *DecryptScoresRequest, opts ...grpc.CallOption) (*DecryptScoresResponse, error)
 	// Decrypts a list of AES-encrypted metadata strings.
@@ -47,10 +47,10 @@ func NewVaultServiceClient(cc grpc.ClientConnInterface) VaultServiceClient {
 	return &vaultServiceClient{cc}
 }
 
-func (c *vaultServiceClient) GetPublicKey(ctx context.Context, in *GetPublicKeyRequest, opts ...grpc.CallOption) (*GetPublicKeyResponse, error) {
+func (c *vaultServiceClient) GetAgentManifest(ctx context.Context, in *GetAgentManifestRequest, opts ...grpc.CallOption) (*GetAgentManifestResponse, error) {
 	cOpts := append([]grpc.CallOption{grpc.StaticMethod()}, opts...)
-	out := new(GetPublicKeyResponse)
-	err := c.cc.Invoke(ctx, VaultService_GetPublicKey_FullMethodName, in, out, cOpts...)
+	out := new(GetAgentManifestResponse)
+	err := c.cc.Invoke(ctx, VaultService_GetAgentManifest_FullMethodName, in, out, cOpts...)
 	if err != nil {
 		return nil, err
 	}
@@ -84,8 +84,8 @@ func (c *vaultServiceClient) DecryptMetadata(ctx context.Context, in *DecryptMet
 // Rune-Vault gRPC service.
 // Holds the FHE secret key and performs all decryption operations.
 type VaultServiceServer interface {
-	// Returns the public key bundle (EncKey, EvalKey, optional team index name).
-	GetPublicKey(context.Context, *GetPublicKeyRequest) (*GetPublicKeyResponse, error)
+	// Returns the agent manifest (EncKey, agent credentials, optional team index name).
+	GetAgentManifest(context.Context, *GetAgentManifestRequest) (*GetAgentManifestResponse, error)
 	// Decrypts FHE-encrypted similarity scores and applies Top-K filtering.
 	DecryptScores(context.Context, *DecryptScoresRequest) (*DecryptScoresResponse, error)
 	// Decrypts a list of AES-encrypted metadata strings.
@@ -100,8 +100,8 @@ type VaultServiceServer interface {
 // pointer dereference when methods are called.
 type UnimplementedVaultServiceServer struct{}
 
-func (UnimplementedVaultServiceServer) GetPublicKey(context.Context, *GetPublicKeyRequest) (*GetPublicKeyResponse, error) {
-	return nil, status.Error(codes.Unimplemented, "method GetPublicKey not implemented")
+func (UnimplementedVaultServiceServer) GetAgentManifest(context.Context, *GetAgentManifestRequest) (*GetAgentManifestResponse, error) {
+	return nil, status.Error(codes.Unimplemented, "method GetAgentManifest not implemented")
 }
 func (UnimplementedVaultServiceServer) DecryptScores(context.Context, *DecryptScoresRequest) (*DecryptScoresResponse, error) {
 	return nil, status.Error(codes.Unimplemented, "method DecryptScores not implemented")
@@ -130,20 +130,20 @@ func RegisterVaultServiceServer(s grpc.ServiceRegistrar, srv VaultServiceServer)
 	s.RegisterService(&VaultService_ServiceDesc, srv)
 }
 
-func _VaultService_GetPublicKey_Handler(srv interface{}, ctx context.Context, dec func(interface{}) error, interceptor grpc.UnaryServerInterceptor) (interface{}, error) {
-	in := new(GetPublicKeyRequest)
+func _VaultService_GetAgentManifest_Handler(srv interface{}, ctx context.Context, dec func(interface{}) error, interceptor grpc.UnaryServerInterceptor) (interface{}, error) {
+	in := new(GetAgentManifestRequest)
 	if err := dec(in); err != nil {
 		return nil, err
 	}
 	if interceptor == nil {
-		return srv.(VaultServiceServer).GetPublicKey(ctx, in)
+		return srv.(VaultServiceServer).GetAgentManifest(ctx, in)
 	}
 	info := &grpc.UnaryServerInfo{
 		Server:     srv,
-		FullMethod: VaultService_GetPublicKey_FullMethodName,
+		FullMethod: VaultService_GetAgentManifest_FullMethodName,
 	}
 	handler := func(ctx context.Context, req interface{}) (interface{}, error) {
-		return srv.(VaultServiceServer).GetPublicKey(ctx, req.(*GetPublicKeyRequest))
+		return srv.(VaultServiceServer).GetAgentManifest(ctx, req.(*GetAgentManifestRequest))
 	}
 	return interceptor(ctx, in, info, handler)
 }
@@ -192,8 +192,8 @@ var VaultService_ServiceDesc = grpc.ServiceDesc{
 	HandlerType: (*VaultServiceServer)(nil),
 	Methods: []grpc.MethodDesc{
 		{
-			MethodName: "GetPublicKey",
-			Handler:    _VaultService_GetPublicKey_Handler,
+			MethodName: "GetAgentManifest",
+			Handler:    _VaultService_GetAgentManifest_Handler,
 		},
 		{
 			MethodName: "DecryptScores",
diff --git a/vault/proto/vault_service.proto b/vault/proto/vault_service.proto
index ab00ad3..c3e6a03 100644
--- a/vault/proto/vault_service.proto
+++ b/vault/proto/vault_service.proto
@@ -7,8 +7,8 @@ import "buf/validate/validate.proto";
 // Rune-Vault gRPC service.
 // Holds the FHE secret key and performs all decryption operations.
 service VaultService {
-  // Returns the public key bundle (EncKey, EvalKey, optional team index name).
-  rpc GetPublicKey(GetPublicKeyRequest) returns (GetPublicKeyResponse);
+  // Returns the agent manifest (EncKey, agent credentials, optional team index name).
+  rpc GetAgentManifest(GetAgentManifestRequest) returns (GetAgentManifestResponse);
 
   // Decrypts FHE-encrypted similarity scores and applies Top-K filtering.
   rpc DecryptScores(DecryptScoresRequest) returns (DecryptScoresResponse);
@@ -17,16 +17,16 @@ service VaultService {
   rpc DecryptMetadata(DecryptMetadataRequest) returns (DecryptMetadataResponse);
 }
 
-// ─── GetPublicKey ──────────────────────────────────────────────────
+// ─── GetAgentManifest ─────────────────────────────────────────────
 
-message GetPublicKeyRequest {
+message GetAgentManifestRequest {
   // Auth token. Required, Fixed 36 chars (evt_ + 32 hex).
   string token = 1 [(buf.validate.field).string = {min_len: 36, max_len: 36}];
 }
 
-message GetPublicKeyResponse {
-  // JSON string: {"EncKey.json": "...", "EvalKey.json": "...", "index_name": "..."}
-  string key_bundle_json = 1;
+message GetAgentManifestResponse {
+  // JSON string: {"EncKey.json": "...", "index_name": "...", "agent_id": "...", ...}
+  string manifest_json = 1;
   string error = 2;  // Non-empty on error
 }