chore: pre-migration snapshot
Layer0, MCP servers, Terraform consolidation
layer0/replay.py (new file, 443 lines added)
@@ -0,0 +1,443 @@
from __future__ import annotations

import argparse
import hashlib
import json
import os
import sqlite3
import uuid
from dataclasses import dataclass
from datetime import datetime, timezone
from pathlib import Path
from typing import Any, Iterable

from .pattern_store import PatternStore, write_pattern_snapshot
from .shadow_classifier import Classification, ShadowClassifier

THIS_FILE = Path(__file__).resolve()
LAYER0_DIR = THIS_FILE.parent
REPO_ROOT = LAYER0_DIR.parent.parent


def _utc_now_iso_z() -> str:
    return (
        datetime.now(timezone.utc)
        .replace(microsecond=0)
        .isoformat()
        .replace("+00:00", "Z")
    )
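# Illustrative output: "2026-02-03T12:00:00Z" (second precision, UTC, with the
# "+00:00" offset rewritten as "Z").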


def _default_db_path() -> Path:
    for key in ("LEDGER_DB_PATH", "VAULTMESH_LEDGER_DB"):
        v = (os.environ.get(key) or "").strip()
        if v:
            return Path(v).expanduser().resolve()
    return (REPO_ROOT / ".state" / "ledger.sqlite").resolve()


def _read_jsonl(paths: Iterable[Path], *, limit: int | None) -> list[dict[str, Any]]:
    rows: list[dict[str, Any]] = []
    for path in paths:
        if not path.exists():
            continue
        for line in path.read_text(encoding="utf-8").splitlines():
            line = line.strip()
            if not line:
                continue
            try:
                obj = json.loads(line)
            except Exception:
                continue
            if isinstance(obj, dict):
                rows.append(obj)

    if limit is not None and limit > 0 and len(rows) > limit:
        return rows[-limit:]
    return rows
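# Illustrative telemetry record (assumed shape; only the "query"/"prompt"/
# "input" and "outcome"/"result"/"status" keys are consulted below):
#   {"query": "rm -rf /tmp/scratch", "outcome": "success"}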


def _telemetry_query(event: dict[str, Any]) -> str:
    v = event.get("query") or event.get("prompt") or event.get("input")
    return v if isinstance(v, str) else ""


def _outcome(event: dict[str, Any]) -> str | None:
    v = event.get("outcome") or event.get("result") or event.get("status")
    if isinstance(v, str) and v.strip():
        return v.strip()
    return None


def _ground_truth(event: dict[str, Any]) -> Classification | None:
    outcome = (_outcome(event) or "").lower()
    if outcome in {"success", "ok"}:
        return Classification.BLESSED
    if outcome in {"blocked_by_guardrails", "blocked_by_policy", "blocked", "denied"}:
        return Classification.FORBIDDEN
    if outcome in {"fail_closed", "catastrophic", "blocked_catastrophic"}:
        return Classification.CATASTROPHIC
    return None
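# Ground-truth mapping (events with any other outcome are skipped in scoring):
#   success, ok                                         -> BLESSED
#   blocked_by_guardrails, blocked_by_policy,
#   blocked, denied                                     -> FORBIDDEN
#   fail_closed, catastrophic, blocked_catastrophic     -> CATASTROPHIC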


def _ensure_ledger_schema(conn: sqlite3.Connection) -> None:
    conn.execute(
        """
        CREATE TABLE IF NOT EXISTS migrations (
            id INTEGER PRIMARY KEY,
            name TEXT NOT NULL UNIQUE,
            applied_at TEXT NOT NULL DEFAULT (datetime('now'))
        );
        """
    )
    conn.execute(
        """
        CREATE TABLE IF NOT EXISTS proof_artifacts (
            id TEXT PRIMARY KEY,
            ts TEXT NOT NULL DEFAULT (datetime('now')),
            kind TEXT NOT NULL,
            path TEXT,
            sha256_hex TEXT,
            blake3_hex TEXT,
            size_bytes INTEGER,
            meta_json TEXT,
            trace_id TEXT
        );
        """
    )
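# Both statements use CREATE TABLE IF NOT EXISTS, so _ensure_ledger_schema is
# safe to call on every connection; it never migrates existing columns.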


def _log_artifact(
    *,
    kind: str,
    path: Path | None,
    meta: dict[str, Any],
    trace_id: str | None,
    db_path: Path,
) -> str:
    try:
        from ledger.db import log_proof_artifact  # type: ignore

        return log_proof_artifact(
            kind=kind,
            path=path,
            meta=meta,
            trace_id=trace_id,
            db_path=db_path,
        )
    except Exception:
        pass

    artifact_id = str(uuid.uuid4())
    rel_path: str | None = None
    sha256_hex: str | None = None
    size_bytes: int | None = None

    if path is not None:
        try:
            rel_path = str(path.resolve().relative_to(REPO_ROOT))
        except Exception:
            rel_path = str(path)
        if path.exists() and path.is_file():
            data = path.read_bytes()
            sha256_hex = hashlib.sha256(data).hexdigest()
            size_bytes = len(data)

    db_path.parent.mkdir(parents=True, exist_ok=True)
    conn = sqlite3.connect(str(db_path), isolation_level=None)
    try:
        _ensure_ledger_schema(conn)
        conn.execute(
            """
            INSERT INTO proof_artifacts (
                id, ts, kind, path, sha256_hex, blake3_hex, size_bytes, meta_json, trace_id
            )
            VALUES (?, ?, ?, ?, ?, NULL, ?, ?, ?);
            """,
            (
                artifact_id,
                _utc_now_iso_z(),
                kind,
                rel_path,
                sha256_hex,
                size_bytes,
                json.dumps(meta, ensure_ascii=False, sort_keys=True),
                trace_id,
            ),
        )
    finally:
        conn.close()

    return artifact_id
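# _log_artifact prefers the canonical ledger.db.log_proof_artifact helper when
# it is importable; otherwise it falls back to a direct SQLite insert, hashing
# the file with SHA-256 and leaving blake3_hex NULL.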


def _load_patterns_file(path: Path) -> list[dict[str, Any]]:
    if not path.exists():
        return []
    data = json.loads(path.read_text(encoding="utf-8"))
    items = data.get("patterns") if isinstance(data, dict) else data
    return items if isinstance(items, list) else []


def _merge_patterns(
    active: list[dict[str, Any]], extra: list[dict[str, Any]]
) -> list[dict[str, Any]]:
    """
    Candidate patterns win on identical (mode, tokens_all, classification).
    """

    def key(p: dict[str, Any]) -> tuple[str, tuple[str, ...], str]:
        mode = str(p.get("mode") or "escalate")
        cls = str(p.get("classification") or "")
        tokens = p.get("tokens_all") or p.get("tokens") or []
        if not isinstance(tokens, list):
            tokens = []
        return (mode, tuple(str(t).lower() for t in tokens), cls)

    merged: dict[tuple[str, tuple[str, ...], str], dict[str, Any]] = {}
    for p in active:
        if isinstance(p, dict):
            merged[key(p)] = p
    for p in extra:
        if isinstance(p, dict):
            merged[key(p)] = p
    return list(merged.values())
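# Illustrative (assumed pattern shape): if the active snapshot holds
#   {"mode": "escalate", "tokens_all": ["drop", "prod"], "classification": "forbidden"}
# and a candidate carries the same (mode, tokens_all, classification) key, the
# candidate dict replaces it, because extra is folded in after active.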


@dataclass
class ReplayMetrics:
    total: int
    baseline_false_pos: int
    baseline_false_neg: int
    candidate_false_pos: int
    candidate_false_neg: int
    catastrophic_boundary_unchanged: bool


def _is_false_positive(pred: Classification, truth: Classification) -> bool:
    return truth == Classification.BLESSED and pred in {
        Classification.FORBIDDEN,
        Classification.CATASTROPHIC,
    }


def _is_false_negative(pred: Classification, truth: Classification) -> bool:
    return truth in {
        Classification.FORBIDDEN,
        Classification.CATASTROPHIC,
    } and pred in {
        Classification.BLESSED,
        Classification.AMBIGUOUS,
    }
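# False positive: a BLESSED event the classifier would block (FORBIDDEN or
# CATASTROPHIC). False negative: a FORBIDDEN/CATASTROPHIC event the classifier
# would let through (BLESSED or AMBIGUOUS).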


def _compute_metrics(
    events: list[dict[str, Any]],
    baseline: ShadowClassifier,
    candidate: ShadowClassifier,
) -> ReplayMetrics:
    total = 0
    b_fp = b_fn = 0
    c_fp = c_fn = 0
    catastrophic_ok = True

    for ev in events:
        truth = _ground_truth(ev)
        if truth is None:
            continue
        q = _telemetry_query(ev)
        total += 1

        b = baseline.classify(q).classification
        c = candidate.classify(q).classification

        if _is_false_positive(b, truth):
            b_fp += 1
        if _is_false_negative(b, truth):
            b_fn += 1
        if _is_false_positive(c, truth):
            c_fp += 1
        if _is_false_negative(c, truth):
            c_fn += 1

        if b == Classification.CATASTROPHIC and c != Classification.CATASTROPHIC:
            catastrophic_ok = False

    return ReplayMetrics(
        total=total,
        baseline_false_pos=b_fp,
        baseline_false_neg=b_fn,
        candidate_false_pos=c_fp,
        candidate_false_neg=c_fn,
        catastrophic_boundary_unchanged=catastrophic_ok,
    )
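# The catastrophic boundary check is one-way: the candidate may classify more
# queries as CATASTROPHIC than the baseline, but never fewer. Any query the
# baseline flags CATASTROPHIC that the candidate downgrades fails the replay.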


def main(argv: list[str] | None = None) -> int:
    parser = argparse.ArgumentParser(
        description="Layer0: replay candidate patterns against recent telemetry."
    )
    parser.add_argument(
        "--candidate",
        required=True,
        help="Candidate snapshot JSON (from layer0.learn).",
    )
    parser.add_argument(
        "--telemetry-jsonl",
        action="append",
        default=[],
        help="Path to telemetry JSONL (repeatable). Must include outcome=success|blocked_by_guardrails|... for scoring.",
    )
    parser.add_argument("--limit", type=int, default=2000)
    parser.add_argument(
        "--active",
        type=str,
        default=None,
        help="Active patterns snapshot (defaults to .state).",
    )
    parser.add_argument("--db", type=str, default=None)
    parser.add_argument("--report-out", type=str, default=None)
    parser.add_argument(
        "--promote",
        action="store_true",
        help="If replay passes, write active snapshot update.",
    )
    parser.add_argument(
        "--allow-relaxations",
        action="store_true",
        help="Allow promotion of relaxation-mode patterns (requires replay pass).",
    )
    parser.add_argument("--max-fp-increase", type=int, default=0)
    args = parser.parse_args(argv)

    telemetry_paths = [Path(p).expanduser() for p in args.telemetry_jsonl if p]
    if not telemetry_paths:
        default_preboot = REPO_ROOT / "anomalies" / "preboot_shield.jsonl"
        if default_preboot.exists():
            telemetry_paths = [default_preboot]

    events = _read_jsonl(telemetry_paths, limit=int(args.limit))

    active_path = (
        Path(args.active).expanduser().resolve()
        if args.active
        else PatternStore().active_path
    )
    active_patterns = _load_patterns_file(active_path)
    candidate_path = Path(args.candidate).expanduser().resolve()
    candidate_patterns_all = _load_patterns_file(candidate_path)
    candidate_patterns = [
        p
        for p in candidate_patterns_all
        if isinstance(p, dict)
        and (args.allow_relaxations or str(p.get("mode") or "escalate") != "relax")
    ]

    baseline_classifier = ShadowClassifier(
        pattern_store=PatternStore(active_path=active_path)
    )

    merged = _merge_patterns(active_patterns, candidate_patterns)
    merged_path = (
        REPO_ROOT / ".state" / "layer0_patterns_merged_replay.json"
    ).resolve()
    write_pattern_snapshot(merged_path, merged)
    candidate_classifier = ShadowClassifier(
        pattern_store=PatternStore(active_path=merged_path)
    )

    metrics = _compute_metrics(events, baseline_classifier, candidate_classifier)
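
    # Pass gate, all three conditions required: (1) no catastrophic downgrades,
    # (2) false positives within --max-fp-increase of the baseline, and
    # (3) false negatives no worse than the baseline.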
    passes = (
        metrics.catastrophic_boundary_unchanged
        and metrics.candidate_false_pos
        <= metrics.baseline_false_pos + int(args.max_fp_increase)
        and metrics.candidate_false_neg <= metrics.baseline_false_neg
    )

    report = {
        "generated_at": _utc_now_iso_z(),
        "telemetry_inputs": [str(p) for p in telemetry_paths],
        "candidate_snapshot": str(candidate_path),
        "active_snapshot": str(active_path),
        "merged_snapshot": str(merged_path),
        "allow_relaxations": bool(args.allow_relaxations),
        "max_fp_increase": int(args.max_fp_increase),
        "metrics": {
            "total_scored": metrics.total,
            "baseline_false_positives": metrics.baseline_false_pos,
            "baseline_false_negatives": metrics.baseline_false_neg,
            "candidate_false_positives": metrics.candidate_false_pos,
            "candidate_false_negatives": metrics.candidate_false_neg,
            "catastrophic_boundary_unchanged": metrics.catastrophic_boundary_unchanged,
        },
        "passes": passes,
        "promotion": {
            "requested": bool(args.promote),
            "performed": False,
            "active_written_to": str(active_path),
            "patterns_added": len(candidate_patterns),
        },
    }

    report_out = (
        Path(args.report_out).expanduser().resolve()
        if args.report_out
        else (REPO_ROOT / ".state" / "layer0_shadow_replay_report.json").resolve()
    )
    report_out.parent.mkdir(parents=True, exist_ok=True)
    report_out.write_text(
        json.dumps(report, ensure_ascii=False, sort_keys=True, indent=2) + "\n",
        encoding="utf-8",
    )

    db_path = Path(args.db).expanduser().resolve() if args.db else _default_db_path()
    report_artifact_id = _log_artifact(
        kind="shadow_replay_report",
        path=report_out,
        meta={
            "passes": passes,
            "total_scored": metrics.total,
            "baseline_fp": metrics.baseline_false_pos,
            "baseline_fn": metrics.baseline_false_neg,
            "candidate_fp": metrics.candidate_false_pos,
            "candidate_fn": metrics.candidate_false_neg,
        },
        trace_id=None,
        db_path=db_path,
    )

    if args.promote and passes:
        # Promotion = merged active snapshot (existing + candidates), written atomically.
        tmp_path = active_path.with_suffix(active_path.suffix + ".tmp")
        write_pattern_snapshot(tmp_path, merged)
        tmp_path.replace(active_path)
        promo_artifact_id = _log_artifact(
            kind="shadow_pattern_promotion",
            path=active_path,
            meta={
                "added": len(candidate_patterns),
                "source_candidate": str(candidate_path),
                "merged_snapshot": str(merged_path),
            },
            trace_id=None,
            db_path=db_path,
        )
        report["promotion"]["performed"] = True
        report["promotion"]["artifact_id"] = promo_artifact_id
        report_out.write_text(
            json.dumps(report, ensure_ascii=False, sort_keys=True, indent=2) + "\n",
            encoding="utf-8",
        )

    print(f"Replay report: {report_out} (passes={passes})")
    print(f"Logged artifact {report_artifact_id} to {db_path}")
    if args.promote:
        print(
            f"Promotion {'performed' if passes else 'skipped'}; active={active_path}"
        )
    return 0 if passes else 2


if __name__ == "__main__":
    raise SystemExit(main())
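# Example invocation (illustrative; the candidate path is hypothetical, and
# running via `python -m` from the repo root is assumed so the package's
# relative imports resolve):
#   python -m layer0.replay \
#       --candidate .state/layer0_candidate_patterns.json \
#       --telemetry-jsonl anomalies/preboot_shield.jsonl \
#       --promote
# Exit status: 0 if the replay gate passes, 2 otherwise.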