feat: persist accountability evidence identities

2026-05-24 09:38:57 +02:00
parent 26f1913d51
commit ab7e0ccab1
7 changed files with 771 additions and 5 deletions
--- a/docs/accountability-root-manifest.md
+++ b/docs/accountability-root-manifest.md
@@ -33,6 +33,12 @@ Raw evidence run schema:
 schemas/accountability-root-evidence.schema.yaml
 ```

+Identity projection schema:
+
+```text
+schemas/accountability-identity-projection.schema.yaml
+```
+
 ## Required Sections

 - `netkingdom`: root id, name, and king actor.
@@ -78,3 +84,23 @@ The output is an `AccountabilityRootEvidenceRun`. Every evidence item carries
 provenance, source, fingerprint, `durable: true`, and
 `live_telemetry: false`, preserving the boundary between Fabric evidence and
 operational telemetry.
+
+To normalize raw evidence into reviewable identity candidates:
+
+```bash
+railiance-fabric discover-roots \
+  --identity-projection \
+  --max-items-per-root 200
+```
+
+To persist raw evidence and identity candidates in a local SQLite store:
+
+```bash
+railiance-fabric discover-roots \
+  --store-db .railiance-fabric/accountability-evidence.sqlite3 \
+  --identity-projection
+```
+
+The store is intentionally separate from accepted registry graph snapshots. It
+keeps raw evidence runs, evidence items, and identity candidates available for
+inspection before any candidate is promoted.
--- a/docs/financial-fabric-operator-guide.md
+++ b/docs/financial-fabric-operator-guide.md
@@ -56,6 +56,13 @@ To collect raw evidence from those roots without promoting graph state:
 railiance-fabric discover-roots --max-items-per-root 200
 ```

+To inspect normalized identity candidates or persist a local evidence run:
+
+```bash
+railiance-fabric discover-roots --identity-projection
+railiance-fabric discover-roots --store-db .railiance-fabric/accountability-evidence.sqlite3
+```
+
 The financial export must satisfy these invariants:

 - every accepted node has resolvable ownership;
--- a/railiance_fabric/accountability_roots.py
+++ b/railiance_fabric/accountability_roots.py
@@ -2,14 +2,16 @@ from __future__ import annotations

 import hashlib
 import json
+import sqlite3
 import subprocess
 import urllib.error
 import urllib.request
+from dataclasses import dataclass
 from datetime import datetime, timezone
 from pathlib import Path
 from typing import Any

-from .discovery import short_fingerprint
+from .discovery import normalize_identity_part, short_fingerprint
 from .loader import load_yaml, repo_root
 from .schema_validation import draft202012_validator

@@ -95,6 +97,512 @@ def collect_accountability_root_evidence(
    return result


+def build_identity_projection(
+    evidence_run: dict[str, Any],
+    manifest: dict[str, Any] | None = None,
+) -> dict[str, Any]:
+    """Build an ``AccountabilityIdentityProjection`` document from an evidence run.
+
+    Candidates are first seeded from the manifest (netkingdom, actors, fabrics)
+    with confidence 1.0 and no evidence ids, then every evidence item of the run
+    that maps to an identity is added or merged into the same candidate set.
+
+    Args:
+        evidence_run: Evidence run mapping; its ``manifest`` and ``roots``
+            entries are read.
+        manifest: Manifest mapping. When omitted, it is loaded with validation
+            from the path recorded under ``evidence_run["manifest"]["path"]``.
+
+    Returns:
+        The projection mapping, validated against
+        ``schemas/accountability-identity-projection.schema.yaml``.
+
+    Raises:
+        ValueError: If the generated projection violates that schema.
+    """
+    if manifest is None:
+        recorded_path = evidence_run.get("manifest", {}).get("path")
+        manifest = load_accountability_root_manifest(_resolve_path(recorded_path), validate=True)
+
+    by_key: dict[str, dict[str, Any]] = {}
+
+    # Manifest-declared identities come first so evidence merges into them.
+    kingdom = manifest.get("netkingdom")
+    if isinstance(kingdom, dict) and kingdom:
+        king_actor_id = kingdom.get("king_actor_id")
+        _add_identity_candidate(
+            by_key,
+            identity_type="Netkingdom",
+            label=str(kingdom.get("name") or kingdom.get("id")),
+            graph_id=str(kingdom.get("id")),
+            fabric_id=None,
+            owner_actor_id=str(king_actor_id or ""),
+            evidence_ids=[],
+            aliases=[str(kingdom.get("id") or "")],
+            attributes={"king_actor_id": kingdom.get("king_actor_id", "")},
+            confidence=1.0,
+        )
+
+    for actor in manifest.get("actors", []):
+        if isinstance(actor, dict):
+            actor_id = actor.get("id")
+            _add_identity_candidate(
+                by_key,
+                identity_type="Actor",
+                label=str(actor.get("name") or actor_id),
+                graph_id=str(actor_id),
+                fabric_id=None,
+                owner_actor_id=str(actor_id or ""),
+                evidence_ids=[],
+                aliases=[str(actor_id or ""), str(actor.get("role") or "")],
+                attributes={"role": actor.get("role", "")},
+                confidence=1.0,
+            )
+
+    for fabric in manifest.get("fabrics", []):
+        if isinstance(fabric, dict):
+            fabric_kind = fabric.get("kind")
+            fabric_ident = fabric.get("id")
+            # The tenant takes precedence over the lord as the owning actor.
+            owner = str(fabric.get("tenant_actor_id") or fabric.get("lord_actor_id") or "")
+            _add_identity_candidate(
+                by_key,
+                identity_type=str(fabric_kind or "Fabric"),
+                label=str(fabric.get("name") or fabric_ident),
+                graph_id=str(fabric_ident),
+                fabric_id=str(fabric_ident or ""),
+                subfabric_id=str(fabric_ident) if fabric_kind == "Subfabric" else None,
+                owner_actor_id=owner,
+                evidence_ids=[],
+                aliases=[str(fabric_ident or ""), str(fabric.get("parent_fabric_id") or "")],
+                attributes={
+                    "status": fabric.get("status", ""),
+                    "netkingdom_id": fabric.get("netkingdom_id", ""),
+                    "parent_fabric_id": fabric.get("parent_fabric_id", ""),
+                    "boundary": fabric.get("boundary", {}),
+                },
+                confidence=1.0,
+            )
+
+    # Evidence-derived identities; items that map to no identity are ignored.
+    for root in evidence_run.get("roots", []):
+        if not isinstance(root, dict):
+            continue
+        for item in root.get("evidence", []):
+            identity = _identity_from_evidence(root, item) if isinstance(item, dict) else None
+            if identity is not None:
+                _add_identity_candidate(by_key, **identity)
+
+    reviewed = _mark_ambiguous_identities(list(by_key.values()))
+    graph = _candidate_graph(reviewed, manifest)
+    projection = {
+        "apiVersion": "railiance.fabric/v1alpha2",
+        "kind": "AccountabilityIdentityProjection",
+        "generated_at": _utc_now(),
+        "evidence_run": {
+            "manifest_id": evidence_run.get("manifest", {}).get("id", ""),
+            "manifest_fingerprint": evidence_run.get("manifest", {}).get("fingerprint", ""),
+            "generated_at": evidence_run.get("generated_at", ""),
+        },
+        "identity_candidates": sorted(reviewed, key=lambda candidate: candidate["stable_key"]),
+        "candidate_graph": graph,
+    }
+
+    schema_path = repo_root() / "schemas" / "accountability-identity-projection.schema.yaml"
+    problems = sorted(
+        draft202012_validator(schema_path).iter_errors(projection),
+        key=lambda problem: list(problem.path),
+    )
+    if problems:
+        first = problems[0]
+        location = ".".join(map(str, first.path)) or "<root>"
+        raise ValueError(f"invalid accountability identity projection at {location}: {first.message}")
+    return projection
+
+
+@dataclass(frozen=True)
+class AccountabilityEvidenceStore:
+    """SQLite-backed store for evidence runs, evidence items, and identity candidates.
+
+    Every method opens its own connection through ``_connect`` and closes it
+    before returning. ``sqlite3.Connection`` used as a context manager only
+    commits or rolls back the transaction; it does not close the connection,
+    so the close is done explicitly in ``finally`` blocks.
+    """
+
+    # Database location handed to ``sqlite3.connect``.
+    path: Path
+
+    def init_schema(self) -> None:
+        """Create the store tables and indexes if they do not exist yet."""
+        # NOTE(review): ":memory:" is special-cased here, but each method opens
+        # a fresh connection and SQLite gives every ":memory:" connection its
+        # own private database, so data would not survive between calls --
+        # confirm whether in-memory use is actually expected.
+        if str(self.path) != ":memory:":
+            self.path.parent.mkdir(parents=True, exist_ok=True)
+        db = self._connect()
+        try:
+            with db:
+                db.executescript(
+                    """
+                create table if not exists accountability_evidence_runs (
+                  id integer primary key autoincrement,
+                  manifest_id text not null,
+                  manifest_path text not null,
+                  manifest_fingerprint text not null,
+                  generated_at text not null,
+                  payload_json text not null,
+                  created_at text not null
+                );
+
+                create table if not exists accountability_evidence_items (
+                  id text not null,
+                  run_id integer not null references accountability_evidence_runs(id),
+                  root_id text not null,
+                  evidence_type text not null,
+                  state text not null,
+                  durable integer not null,
+                  live_telemetry integer not null,
+                  fingerprint text not null,
+                  summary text not null,
+                  source_json text not null,
+                  attributes_json text not null,
+                  payload_json text not null,
+                  primary key (id, run_id)
+                );
+
+                create index if not exists idx_accountability_evidence_items_run
+                  on accountability_evidence_items(run_id);
+
+                create table if not exists accountability_identity_candidates (
+                  stable_key text not null,
+                  run_id integer not null references accountability_evidence_runs(id),
+                  identity_type text not null,
+                  label text not null,
+                  fabric_id text,
+                  subfabric_id text,
+                  owner_actor_id text,
+                  review_state text not null,
+                  confidence real not null,
+                  aliases_json text not null,
+                  evidence_ids_json text not null,
+                  attributes_json text not null,
+                  payload_json text not null,
+                  primary key (stable_key, run_id)
+                );
+
+                create index if not exists idx_accountability_identity_candidates_run
+                  on accountability_identity_candidates(run_id);
+                """
+                )
+        finally:
+            db.close()
+
+    def add_evidence_run(
+        self,
+        evidence_run: dict[str, Any],
+        identity_projection: dict[str, Any] | None = None,
+    ) -> dict[str, Any]:
+        """Persist one evidence run, its items, and optionally its identity candidates.
+
+        The run row, item rows, and candidate rows are written in a single
+        transaction: either all of them are committed or none are.
+
+        Args:
+            evidence_run: Evidence run mapping; stored whole as JSON and
+                flattened into one row per evidence item.
+            identity_projection: Optional projection whose
+                ``identity_candidates`` are stored against the same run.
+
+        Returns:
+            A mapping with ``run_id``, ``evidence_count`` and
+            ``identity_candidate_count``.
+        """
+        self.init_schema()
+        created_at = _utc_now()
+        manifest = evidence_run.get("manifest", {})
+        # Collected once and reused for both the inserts and the returned count.
+        items = _iter_evidence_items(evidence_run)
+        candidates = identity_projection.get("identity_candidates", []) if identity_projection else []
+
+        db = self._connect()
+        try:
+            with db:
+                cursor = db.execute(
+                    """
+                insert into accountability_evidence_runs (
+                  manifest_id, manifest_path, manifest_fingerprint, generated_at,
+                  payload_json, created_at
+                ) values (?, ?, ?, ?, ?, ?)
+                """,
+                    (
+                        manifest.get("id", ""),
+                        manifest.get("path", ""),
+                        manifest.get("fingerprint", ""),
+                        evidence_run.get("generated_at", ""),
+                        json.dumps(evidence_run, sort_keys=True),
+                        created_at,
+                    ),
+                )
+                run_id = int(cursor.lastrowid)
+                db.executemany(
+                    """
+                    insert into accountability_evidence_items (
+                      id, run_id, root_id, evidence_type, state, durable, live_telemetry,
+                      fingerprint, summary, source_json, attributes_json, payload_json
+                    ) values (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)
+                    """,
+                    [
+                        (
+                            item.get("id", ""),
+                            run_id,
+                            item.get("root_id", ""),
+                            item.get("evidence_type", ""),
+                            item.get("state", ""),
+                            1 if item.get("durable") else 0,
+                            1 if item.get("live_telemetry") else 0,
+                            item.get("fingerprint", ""),
+                            item.get("summary", ""),
+                            json.dumps(item.get("source", {}), sort_keys=True),
+                            json.dumps(item.get("attributes", {}), sort_keys=True),
+                            json.dumps(item, sort_keys=True),
+                        )
+                        for item in items
+                    ],
+                )
+                db.executemany(
+                    """
+                        insert into accountability_identity_candidates (
+                          stable_key, run_id, identity_type, label, fabric_id, subfabric_id,
+                          owner_actor_id, review_state, confidence, aliases_json,
+                          evidence_ids_json, attributes_json, payload_json
+                        ) values (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)
+                        """,
+                    [
+                        (
+                            candidate.get("stable_key", ""),
+                            run_id,
+                            candidate.get("identity_type", ""),
+                            candidate.get("label", ""),
+                            candidate.get("fabric_id", ""),
+                            candidate.get("subfabric_id", ""),
+                            candidate.get("owner_actor_id", ""),
+                            candidate.get("review_state", ""),
+                            float(candidate.get("confidence") or 0),
+                            json.dumps(candidate.get("aliases", []), sort_keys=True),
+                            json.dumps(candidate.get("evidence_ids", []), sort_keys=True),
+                            json.dumps(candidate.get("attributes", {}), sort_keys=True),
+                            json.dumps(candidate, sort_keys=True),
+                        )
+                        for candidate in candidates
+                    ],
+                )
+        finally:
+            db.close()
+        return {
+            "run_id": run_id,
+            "evidence_count": len(items),
+            "identity_candidate_count": len(candidates),
+        }
+
+    def latest_run(self) -> dict[str, Any] | None:
+        """Return the metadata columns of the highest-id run, or None when no run exists."""
+        db = self._connect()
+        try:
+            row = db.execute(
+                """
+                select id, manifest_id, manifest_path, manifest_fingerprint, generated_at, created_at
+                from accountability_evidence_runs
+                order by id desc
+                limit 1
+                """
+            ).fetchone()
+        finally:
+            db.close()
+        return dict(row) if row else None
+
+    def list_evidence(self, run_id: int) -> list[dict[str, Any]]:
+        """Return the stored evidence item payloads of a run, ordered by root, type, and id."""
+        db = self._connect()
+        try:
+            rows = db.execute(
+                """
+                select payload_json
+                from accountability_evidence_items
+                where run_id = ?
+                order by root_id, evidence_type, id
+                """,
+                (run_id,),
+            ).fetchall()
+        finally:
+            db.close()
+        return [json.loads(row["payload_json"]) for row in rows]
+
+    def list_identity_candidates(self, run_id: int) -> list[dict[str, Any]]:
+        """Return the stored identity candidate payloads of a run, ordered by stable key."""
+        db = self._connect()
+        try:
+            rows = db.execute(
+                """
+                select payload_json
+                from accountability_identity_candidates
+                where run_id = ?
+                order by stable_key
+                """,
+                (run_id,),
+            ).fetchall()
+        finally:
+            db.close()
+        return [json.loads(row["payload_json"]) for row in rows]
+
+    def _connect(self) -> sqlite3.Connection:
+        """Open a new connection whose rows support access by column name.
+
+        The caller owns the connection and is responsible for closing it.
+        """
+        db = sqlite3.connect(self.path)
+        db.row_factory = sqlite3.Row
+        return db
+
+
+def _identity_from_evidence(root: dict[str, Any], item: dict[str, Any]) -> dict[str, Any] | None:
+    """Map one raw evidence item to the keyword arguments of an identity candidate.
+
+    Args:
+        root: The root mapping the item was collected under; supplies
+            ``fabric_id``, ``subfabric_id``, ``owner_actor_id`` and ``id``.
+        item: The evidence item; ``evidence_type``, ``source``, ``attributes``
+            and ``id`` are read.
+
+    Returns:
+        A mapping suitable for ``_add_identity_candidate(candidates, **result)``,
+        or None when the evidence type does not describe an identity.
+    """
+    evidence_type = str(item.get("evidence_type") or "")
+    source = item.get("source") if isinstance(item.get("source"), dict) else {}
+    attributes = item.get("attributes") if isinstance(item.get("attributes"), dict) else {}
+    path = str(source.get("path") or "")
+    file_name = Path(path).name
+
+    def candidate(
+        identity_type: str,
+        label: str,
+        graph_id: str,
+        aliases: list[str],
+        confidence: float,
+    ) -> dict[str, Any]:
+        # Fields shared by every evidence-derived candidate.
+        return {
+            "identity_type": identity_type,
+            "label": label,
+            "graph_id": graph_id,
+            "fabric_id": str(root.get("fabric_id") or ""),
+            "subfabric_id": str(root.get("subfabric_id") or "") or None,
+            "owner_actor_id": str(root.get("owner_actor_id") or ""),
+            "evidence_ids": [str(item.get("id", ""))],
+            "aliases": aliases,
+            "attributes": {**attributes, "source_evidence_type": evidence_type},
+            "confidence": confidence,
+        }
+
+    if evidence_type in {"registered_repository", "repository_checkout"}:
+        # Fall back to the evidence type, like the other branches do, so an
+        # item without slug or path never yields an empty label (the
+        # projection schema requires a non-empty label).
+        label = str(source.get("repo_slug") or attributes.get("repo_slug") or file_name or evidence_type)
+        return candidate(
+            "Repository",
+            label,
+            label,
+            [label, path, str(source.get("remote_url") or "")],
+            0.9 if evidence_type == "repository_checkout" else 0.85,
+        )
+    if evidence_type in {"deployment_automation", "infrastructure_manifest"}:
+        return candidate("Deployable", file_name or evidence_type, path, [path, Path(path).stem], 0.75)
+    if evidence_type == "service_config":
+        return candidate("ServiceConfig", file_name or "service-config", path, [path], 0.7)
+    if evidence_type == "endpoint_contract":
+        return candidate("Endpoint", file_name or "endpoint-contract", path, [path], 0.75)
+    if evidence_type == "host_path_match":
+        return candidate("HostPath", path or "host-path", path, [path], 0.65)
+    if evidence_type in {"secret_root", "backup_recovery"}:
+        return candidate(
+            "SecretRoot" if evidence_type == "secret_root" else "BackupRecoveryRoot",
+            file_name or evidence_type,
+            path or evidence_type,
+            [path],
+            0.65,
+        )
+    if evidence_type in {"state_hub_repo_inventory", "gitea_organization", "gitea_repository", "registry_manifest"}:
+        return candidate(
+            "CatalogRoot",
+            str(source.get("url") or source.get("manifest_path") or root.get("id")),
+            str(root.get("id") or evidence_type),
+            [str(source.get("url") or ""), str(source.get("manifest_path") or "")],
+            0.6,
+        )
+    return None
+
+
+def _add_identity_candidate(
+    candidates: dict[str, dict[str, Any]],
+    *,
+    identity_type: str,
+    label: str,
+    graph_id: str | None = None,
+    fabric_id: str | None = None,
+    subfabric_id: str | None = None,
+    owner_actor_id: str | None = None,
+    evidence_ids: list[str],
+    aliases: list[str],
+    attributes: dict[str, Any],
+    confidence: float,
+) -> None:
+    """Insert an identity candidate into ``candidates`` or merge it into an existing one.
+
+    The stable key is ``identity:<type>:<key>`` where ``<key>`` is the graph id
+    when given and the label otherwise, both passed through
+    ``normalize_identity_part``. On a key collision the existing entry keeps
+    its label and review state; confidence becomes the maximum, aliases and
+    evidence ids are unioned, attributes are overlaid, and missing
+    ownership/graph fields are filled in from the newcomer.
+    """
+    type_part = normalize_identity_part(identity_type)
+    identity_key = graph_id or label
+    key_part = normalize_identity_part(identity_key)
+    stable_key = f"identity:{type_part}:{key_part}"
+
+    incoming: dict[str, Any] = {
+        "stable_key": stable_key,
+        "identity_type": identity_type,
+        "label": label or identity_key,
+        "review_state": "candidate",
+        "confidence": confidence,
+        "aliases": _unique_strings([identity_key, *aliases]),
+        "evidence_ids": _unique_strings(evidence_ids),
+        # Empty attribute values carry no information and are dropped.
+        "attributes": {key: value for key, value in attributes.items() if value not in ("", None, [], {})},
+    }
+    optional_fields = {
+        "graph_id": graph_id,
+        "fabric_id": fabric_id,
+        "subfabric_id": subfabric_id,
+        "owner_actor_id": owner_actor_id,
+    }
+    incoming.update({name: value for name, value in optional_fields.items() if value})
+
+    current = candidates.setdefault(stable_key, incoming)
+    if current is incoming:
+        # First sighting of this key: nothing to merge.
+        return
+
+    current["confidence"] = max(float(current.get("confidence", 0)), confidence)
+    for list_name in ("aliases", "evidence_ids"):
+        current[list_name] = _unique_strings([*current.get(list_name, []), *incoming[list_name]])
+    current["attributes"] = {**current.get("attributes", {}), **incoming["attributes"]}
+    for name in ("fabric_id", "subfabric_id", "owner_actor_id", "graph_id"):
+        if not current.get(name) and incoming.get(name):
+            current[name] = incoming[name]
+
+
+def _mark_ambiguous_identities(candidates: list[dict[str, Any]]) -> list[dict[str, Any]]:
+    """Flag candidates that share a normalized alias with another candidate of the same type.
+
+    Flagged candidates get ``review_state`` set to ``"needs_review"`` and the
+    sorted shared aliases recorded under ``attributes["ambiguous_aliases"]``.
+    The input dictionaries are mutated in place and the same list is returned.
+    """
+    owners: dict[tuple[str, str], set[str]] = {}
+    for candidate in candidates:
+        identity_type = str(candidate.get("identity_type"))
+        for alias in candidate.get("aliases", []):
+            alias_key = (identity_type, normalize_identity_part(alias))
+            owners.setdefault(alias_key, set()).add(candidate["stable_key"])
+
+    shared: dict[str, list[str]] = {}
+    for (_identity_type, alias), stable_keys in owners.items():
+        if len(stable_keys) < 2:
+            continue
+        for stable_key in sorted(stable_keys):
+            shared.setdefault(stable_key, []).append(alias)
+
+    for candidate in candidates:
+        aliases = shared.get(candidate["stable_key"])
+        if not aliases:
+            continue
+        candidate["review_state"] = "needs_review"
+        candidate.setdefault("attributes", {})["ambiguous_aliases"] = sorted(aliases)
+    return candidates
+
+
+def _candidate_graph(candidates: list[dict[str, Any]], manifest: dict[str, Any]) -> dict[str, Any]:
+    """Build the reviewable candidate graph: one node per candidate plus containment edges.
+
+    Args:
+        candidates: Identity candidates; each must carry ``stable_key``,
+            ``identity_type``, ``label`` and ``review_state``.
+        manifest: Manifest mapping whose ``fabrics`` and ``netkingdom``
+            entries define the containment hierarchy.
+
+    Returns:
+        ``{"nodes": [...], "edges": [...]}``. Nodes are ordered by stable key.
+        Each fabric with a resolvable parent gets one ``contains`` edge from
+        its parent fabric, or from the netkingdom when it has no parent fabric.
+    """
+    nodes = [
+        {
+            "id": candidate["stable_key"],
+            "kind": candidate["identity_type"],
+            "label": candidate["label"],
+            "review_state": candidate["review_state"],
+            "fabric_id": candidate.get("fabric_id", ""),
+            "subfabric_id": candidate.get("subfabric_id", ""),
+            "owner_actor_id": candidate.get("owner_actor_id", ""),
+        }
+        for candidate in sorted(candidates, key=lambda item: item["stable_key"])
+    ]
+
+    fabrics = [fabric for fabric in manifest.get("fabrics", []) if isinstance(fabric, dict)]
+    # Fabric candidates are keyed by their declared kind, so the key of a
+    # parent must be derived from the parent's own kind rather than assumed to
+    # be "Fabric"; otherwise the edge points at a node that does not exist.
+    kind_by_fabric_id = {str(fabric.get("id")): str(fabric.get("kind") or "Fabric") for fabric in fabrics}
+    netkingdom = manifest.get("netkingdom") if isinstance(manifest.get("netkingdom"), dict) else {}
+
+    edges: list[dict[str, Any]] = []
+    for fabric in fabrics:
+        parent_fabric_id = fabric.get("parent_fabric_id")
+        if parent_fabric_id:
+            parent = parent_fabric_id
+            parent_type = kind_by_fabric_id.get(str(parent_fabric_id), "Fabric")
+        else:
+            parent = netkingdom.get("id")
+            parent_type = "Netkingdom"
+        if not parent:
+            # Neither a parent fabric nor a netkingdom id: no edge to draw.
+            continue
+        fabric_kind = str(fabric.get("kind") or "Fabric")
+        fabric_key = f"identity:{normalize_identity_part(fabric_kind)}:{normalize_identity_part(str(fabric.get('id')))}"
+        parent_key = f"identity:{normalize_identity_part(parent_type)}:{normalize_identity_part(str(parent))}"
+        edges.append(
+            {
+                "id": f"candidate-edge:{short_fingerprint([parent_key, 'contains', fabric_key], length=16)}",
+                "from": parent_key,
+                "to": fabric_key,
+                "type": "contains",
+                "review_state": "candidate",
+            }
+        )
+    return {"nodes": nodes, "edges": edges}
+
+
+def _iter_evidence_items(evidence_run: dict[str, Any]) -> list[dict[str, Any]]:
+    """Flatten the evidence of every root of a run into one list.
+
+    Roots and items that are not mappings are skipped; order follows the run.
+    """
+    flattened: list[dict[str, Any]] = []
+    for root in evidence_run.get("roots", []):
+        if not isinstance(root, dict):
+            continue
+        for item in root.get("evidence", []):
+            if isinstance(item, dict):
+                flattened.append(item)
+    return flattened
+
+
 def _collect_root_evidence(root: dict[str, Any], *, include_remote: bool, max_items: int) -> list[dict[str, Any]]:
    root_type = str(root.get("type") or "")
    if root.get("status") == "disabled":
@@ -381,5 +889,17 @@ def _git_value(repo_path: Path, *args: str) -> str | None:
    return value or None


+def _unique_strings(values: list[object]) -> list[str]:
+    """Return the stripped, non-empty string forms of ``values`` without duplicates.
+
+    Falsy values count as empty and are dropped; first-occurrence order is kept.
+    """
+    stripped = (str(value or "").strip() for value in values)
+    # A dict keeps insertion order, which makes it an ordered de-duplicator.
+    return list(dict.fromkeys(text for text in stripped if text))
+
+
 def _utc_now() -> str:
    return datetime.now(timezone.utc).replace(microsecond=0).isoformat().replace("+00:00", "Z")
--- a/railiance_fabric/cli.py
+++ b/railiance_fabric/cli.py
@@ -14,7 +14,13 @@ from pathlib import Path
 from typing import Any
 from urllib.parse import quote

-from .accountability_roots import DEFAULT_ROOT_MANIFEST_PATH, collect_accountability_root_evidence
+from .accountability_roots import (
+    DEFAULT_ROOT_MANIFEST_PATH,
+    AccountabilityEvidenceStore,
+    build_identity_projection,
+    collect_accountability_root_evidence,
+    load_accountability_root_manifest,
+)
 from .connectors import ConnectorConfig
 from .financial_baseline import financial_export_from_legacy
 from .loader import declaration_files, load_yaml
@@ -116,6 +122,8 @@ def build_parser() -> argparse.ArgumentParser:
    discover_roots.add_argument("--manifest", type=Path, default=DEFAULT_ROOT_MANIFEST_PATH)
    discover_roots.add_argument("--include-remote", action="store_true", help="Allow HTTP reads from configured remote roots.")
    discover_roots.add_argument("--max-items-per-root", type=int, default=200)
+    discover_roots.add_argument("--identity-projection", action="store_true", help="Print normalized identity candidates instead of raw evidence.")
+    discover_roots.add_argument("--store-db", type=Path, default=None, help="Persist evidence and identity candidates in a SQLite store.")

    registry = sub.add_parser("registry", help="Feed a running Railiance Fabric registry service.")
    registry_sub = registry.add_subparsers(dest="registry_command", required=True)
@@ -330,12 +338,17 @@ def main(argv: list[str] | None = None) -> int:
        return _scan_repo(args)

    if args.command == "discover-roots":
+        manifest = load_accountability_root_manifest(args.manifest)
        payload = collect_accountability_root_evidence(
            args.manifest,
            include_remote=args.include_remote,
            max_items_per_root=args.max_items_per_root,
        )
-        print(json.dumps(payload, indent=2, sort_keys=True))
+        projection = build_identity_projection(payload, manifest)
+        if args.store_db:
+            store = AccountabilityEvidenceStore(args.store_db)
+            store.add_evidence_run(payload, projection)
+        print(json.dumps(projection if args.identity_projection else payload, indent=2, sort_keys=True))
        return 0

    if args.command == "registry":
--- a/schemas/accountability-identity-projection.schema.yaml
+++ b/schemas/accountability-identity-projection.schema.yaml
@@ -0,0 +1,110 @@
+$schema: "https://json-schema.org/draft/2020-12/schema"
+$id: "https://railiance.local/fabric/schemas/accountability-identity-projection.schema.yaml"
+title: "AccountabilityIdentityProjection"
+type: object
+additionalProperties: false
+required:
+  - apiVersion
+  - kind
+  - generated_at
+  - evidence_run
+  - identity_candidates
+  - candidate_graph
+properties:
+  apiVersion:
+    type: string
+    const: "railiance.fabric/v1alpha2"
+  kind:
+    type: string
+    const: AccountabilityIdentityProjection
+  generated_at:
+    type: string
+    format: date-time
+  evidence_run:
+    type: object
+    additionalProperties: false
+    required:
+      - manifest_id
+      - manifest_fingerprint
+      - generated_at
+    properties:
+      manifest_id:
+        type: string
+      manifest_fingerprint:
+        type: string
+      generated_at:
+        type: string
+  identity_candidates:
+    type: array
+    items:
+      $ref: "#/$defs/identityCandidate"
+  candidate_graph:
+    type: object
+    additionalProperties: false
+    required:
+      - nodes
+      - edges
+    properties:
+      nodes:
+        type: array
+        items:
+          type: object
+          additionalProperties: true
+      edges:
+        type: array
+        items:
+          type: object
+          additionalProperties: true
+
+$defs:
+  identityCandidate:
+    type: object
+    additionalProperties: false
+    required:
+      - stable_key
+      - identity_type
+      - label
+      - review_state
+      - confidence
+      - aliases
+      - evidence_ids
+      - attributes
+    properties:
+      stable_key:
+        type: string
+        minLength: 3
+      identity_type:
+        type: string
+        minLength: 1
+      label:
+        type: string
+        minLength: 1
+      graph_id:
+        type: string
+      fabric_id:
+        type: string
+      subfabric_id:
+        type: string
+      owner_actor_id:
+        type: string
+      review_state:
+        type: string
+        enum:
+          - candidate
+          - accepted
+          - needs_review
+      confidence:
+        type: number
+        minimum: 0
+        maximum: 1
+      aliases:
+        type: array
+        items:
+          type: string
+      evidence_ids:
+        type: array
+        items:
+          type: string
+      attributes:
+        type: object
+        additionalProperties: true
--- a/tests/test_accountability_root_adapters.py
+++ b/tests/test_accountability_root_adapters.py
@@ -1,7 +1,12 @@
 import json
 from pathlib import Path

-from railiance_fabric.accountability_roots import collect_accountability_root_evidence
+from railiance_fabric.accountability_roots import (
+    AccountabilityEvidenceStore,
+    build_identity_projection,
+    collect_accountability_root_evidence,
+    load_accountability_root_manifest,
+)
 from railiance_fabric.cli import main as cli_main
 from railiance_fabric.schema_validation import draft202012_validator

@@ -32,6 +37,46 @@ def test_collect_accountability_root_evidence_from_manifest(tmp_path: Path) -> N
    assert "secret-value" not in json.dumps(secret_root)


+def test_identity_projection_is_stable_and_reviewable(tmp_path: Path) -> None:
+    manifest_path = _fixture_manifest(tmp_path)
+    manifest = load_accountability_root_manifest(manifest_path)
+
+    first = build_identity_projection(collect_accountability_root_evidence(manifest_path), manifest)
+    second = build_identity_projection(collect_accountability_root_evidence(manifest_path), manifest)
+
+    validator = draft202012_validator(Path("schemas/accountability-identity-projection.schema.yaml"))
+    assert list(validator.iter_errors(first)) == []
+
+    first_keys = {candidate["stable_key"] for candidate in first["identity_candidates"]}
+    second_keys = {candidate["stable_key"] for candidate in second["identity_candidates"]}
+    assert first_keys == second_keys
+    assert {
+        "Actor",
+        "Fabric",
+        "Repository",
+        "Deployable",
+        "SecretRoot",
+    } <= {candidate["identity_type"] for candidate in first["identity_candidates"]}
+    assert first["candidate_graph"]["nodes"]
+    assert first["candidate_graph"]["edges"]
+
+
+def test_evidence_store_persists_runs_items_and_identities(tmp_path: Path) -> None:
+    manifest_path = _fixture_manifest(tmp_path)
+    manifest = load_accountability_root_manifest(manifest_path)
+    evidence_run = collect_accountability_root_evidence(manifest_path)
+    projection = build_identity_projection(evidence_run, manifest)
+    store = AccountabilityEvidenceStore(tmp_path / "evidence.sqlite3")
+
+    stored = store.add_evidence_run(evidence_run, projection)
+    latest = store.latest_run()
+
+    assert latest is not None
+    assert latest["id"] == stored["run_id"]
+    assert stored["evidence_count"] == len(store.list_evidence(stored["run_id"]))
+    assert stored["identity_candidate_count"] == len(store.list_identity_candidates(stored["run_id"]))
+
+
 def test_discover_roots_cli_prints_evidence_json(tmp_path: Path, capsys) -> None:
    manifest = _fixture_manifest(tmp_path)

@@ -42,6 +87,29 @@ def test_discover_roots_cli_prints_evidence_json(tmp_path: Path, capsys) -> None
    assert payload["roots"]


+def test_discover_roots_cli_can_print_identities_and_store(tmp_path: Path, capsys) -> None:
+    manifest = _fixture_manifest(tmp_path)
+    store_path = tmp_path / "evidence.sqlite3"
+
+    assert (
+        cli_main(
+            [
+                "discover-roots",
+                "--manifest",
+                str(manifest),
+                "--identity-projection",
+                "--store-db",
+                str(store_path),
+            ]
+        )
+        == 0
+    )
+
+    payload = json.loads(capsys.readouterr().out)
+    assert payload["kind"] == "AccountabilityIdentityProjection"
+    assert AccountabilityEvidenceStore(store_path).latest_run() is not None
+
+
 def _fixture_manifest(tmp_path: Path) -> Path:
    workspace = tmp_path / "workspace"
    repo = workspace / "fixture-repo"
--- a/workplans/RAIL-FAB-WP-0018-accountability-root-discovery-update-loop.md
+++ b/workplans/RAIL-FAB-WP-0018-accountability-root-discovery-update-loop.md
@@ -135,7 +135,7 @@ Result:

 ```task
 id: RAIL-FAB-WP-0018-T03
-status: todo
+status: done
 priority: high
 state_hub_task_id: "2a79938f-13e2-41b4-b692-74420d31bec4"
 ```
@@ -157,6 +157,28 @@ Done when:
 - identity normalization produces reviewable candidates;
 - repeated scans produce deterministic identities for unchanged sources.

+Result:
+
+- Added `schemas/accountability-identity-projection.schema.yaml` for
+  normalized `AccountabilityIdentityProjection` payloads.
+- Extended `railiance_fabric/accountability_roots.py` with deterministic
+  identity normalization for netkingdoms, actors, fabrics, subfabrics,
+  repositories, deployables, endpoint/service/config roots, host paths,
+  catalog roots, secret roots, and backup/recovery roots.
+- Added duplicate/ambiguous alias marking on identity candidates and a
+  candidate graph section that remains separate from accepted registry graph
+  snapshots.
+- Added `AccountabilityEvidenceStore`, a SQLite store for raw evidence runs,
+  evidence items, and identity candidates.
+- Extended `railiance-fabric discover-roots` with `--identity-projection` and
+  `--store-db`.
+- Added focused tests for deterministic identity keys, schema validation,
+  persistence, CLI output, and store inspection.
+- Verified with
+  `python3 -m pytest tests/test_accountability_roots.py tests/test_accountability_root_adapters.py -q`,
+  `python3 -m railiance_fabric.cli discover-roots --max-items-per-root 5 --identity-projection --store-db /tmp/railiance-root-evidence.sqlite3`,
+  and a full `python3 -m pytest` run.
+
 ## T04 - Add Ownership Resolution And Review Flow

 ```task