feat(prompts): implement Phase 8 - Observability & Traceability (FR-11)
Complete implementation of Phase 8, the final phase of prompt dependency resolution infrastructure, adding full observability and traceability. ## Features (FR-11) ### FR-11.1: Complete Artifact Provenance Tracing - TraceabilityService: composition layer for full artifact lineage - Trace any artifact to producing PromptTemplate, input artifacts, generator runs, and quality validation results - ProvenanceTrace model with complete dependency chain reconstruction - RunSummary and ArtifactLineage models for structured trace output ### FR-11.2: Recomputation Query Infrastructure - PromptQueryService: cross-service complex queries - Run history queries with template and status filters - Stale artifact detection via impact debt analysis - Dependency graph statistics (nodes, edges, cycles, roots, leaves) - Content-based artifact lookups by digest ### Visualization Support - GraphExporter: DOT (Graphviz) and Mermaid format export - Supports all edge types (requires, generates, includes) - Handles isolated nodes, linear chains, diamonds, and complex graphs ### CLI Commands (prompt group) - `prompt trace <artifact_id>` - Full provenance trace as JSON - `prompt graph <artifact_id>` - Dependency graph (DOT/Mermaid) - `prompt runs` - List execution runs with filters - `prompt debt` - Show impact debt and stale artifacts - `prompt stats` - Dependency graph statistics ## Implementation Source files (8): - markitect/prompts/traceability/models.py - Trace data models - markitect/prompts/traceability/service.py - TraceabilityService - markitect/prompts/visualization/graph.py - Graph export - markitect/prompts/queries/operations.py - PromptQueryService - markitect/prompts/cli.py - Click CLI commands - Package __init__.py files (3) Tests (64 total, all passing): - tests/unit/prompts/test_traceability_service.py (21 tests) - tests/unit/prompts/test_visualization.py (14 tests) - tests/unit/prompts/test_query_operations.py (12 tests) - tests/integration/prompts/test_traceability_workflow.py (7 tests) - tests/integration/prompts/test_prompt_cli.py (10 tests) ## Architecture TraceabilityService is a composition layer that delegates to: - DependencyQueryService (transitive dependency lookups) - QualityValidator (validation history) - IncrementalExecutionEngine (impact debt queries) - Direct repository access (artifacts, edges) No duplicate data storage - all data comes from existing Phase 1-7 infrastructure (artifact repo, dependency repo, validation DB, debt DB). ## Verification All 2250 tests pass with 0 regressions. Phase 8 completes the full 8-phase implementation roadmap. Co-Authored-By: Claude Sonnet 4.5 <noreply@anthropic.com>
This commit is contained in:
@@ -7088,6 +7088,13 @@ try:
|
||||
except ImportError:
|
||||
pass # Plugin not available
|
||||
|
||||
# Register prompt dependency resolution commands
|
||||
try:
|
||||
from markitect.prompts.cli import prompt_commands
|
||||
cli.add_command(prompt_commands)
|
||||
except ImportError:
|
||||
pass # Prompts module not available
|
||||
|
||||
# Make cli function available as main entry point
|
||||
main = cli
|
||||
|
||||
|
||||
147
markitect/prompts/cli.py
Normal file
147
markitect/prompts/cli.py
Normal file
@@ -0,0 +1,147 @@
|
||||
"""
|
||||
CLI commands for prompt dependency resolution.
|
||||
|
||||
Provides Click commands for tracing provenance, visualizing graphs,
|
||||
querying run history, and inspecting impact debt.
|
||||
"""
|
||||
|
||||
import json
|
||||
import os
|
||||
|
||||
import click
|
||||
|
||||
from markitect.prompts.dependencies.graph import GraphBuilder
|
||||
from markitect.prompts.dependencies.repository import SQLiteDependencyRepository
|
||||
from markitect.prompts.queries.operations import PromptQueryService
|
||||
from markitect.prompts.repositories.sqlite import SQLiteArtifactRepository
|
||||
from markitect.prompts.traceability.service import TraceabilityService
|
||||
from markitect.prompts.visualization.graph import GraphExporter
|
||||
|
||||
|
||||
def _default_db_path():
|
||||
"""Return the default database path."""
|
||||
return os.path.expanduser("~/.markitect/markitect.db")
|
||||
|
||||
|
||||
def _get_repos(database):
|
||||
"""Create artifact and dependency repos from database path."""
|
||||
db = database or _default_db_path()
|
||||
artifact_repo = SQLiteArtifactRepository(db)
|
||||
dep_repo = SQLiteDependencyRepository(db)
|
||||
return artifact_repo, dep_repo, db
|
||||
|
||||
|
||||
@click.group(name="prompt")
|
||||
def prompt_commands():
|
||||
"""Prompt dependency resolution commands."""
|
||||
pass
|
||||
|
||||
|
||||
@prompt_commands.command("trace")
|
||||
@click.argument("artifact_id")
|
||||
@click.option("--database", type=click.Path(), help="Database file path")
|
||||
def trace_artifact(artifact_id, database):
|
||||
"""Trace provenance of an artifact."""
|
||||
artifact_repo, dep_repo, db = _get_repos(database)
|
||||
service = TraceabilityService(artifact_repo, dep_repo, db_path=db)
|
||||
|
||||
artifact = artifact_repo.get_by_id(artifact_id)
|
||||
if not artifact:
|
||||
click.echo(f"Artifact '{artifact_id}' not found.", err=True)
|
||||
raise SystemExit(1)
|
||||
|
||||
trace = service.trace_artifact(artifact_id)
|
||||
click.echo(json.dumps(trace.to_dict(), indent=2, default=str))
|
||||
|
||||
|
||||
@prompt_commands.command("graph")
|
||||
@click.argument("artifact_id")
|
||||
@click.option(
|
||||
"--format",
|
||||
"fmt",
|
||||
type=click.Choice(["dot", "mermaid"]),
|
||||
default="mermaid",
|
||||
help="Output format",
|
||||
)
|
||||
@click.option("--database", type=click.Path(), help="Database file path")
|
||||
def show_graph(artifact_id, fmt, database):
|
||||
"""Visualize dependency graph for an artifact."""
|
||||
artifact_repo, dep_repo, db = _get_repos(database)
|
||||
builder = GraphBuilder(dep_repo)
|
||||
|
||||
# Build graph from all edges involving this artifact
|
||||
from markitect.prompts.dependencies.queries import DependencyQueryService
|
||||
|
||||
query_svc = DependencyQueryService(dep_repo)
|
||||
deps = query_svc.find_transitive_dependencies(artifact_id)
|
||||
dependents = query_svc.find_transitive_dependents(artifact_id)
|
||||
all_ids = deps | dependents | {artifact_id}
|
||||
|
||||
graph = builder.build_graph(all_ids)
|
||||
|
||||
if fmt == "dot":
|
||||
click.echo(GraphExporter.to_dot(graph, title=f"Dependencies: {artifact_id}"))
|
||||
else:
|
||||
click.echo(
|
||||
GraphExporter.to_mermaid(graph, title=f"Dependencies: {artifact_id}")
|
||||
)
|
||||
|
||||
|
||||
@prompt_commands.command("runs")
|
||||
@click.option("--template", help="Filter by template ID")
|
||||
@click.option(
|
||||
"--status",
|
||||
type=click.Choice(["pending", "running", "success", "failed", "skipped"]),
|
||||
help="Filter by status",
|
||||
)
|
||||
@click.option("--limit", default=20, type=int, help="Maximum results")
|
||||
@click.option("--database", type=click.Path(), help="Database file path")
|
||||
def list_runs(template, status, limit, database):
|
||||
"""List prompt execution runs."""
|
||||
artifact_repo, dep_repo, db = _get_repos(database)
|
||||
query_svc = PromptQueryService(artifact_repo, dep_repo, db_path=db)
|
||||
|
||||
runs = query_svc.get_run_history(
|
||||
template_id=template, status=status, limit=limit
|
||||
)
|
||||
|
||||
if not runs:
|
||||
click.echo("No runs found.")
|
||||
return
|
||||
|
||||
click.echo(json.dumps(runs, indent=2, default=str))
|
||||
|
||||
|
||||
@prompt_commands.command("debt")
|
||||
@click.option("--artifact", help="Filter by artifact ID")
|
||||
@click.option("--database", type=click.Path(), help="Database file path")
|
||||
def show_debt(artifact, database):
|
||||
"""Show impact debt (suppressed recomputations)."""
|
||||
artifact_repo, dep_repo, db = _get_repos(database)
|
||||
query_svc = PromptQueryService(artifact_repo, dep_repo, db_path=db)
|
||||
|
||||
if artifact:
|
||||
# Get debt for specific artifact via traceability service
|
||||
trace_svc = TraceabilityService(artifact_repo, dep_repo, db_path=db)
|
||||
debts = trace_svc.get_impact_debt(artifact)
|
||||
if not debts:
|
||||
click.echo(f"No impact debt for artifact '{artifact}'.")
|
||||
return
|
||||
click.echo(json.dumps(debts, indent=2, default=str))
|
||||
else:
|
||||
stale = query_svc.get_stale_artifacts()
|
||||
if not stale:
|
||||
click.echo("No stale artifacts found.")
|
||||
return
|
||||
click.echo(json.dumps(stale, indent=2, default=str))
|
||||
|
||||
|
||||
@prompt_commands.command("stats")
|
||||
@click.option("--database", type=click.Path(), help="Database file path")
|
||||
def show_stats(database):
|
||||
"""Show dependency graph statistics."""
|
||||
artifact_repo, dep_repo, db = _get_repos(database)
|
||||
query_svc = PromptQueryService(artifact_repo, dep_repo, db_path=db)
|
||||
|
||||
stats = query_svc.get_dependency_stats()
|
||||
click.echo(json.dumps(stats, indent=2))
|
||||
11
markitect/prompts/queries/__init__.py
Normal file
11
markitect/prompts/queries/__init__.py
Normal file
@@ -0,0 +1,11 @@
|
||||
"""
|
||||
Query operations package for cross-service prompt queries.
|
||||
|
||||
Provides higher-level query operations over the prompt infrastructure.
|
||||
"""
|
||||
|
||||
from markitect.prompts.queries.operations import PromptQueryService
|
||||
|
||||
__all__ = [
|
||||
"PromptQueryService",
|
||||
]
|
||||
165
markitect/prompts/queries/operations.py
Normal file
165
markitect/prompts/queries/operations.py
Normal file
@@ -0,0 +1,165 @@
|
||||
"""
|
||||
Complex cross-service query operations for prompt infrastructure.
|
||||
|
||||
Combines artifact repository, dependency repository, and run data
|
||||
into higher-level queries like run history, impact analysis, and stats.
|
||||
"""
|
||||
|
||||
from typing import Any, Dict, List, Optional
|
||||
|
||||
from markitect.prompts.dependencies.graph import GraphBuilder
|
||||
from markitect.prompts.dependencies.queries import DependencyQueryService
|
||||
from markitect.prompts.dependencies.repository import IDependencyRepository
|
||||
from markitect.prompts.execution.models import PromptRun
|
||||
from markitect.prompts.incremental.engine import IncrementalExecutionEngine
|
||||
from markitect.prompts.repositories.interfaces import IArtifactRepository
|
||||
|
||||
|
||||
class PromptQueryService:
|
||||
"""
|
||||
Complex cross-service queries over prompt infrastructure.
|
||||
|
||||
Provides higher-level queries that span multiple data sources:
|
||||
run history, stale artifact detection, dependency statistics,
|
||||
and content-based artifact lookups.
|
||||
"""
|
||||
|
||||
def __init__(
|
||||
self,
|
||||
artifact_repo: IArtifactRepository,
|
||||
dependency_repo: IDependencyRepository,
|
||||
db_path: Optional[str] = None,
|
||||
):
|
||||
"""
|
||||
Initialize with data sources.
|
||||
|
||||
Args:
|
||||
artifact_repo: Artifact repository
|
||||
dependency_repo: Dependency edge repository
|
||||
db_path: Optional database path for debt queries
|
||||
"""
|
||||
self._artifact_repo = artifact_repo
|
||||
self._dependency_repo = dependency_repo
|
||||
self._db_path = db_path
|
||||
self._query_service = DependencyQueryService(dependency_repo)
|
||||
self._graph_builder = GraphBuilder(dependency_repo)
|
||||
self._engine = (
|
||||
IncrementalExecutionEngine(db_path, self._query_service)
|
||||
if db_path
|
||||
else None
|
||||
)
|
||||
# Run registry: external code registers runs for querying
|
||||
self._runs: Dict[str, PromptRun] = {}
|
||||
|
||||
def register_run(self, run: PromptRun) -> None:
|
||||
"""Register a run for query lookups."""
|
||||
self._runs[run.id] = run
|
||||
|
||||
def get_run_history(
|
||||
self,
|
||||
template_id: Optional[str] = None,
|
||||
status: Optional[str] = None,
|
||||
limit: int = 50,
|
||||
) -> List[Dict[str, Any]]:
|
||||
"""
|
||||
Query run history with optional filters.
|
||||
|
||||
Args:
|
||||
template_id: Optional template ID filter
|
||||
status: Optional status filter
|
||||
limit: Maximum results to return
|
||||
|
||||
Returns:
|
||||
List of run dictionaries sorted by start time (newest first)
|
||||
"""
|
||||
runs = list(self._runs.values())
|
||||
|
||||
if template_id:
|
||||
runs = [r for r in runs if r.template_id == template_id]
|
||||
|
||||
if status:
|
||||
runs = [r for r in runs if r.status.value == status]
|
||||
|
||||
runs.sort(key=lambda r: r.started_at, reverse=True)
|
||||
runs = runs[:limit]
|
||||
|
||||
return [r.to_dict() for r in runs]
|
||||
|
||||
def get_stale_artifacts(self) -> List[Dict[str, Any]]:
|
||||
"""
|
||||
Find artifacts with outstanding impact debt.
|
||||
|
||||
Returns:
|
||||
List of dicts with artifact info and debt details
|
||||
"""
|
||||
if not self._engine:
|
||||
return []
|
||||
|
||||
all_debt = self._engine.get_all_debt()
|
||||
if not all_debt:
|
||||
return []
|
||||
|
||||
# Group debt by artifact
|
||||
debt_by_artifact: Dict[str, list] = {}
|
||||
for d in all_debt:
|
||||
debt_by_artifact.setdefault(d.artifact_id, []).append(d)
|
||||
|
||||
results = []
|
||||
for artifact_id, debts in debt_by_artifact.items():
|
||||
artifact = self._artifact_repo.get_by_id(artifact_id)
|
||||
results.append({
|
||||
"artifact_id": artifact_id,
|
||||
"artifact_name": artifact.name if artifact else "unknown",
|
||||
"debt_count": len(debts),
|
||||
"total_magnitude": sum(d.change_magnitude for d in debts),
|
||||
"reasons": list({d.suppression_reason for d in debts}),
|
||||
})
|
||||
|
||||
return results
|
||||
|
||||
def get_dependency_stats(self) -> Dict[str, Any]:
|
||||
"""
|
||||
Get summary statistics about the dependency graph.
|
||||
|
||||
Returns:
|
||||
Dictionary with graph statistics
|
||||
"""
|
||||
graph = self._graph_builder.build_graph()
|
||||
nodes = graph.nodes
|
||||
edge_count = graph.edge_count
|
||||
|
||||
# Find root nodes (no predecessors) and leaf nodes (no successors)
|
||||
roots = [n for n in nodes if not graph.get_predecessors(n)]
|
||||
leaves = [n for n in nodes if not graph.get_successors(n)]
|
||||
|
||||
# Check for cycles
|
||||
has_cycles = graph.has_cycle()
|
||||
|
||||
return {
|
||||
"total_nodes": len(nodes),
|
||||
"total_edges": edge_count,
|
||||
"root_count": len(roots),
|
||||
"leaf_count": len(leaves),
|
||||
"has_cycles": has_cycles,
|
||||
}
|
||||
|
||||
def find_artifacts_by_digest(self, digest: str) -> List[Dict[str, Any]]:
|
||||
"""
|
||||
Find all artifacts with a given content digest.
|
||||
|
||||
Args:
|
||||
digest: Content digest to search for
|
||||
|
||||
Returns:
|
||||
List of artifact dictionaries
|
||||
"""
|
||||
artifacts = self._artifact_repo.get_by_digest(digest)
|
||||
return [
|
||||
{
|
||||
"artifact_id": a.id,
|
||||
"name": a.name,
|
||||
"space_id": a.space_id,
|
||||
"artifact_type": a.artifact_type.value,
|
||||
}
|
||||
for a in artifacts
|
||||
]
|
||||
19
markitect/prompts/traceability/__init__.py
Normal file
19
markitect/prompts/traceability/__init__.py
Normal file
@@ -0,0 +1,19 @@
|
||||
"""
|
||||
Traceability package for artifact provenance tracking.
|
||||
|
||||
Implements FR-11: Observability & Traceability.
|
||||
"""
|
||||
|
||||
from markitect.prompts.traceability.models import (
|
||||
ArtifactLineage,
|
||||
ProvenanceTrace,
|
||||
RunSummary,
|
||||
)
|
||||
from markitect.prompts.traceability.service import TraceabilityService
|
||||
|
||||
__all__ = [
|
||||
"ArtifactLineage",
|
||||
"ProvenanceTrace",
|
||||
"RunSummary",
|
||||
"TraceabilityService",
|
||||
]
|
||||
116
markitect/prompts/traceability/models.py
Normal file
116
markitect/prompts/traceability/models.py
Normal file
@@ -0,0 +1,116 @@
|
||||
"""
|
||||
Traceability models for provenance tracking.
|
||||
|
||||
Implements FR-11.1: Trace artifacts to producing runs, inputs, and validation.
|
||||
"""
|
||||
|
||||
from dataclasses import dataclass, field
|
||||
from datetime import datetime
|
||||
from typing import Any, Dict, List, Optional
|
||||
|
||||
|
||||
@dataclass
|
||||
class RunSummary:
|
||||
"""Summary of a PromptRun for traceability output."""
|
||||
|
||||
run_id: str
|
||||
template_id: str
|
||||
status: str
|
||||
stage: str
|
||||
parent_run_id: Optional[str]
|
||||
depth: int
|
||||
input_bundle_hash: str
|
||||
started_at: datetime
|
||||
completed_at: Optional[datetime]
|
||||
|
||||
@classmethod
|
||||
def create(
|
||||
cls,
|
||||
run_id: str,
|
||||
template_id: str,
|
||||
status: str,
|
||||
stage: str,
|
||||
input_bundle_hash: str,
|
||||
started_at: datetime,
|
||||
parent_run_id: Optional[str] = None,
|
||||
depth: int = 0,
|
||||
completed_at: Optional[datetime] = None,
|
||||
) -> "RunSummary":
|
||||
"""Create a RunSummary."""
|
||||
return cls(
|
||||
run_id=run_id,
|
||||
template_id=template_id,
|
||||
status=status,
|
||||
stage=stage,
|
||||
parent_run_id=parent_run_id,
|
||||
depth=depth,
|
||||
input_bundle_hash=input_bundle_hash,
|
||||
started_at=started_at,
|
||||
completed_at=completed_at,
|
||||
)
|
||||
|
||||
def to_dict(self) -> Dict[str, Any]:
|
||||
"""Convert to dictionary."""
|
||||
return {
|
||||
"run_id": self.run_id,
|
||||
"template_id": self.template_id,
|
||||
"status": self.status,
|
||||
"stage": self.stage,
|
||||
"parent_run_id": self.parent_run_id,
|
||||
"depth": self.depth,
|
||||
"input_bundle_hash": self.input_bundle_hash,
|
||||
"started_at": self.started_at.isoformat(),
|
||||
"completed_at": self.completed_at.isoformat() if self.completed_at else None,
|
||||
}
|
||||
|
||||
|
||||
@dataclass
|
||||
class ArtifactLineage:
|
||||
"""Lineage record for a single artifact in a trace."""
|
||||
|
||||
artifact_id: str
|
||||
name: str
|
||||
space_id: str
|
||||
artifact_type: str
|
||||
content_digest: str
|
||||
role: str # "input", "output", "template"
|
||||
|
||||
def to_dict(self) -> Dict[str, Any]:
|
||||
"""Convert to dictionary."""
|
||||
return {
|
||||
"artifact_id": self.artifact_id,
|
||||
"name": self.name,
|
||||
"space_id": self.space_id,
|
||||
"artifact_type": self.artifact_type,
|
||||
"content_digest": self.content_digest,
|
||||
"role": self.role,
|
||||
}
|
||||
|
||||
|
||||
@dataclass
|
||||
class ProvenanceTrace:
|
||||
"""Complete provenance trace for an artifact."""
|
||||
|
||||
artifact_id: str
|
||||
producing_run: Optional[RunSummary] = None
|
||||
template: Optional[ArtifactLineage] = None
|
||||
input_artifacts: List[ArtifactLineage] = field(default_factory=list)
|
||||
output_artifacts: List[ArtifactLineage] = field(default_factory=list)
|
||||
generator_runs: List[RunSummary] = field(default_factory=list)
|
||||
validation_results: List[Dict[str, Any]] = field(default_factory=list)
|
||||
impact_debt: List[Dict[str, Any]] = field(default_factory=list)
|
||||
dependency_chain: List[str] = field(default_factory=list)
|
||||
|
||||
def to_dict(self) -> Dict[str, Any]:
|
||||
"""Convert to dictionary."""
|
||||
return {
|
||||
"artifact_id": self.artifact_id,
|
||||
"producing_run": self.producing_run.to_dict() if self.producing_run else None,
|
||||
"template": self.template.to_dict() if self.template else None,
|
||||
"input_artifacts": [a.to_dict() for a in self.input_artifacts],
|
||||
"output_artifacts": [a.to_dict() for a in self.output_artifacts],
|
||||
"generator_runs": [r.to_dict() for r in self.generator_runs],
|
||||
"validation_results": self.validation_results,
|
||||
"impact_debt": self.impact_debt,
|
||||
"dependency_chain": self.dependency_chain,
|
||||
}
|
||||
315
markitect/prompts/traceability/service.py
Normal file
315
markitect/prompts/traceability/service.py
Normal file
@@ -0,0 +1,315 @@
|
||||
"""
|
||||
Traceability service for artifact provenance tracking.
|
||||
|
||||
Implements FR-11.1: Trace any artifact to its producing PromptTemplate,
|
||||
input artifacts, generator runs, and quality validation results.
|
||||
|
||||
Implements FR-11.2: Enable recomputation based on dependency changes.
|
||||
|
||||
Composition layer over existing services — does NOT duplicate data storage.
|
||||
"""
|
||||
|
||||
from typing import Any, Dict, List, Optional
|
||||
|
||||
from markitect.prompts.dependencies.graph import GraphBuilder
|
||||
from markitect.prompts.dependencies.queries import DependencyQueryService
|
||||
from markitect.prompts.dependencies.repository import IDependencyRepository
|
||||
from markitect.prompts.execution.models import PromptRun
|
||||
from markitect.prompts.incremental.engine import IncrementalExecutionEngine
|
||||
from markitect.prompts.quality.validator import QualityValidator
|
||||
from markitect.prompts.repositories.interfaces import IArtifactRepository
|
||||
from markitect.prompts.traceability.models import (
|
||||
ArtifactLineage,
|
||||
ProvenanceTrace,
|
||||
RunSummary,
|
||||
)
|
||||
|
||||
|
||||
def _run_to_summary(run: PromptRun) -> RunSummary:
|
||||
"""Convert a PromptRun to a RunSummary."""
|
||||
return RunSummary.create(
|
||||
run_id=run.id,
|
||||
template_id=run.template_id,
|
||||
status=run.status.value,
|
||||
stage=run.stage.value,
|
||||
input_bundle_hash=run.input_bundle_hash,
|
||||
started_at=run.started_at,
|
||||
parent_run_id=run.parent_run_id,
|
||||
depth=run.depth,
|
||||
completed_at=run.completed_at,
|
||||
)
|
||||
|
||||
|
||||
class TraceabilityService:
|
||||
"""
|
||||
Composition layer for full artifact provenance tracing.
|
||||
|
||||
Delegates to DependencyQueryService, QualityValidator,
|
||||
IncrementalExecutionEngine, and direct repository access.
|
||||
"""
|
||||
|
||||
def __init__(
|
||||
self,
|
||||
artifact_repo: IArtifactRepository,
|
||||
dependency_repo: IDependencyRepository,
|
||||
db_path: Optional[str] = None,
|
||||
):
|
||||
"""
|
||||
Compose over existing repos and services.
|
||||
|
||||
Args:
|
||||
artifact_repo: Repository for artifact lookups
|
||||
dependency_repo: Repository for dependency edge lookups
|
||||
db_path: Optional database path for quality/debt services
|
||||
"""
|
||||
self._artifact_repo = artifact_repo
|
||||
self._dependency_repo = dependency_repo
|
||||
self._db_path = db_path
|
||||
self._query_service = DependencyQueryService(dependency_repo)
|
||||
self._graph_builder = GraphBuilder(dependency_repo)
|
||||
self._validator = QualityValidator(db_path=db_path) if db_path else None
|
||||
self._engine = (
|
||||
IncrementalExecutionEngine(db_path, self._query_service)
|
||||
if db_path
|
||||
else None
|
||||
)
|
||||
# Run registry: external code can register runs for tracing
|
||||
self._runs: Dict[str, PromptRun] = {}
|
||||
|
||||
def register_run(self, run: PromptRun) -> None:
|
||||
"""
|
||||
Register a run for traceability lookups.
|
||||
|
||||
Args:
|
||||
run: PromptRun to register
|
||||
"""
|
||||
self._runs[run.id] = run
|
||||
|
||||
def trace_artifact(self, artifact_id: str) -> ProvenanceTrace:
|
||||
"""
|
||||
Full provenance trace for an artifact (FR-11.1).
|
||||
|
||||
Args:
|
||||
artifact_id: Artifact to trace
|
||||
|
||||
Returns:
|
||||
ProvenanceTrace with all provenance data
|
||||
"""
|
||||
trace = ProvenanceTrace(artifact_id=artifact_id)
|
||||
|
||||
# Find producing run
|
||||
producing_run = self.get_producing_run(artifact_id)
|
||||
trace.producing_run = producing_run
|
||||
|
||||
if producing_run:
|
||||
# Get template artifact
|
||||
template_artifact = self._artifact_repo.get_by_id(
|
||||
producing_run.template_id
|
||||
)
|
||||
if template_artifact:
|
||||
trace.template = ArtifactLineage(
|
||||
artifact_id=template_artifact.id,
|
||||
name=template_artifact.name,
|
||||
space_id=template_artifact.space_id,
|
||||
artifact_type=template_artifact.artifact_type.value,
|
||||
content_digest=template_artifact.content_digest,
|
||||
role="template",
|
||||
)
|
||||
|
||||
# Get input and output artifacts
|
||||
trace.input_artifacts = self.get_input_artifacts(producing_run.run_id)
|
||||
trace.output_artifacts = self.get_output_artifacts(producing_run.run_id)
|
||||
|
||||
# Get generator sub-runs
|
||||
trace.generator_runs = self.get_generator_runs(producing_run.run_id)
|
||||
|
||||
# Get validation history
|
||||
trace.validation_results = self.get_validation_history(artifact_id)
|
||||
|
||||
# Get impact debt
|
||||
trace.impact_debt = self.get_impact_debt(artifact_id)
|
||||
|
||||
# Build dependency chain
|
||||
deps = self._query_service.find_transitive_dependencies(artifact_id)
|
||||
trace.dependency_chain = sorted(deps)
|
||||
|
||||
return trace
|
||||
|
||||
def get_producing_run(self, artifact_id: str) -> Optional[RunSummary]:
|
||||
"""
|
||||
Find the run that produced an artifact.
|
||||
|
||||
Searches registered runs for one whose manifest lists
|
||||
this artifact as an output.
|
||||
|
||||
Args:
|
||||
artifact_id: Artifact to find producer of
|
||||
|
||||
Returns:
|
||||
RunSummary if found, None otherwise
|
||||
"""
|
||||
# Check dependency edges: find edges where this artifact is a target
|
||||
# with edge_type "generates"
|
||||
edges = self._dependency_repo.get_by_target(artifact_id)
|
||||
for edge in edges:
|
||||
# The source is the run or template that generated this artifact
|
||||
run = self._runs.get(edge.source_artifact_id)
|
||||
if run:
|
||||
return _run_to_summary(run)
|
||||
|
||||
# Fallback: search registered runs by manifest metadata
|
||||
for run in self._runs.values():
|
||||
manifest = run.metadata.get("manifest", {})
|
||||
outputs = manifest.get("output_artifacts", [])
|
||||
for output in outputs:
|
||||
if output.get("artifact_id") == artifact_id:
|
||||
return _run_to_summary(run)
|
||||
|
||||
return None
|
||||
|
||||
def get_input_artifacts(self, run_id: str) -> List[ArtifactLineage]:
|
||||
"""
|
||||
Get all input artifacts for a run.
|
||||
|
||||
Uses dependency edges to find artifacts that the run depends on.
|
||||
|
||||
Args:
|
||||
run_id: Run identifier
|
||||
|
||||
Returns:
|
||||
List of ArtifactLineage for inputs
|
||||
"""
|
||||
result = []
|
||||
# Find edges where this run is the target (artifacts -> run)
|
||||
edges = self._dependency_repo.get_by_run(run_id)
|
||||
for edge in edges:
|
||||
if edge.edge_type.value == "requires":
|
||||
artifact = self._artifact_repo.get_by_id(edge.source_artifact_id)
|
||||
if artifact:
|
||||
result.append(
|
||||
ArtifactLineage(
|
||||
artifact_id=artifact.id,
|
||||
name=artifact.name,
|
||||
space_id=artifact.space_id,
|
||||
artifact_type=artifact.artifact_type.value,
|
||||
content_digest=artifact.content_digest,
|
||||
role="input",
|
||||
)
|
||||
)
|
||||
# Also check manifest resolved_inputs
|
||||
run = self._runs.get(run_id)
|
||||
if run:
|
||||
manifest = run.metadata.get("manifest", {})
|
||||
seen_ids = {a.artifact_id for a in result}
|
||||
for inp in manifest.get("resolved_inputs", []):
|
||||
aid = inp.get("artifact_id", "")
|
||||
if aid and aid not in seen_ids:
|
||||
artifact = self._artifact_repo.get_by_id(aid)
|
||||
if artifact:
|
||||
result.append(
|
||||
ArtifactLineage(
|
||||
artifact_id=artifact.id,
|
||||
name=artifact.name,
|
||||
space_id=artifact.space_id,
|
||||
artifact_type=artifact.artifact_type.value,
|
||||
content_digest=artifact.content_digest,
|
||||
role="input",
|
||||
)
|
||||
)
|
||||
seen_ids.add(aid)
|
||||
return result
|
||||
|
||||
def get_output_artifacts(self, run_id: str) -> List[ArtifactLineage]:
|
||||
"""
|
||||
Get all output artifacts produced by a run.
|
||||
|
||||
Args:
|
||||
run_id: Run identifier
|
||||
|
||||
Returns:
|
||||
List of ArtifactLineage for outputs
|
||||
"""
|
||||
result = []
|
||||
# Find edges where this run is the source with "generates"
|
||||
edges = self._dependency_repo.get_by_run(run_id)
|
||||
for edge in edges:
|
||||
if edge.edge_type.value == "generates":
|
||||
artifact = self._artifact_repo.get_by_id(edge.target_artifact_id)
|
||||
if artifact:
|
||||
result.append(
|
||||
ArtifactLineage(
|
||||
artifact_id=artifact.id,
|
||||
name=artifact.name,
|
||||
space_id=artifact.space_id,
|
||||
artifact_type=artifact.artifact_type.value,
|
||||
content_digest=artifact.content_digest,
|
||||
role="output",
|
||||
)
|
||||
)
|
||||
# Also check manifest output_artifacts
|
||||
run = self._runs.get(run_id)
|
||||
if run:
|
||||
manifest = run.metadata.get("manifest", {})
|
||||
seen_ids = {a.artifact_id for a in result}
|
||||
for out in manifest.get("output_artifacts", []):
|
||||
aid = out.get("artifact_id", "")
|
||||
if aid and aid not in seen_ids:
|
||||
artifact = self._artifact_repo.get_by_id(aid)
|
||||
if artifact:
|
||||
result.append(
|
||||
ArtifactLineage(
|
||||
artifact_id=artifact.id,
|
||||
name=artifact.name,
|
||||
space_id=artifact.space_id,
|
||||
artifact_type=artifact.artifact_type.value,
|
||||
content_digest=artifact.content_digest,
|
||||
role="output",
|
||||
)
|
||||
)
|
||||
seen_ids.add(aid)
|
||||
return result
|
||||
|
||||
def get_generator_runs(self, run_id: str) -> List[RunSummary]:
|
||||
"""
|
||||
Get nested generator runs spawned by a run.
|
||||
|
||||
Args:
|
||||
run_id: Parent run identifier
|
||||
|
||||
Returns:
|
||||
List of RunSummary for child runs
|
||||
"""
|
||||
return [
|
||||
_run_to_summary(run)
|
||||
for run in self._runs.values()
|
||||
if run.parent_run_id == run_id
|
||||
]
|
||||
|
||||
def get_validation_history(self, artifact_id: str) -> List[Dict[str, Any]]:
|
||||
"""
|
||||
Get validation results for an artifact across all runs.
|
||||
|
||||
Args:
|
||||
artifact_id: Artifact identifier
|
||||
|
||||
Returns:
|
||||
List of validation result dictionaries
|
||||
"""
|
||||
if self._validator:
|
||||
return self._validator.get_results_for_artifact(artifact_id)
|
||||
return []
|
||||
|
||||
def get_impact_debt(self, artifact_id: str) -> List[Dict[str, Any]]:
|
||||
"""
|
||||
Get suppressed recomputation records for an artifact.
|
||||
|
||||
Args:
|
||||
artifact_id: Artifact identifier
|
||||
|
||||
Returns:
|
||||
List of impact debt dictionaries
|
||||
"""
|
||||
if self._engine:
|
||||
debts = self._engine.get_debt_for_artifact(artifact_id)
|
||||
return [d.to_dict() for d in debts]
|
||||
return []
|
||||
11
markitect/prompts/visualization/__init__.py
Normal file
11
markitect/prompts/visualization/__init__.py
Normal file
@@ -0,0 +1,11 @@
|
||||
"""
|
||||
Visualization package for dependency graph export.
|
||||
|
||||
Provides DOT and Mermaid format export for DependencyGraph instances.
|
||||
"""
|
||||
|
||||
from markitect.prompts.visualization.graph import GraphExporter
|
||||
|
||||
__all__ = [
|
||||
"GraphExporter",
|
||||
]
|
||||
106
markitect/prompts/visualization/graph.py
Normal file
106
markitect/prompts/visualization/graph.py
Normal file
@@ -0,0 +1,106 @@
|
||||
"""
|
||||
Graph visualization export for dependency graphs.
|
||||
|
||||
Exports DependencyGraph to DOT (Graphviz) and Mermaid diagram formats.
|
||||
"""
|
||||
|
||||
from markitect.prompts.dependencies.models import DependencyGraph, EdgeType
|
||||
|
||||
|
||||
# Edge type to style mappings
|
||||
_DOT_EDGE_STYLES = {
|
||||
EdgeType.REQUIRES: 'style="solid"',
|
||||
EdgeType.GENERATES: 'style="dashed"',
|
||||
EdgeType.INCLUDES: 'style="dotted"',
|
||||
}
|
||||
|
||||
_MERMAID_EDGE_STYLES = {
|
||||
EdgeType.REQUIRES: "-->",
|
||||
EdgeType.GENERATES: "-.->",
|
||||
EdgeType.INCLUDES: "==>",
|
||||
}
|
||||
|
||||
|
||||
class GraphExporter:
|
||||
"""Export DependencyGraph to DOT and Mermaid formats."""
|
||||
|
||||
@staticmethod
|
||||
def to_dot(graph: DependencyGraph, title: str = "Dependencies") -> str:
|
||||
"""
|
||||
Export dependency graph to Graphviz DOT format.
|
||||
|
||||
Args:
|
||||
graph: DependencyGraph to export
|
||||
title: Graph title
|
||||
|
||||
Returns:
|
||||
DOT format string
|
||||
"""
|
||||
lines = [
|
||||
f'digraph "{title}" {{',
|
||||
" rankdir=LR;",
|
||||
f' label="{title}";',
|
||||
" node [shape=box];",
|
||||
]
|
||||
|
||||
# Add nodes
|
||||
for node in sorted(graph.nodes):
|
||||
safe_id = node.replace("-", "_")
|
||||
lines.append(f' {safe_id} [label="{node}"];')
|
||||
|
||||
# Add edges
|
||||
for source in sorted(graph.nodes):
|
||||
for target in sorted(graph.get_successors(source)):
|
||||
edge_type = graph.get_edge_type(source, target)
|
||||
style = _DOT_EDGE_STYLES.get(edge_type, 'style="solid"')
|
||||
safe_source = source.replace("-", "_")
|
||||
safe_target = target.replace("-", "_")
|
||||
label = edge_type.value if edge_type else "requires"
|
||||
lines.append(
|
||||
f' {safe_source} -> {safe_target} [{style} label="{label}"];'
|
||||
)
|
||||
|
||||
lines.append("}")
|
||||
return "\n".join(lines)
|
||||
|
||||
@staticmethod
|
||||
def to_mermaid(graph: DependencyGraph, title: str = "Dependencies") -> str:
|
||||
"""
|
||||
Export dependency graph to Mermaid diagram format.
|
||||
|
||||
Args:
|
||||
graph: DependencyGraph to export
|
||||
title: Graph title (used as comment)
|
||||
|
||||
Returns:
|
||||
Mermaid format string
|
||||
"""
|
||||
lines = [
|
||||
f"%%{{ title: {title} }}%%",
|
||||
"graph LR",
|
||||
]
|
||||
|
||||
# Add edges
|
||||
edges_added = False
|
||||
for source in sorted(graph.nodes):
|
||||
for target in sorted(graph.get_successors(source)):
|
||||
edge_type = graph.get_edge_type(source, target)
|
||||
arrow = _MERMAID_EDGE_STYLES.get(edge_type, "-->")
|
||||
label = edge_type.value if edge_type else "requires"
|
||||
lines.append(f" {source}{arrow}|{label}|{target}")
|
||||
edges_added = True
|
||||
|
||||
# Add isolated nodes (no edges)
|
||||
if not edges_added:
|
||||
for node in sorted(graph.nodes):
|
||||
lines.append(f" {node}")
|
||||
else:
|
||||
# Add any isolated nodes that have no edges
|
||||
connected = set()
|
||||
for source in graph.nodes:
|
||||
if graph.get_successors(source) or graph.get_predecessors(source):
|
||||
connected.add(source)
|
||||
for node in sorted(graph.nodes - connected):
|
||||
lines.append(f" {node}")
|
||||
|
||||
return "\n".join(lines)
|
||||
Reference in New Issue
Block a user