CUST-WP-0050 follow-up: human review, push tooling, SSH inventory

Add human-review script for 13 high-blast-radius repos, bulk-push helper,
and SSH-based Gitea inventory probe. Update exclusion list with SSH-verified
absent slugs; marki-docx now classified and registered.
This commit is contained in:
2026-06-22 17:59:55 +02:00
parent 61fe8e0309
commit db88a34b3e
4 changed files with 310 additions and 17 deletions

View File

@@ -4,18 +4,18 @@
#
# Validate additions against canon/standards/repo-classification-standard_v1.0.md.
version: "1.0"
version: "1.1"
updated: "2026-06-22"
exclusions:
# Forks and personal repos — not ecosystem inventory.
- slug: tegwick/the-custodian
gitea_path: tegwick/the-custodian
reason: fork of the-custodian; not a managed ecosystem repo
reason: fork path not found on Gitea (SSH verified 2026-06-22)
- slug: python-snake
gitea_path: lando_worsch/python-snake
reason: personal / non-ecosystem repo
reason: personal / non-ecosystem repo (exists on Gitea; excluded by policy)
# Archived or collapsed hub registrations — superseded by another slug.
- slug: markitect-project
@@ -31,7 +31,7 @@ exclusions:
reason: archived duplicate; collapsed into vergabe-teilnahme
- slug: test_domain_v2
reason: archived test domain; not active portfolio
reason: archived test domain; not present on Gitea coulomb org (SSH verified)
# Local-only templates / sandboxes — not product inventory.
- slug: hub-core-seed
@@ -43,31 +43,27 @@ exclusions:
- slug: .nvm
reason: Node version manager checkout; not a coulomb project repo
# Gitea repos referenced in portfolio review but not present / not cloned locally
# at T11 execution time — classify when a checkout exists or Gitea inventory confirms.
# Portfolio-review slugs with no matching coulomb/* repo on Gitea (SSH verified 2026-06-22).
- slug: binect-chrome
reason: not cloned locally; pending inventory confirmation
reason: not present on Gitea coulomb org; likely renamed or removed
- slug: binect-js
reason: not cloned locally; pending inventory confirmation
reason: not present on Gitea coulomb org; likely renamed or removed
- slug: direkt-vermittlung-de
reason: not cloned locally; pending inventory confirmation
reason: not present on Gitea coulomb org; likely renamed or removed
- slug: polycode-sim
reason: not cloned locally; pending inventory confirmation
reason: not present on Gitea coulomb org; likely renamed or removed
- slug: ralph-workplan
reason: not cloned locally; pending inventory confirmation
reason: not present on Gitea coulomb org; likely renamed or removed
- slug: tele-mcp
reason: not cloned locally; pending inventory confirmation
reason: not present on Gitea coulomb org; likely renamed or removed
- slug: testdrive-jsui
reason: not cloned locally; pending inventory confirmation
reason: not present on Gitea coulomb org; likely renamed or removed
- slug: timeline-svg
reason: not cloned locally; pending inventory confirmation
- slug: marki-docx
reason: registered in hub; no local checkout at T11 — classify on next clone
reason: not present on Gitea coulomb org; likely renamed or removed

View File

@@ -0,0 +1,58 @@
#!/usr/bin/env python3
"""Compare State Hub registered repos against Gitea SSH reachability (no HTTP token)."""
from __future__ import annotations
import json
import subprocess
import sys
import urllib.request
API_BASE = "http://127.0.0.1:8000"
GITEA_REMOTE = "gitea-remote"
def hub_repos() -> list[dict]:
with urllib.request.urlopen(f"{API_BASE}/repos/", timeout=30) as resp:
return json.load(resp)
def gitea_exists(path: str) -> bool:
proc = subprocess.run(
[
"git",
"ls-remote",
f"{GITEA_REMOTE}:{path}.git",
"HEAD",
],
capture_output=True,
text=True,
env={**__import__("os").environ, "GIT_SSH_COMMAND": "ssh -o ConnectTimeout=8 -o BatchMode=yes"},
)
return proc.returncode == 0 and any(line.strip() for line in proc.stdout.splitlines())
def main() -> int:
repos = hub_repos()
active = [r for r in repos if r.get("status") == "active"]
matched: list[str] = []
missing: list[str] = []
for repo in sorted(active, key=lambda r: r["slug"]):
slug = repo["slug"]
if gitea_exists(f"coulomb/{slug}"):
matched.append(slug)
else:
missing.append(slug)
print(f"State Hub active repos: {len(active)}")
print(f"Gitea SSH reachable (coulomb/<slug>): {len(matched)}")
print(f"Hub-only (no coulomb/<slug> on Gitea SSH): {len(missing)}")
if missing:
print("\nMissing on Gitea:")
for slug in missing:
print(f" - {slug}")
return 0
if __name__ == "__main__":
raise SystemExit(main())

View File

@@ -0,0 +1,194 @@
#!/usr/bin/env python3
"""Apply human-reviewed classification corrections (CUST-WP-0050 follow-up)."""
from __future__ import annotations
import subprocess
import sys
from pathlib import Path
import yaml
REPO_ROOT = Path(__file__).resolve().parent.parent
VALIDATOR = REPO_ROOT / "tools" / "validate_repo_classification.py"
HOME = Path.home()
# Curated human-reviewed classifications for high-blast-radius portfolio anchors.
HUMAN_REVIEWS: dict[str, dict] = {
"helix-forge": {
"category": "product",
"domain": "infotech",
"secondary_domains": ["agents"],
"capability_tags": [
"platform",
"capability-registry",
"coordination",
"knowledge",
"product-development",
],
"business_stake": ["product", "technology", "execution", "automation", "intelligence"],
"business_mechanics": ["intention", "coordination", "operation", "adaptation"],
"notes": "Capability development platform; standard §13.1 — human confirmed.",
},
"reuse-surface": {
"category": "product",
"domain": "infotech",
"secondary_domains": ["agents"],
"capability_tags": ["capability-registry", "discovery", "reuse", "maturity", "evidence"],
"business_stake": ["technology", "product", "intelligence", "automation"],
"business_mechanics": ["intention", "control", "adaptation"],
"notes": "Reuse discovery surface; standard §13.7 — human confirmed.",
},
"coordination-engine": {
"category": "product",
"domain": "communication",
"secondary_domains": ["infotech", "agents"],
"capability_tags": ["coordination", "workflow", "orchestration", "evidence", "platform"],
"business_stake": ["product", "technology", "operations", "automation"],
"business_mechanics": ["coordination", "operation", "adaptation"],
"notes": "Goal-driven coordination framework; human confirmed.",
},
"markitect-main": {
"category": "product",
"domain": "communication",
"secondary_domains": ["infotech", "agents"],
"capability_tags": ["knowledge", "documentation", "product-development", "platform"],
"business_stake": ["product", "technology", "execution"],
"business_mechanics": ["intention", "coordination", "operation", "adaptation"],
"notes": "Markitect successor to archived markitect-project; human confirmed.",
},
"citation-evidence": {
"category": "product",
"domain": "infotech",
"secondary_domains": ["communication", "government"],
"capability_tags": ["citations", "evidence", "knowledge", "traceability", "source-management"],
"business_stake": ["intelligence", "legal", "product", "technology"],
"business_mechanics": ["control", "coordination", "adaptation"],
"notes": "Citation/evidence product; standard §13.5 — human confirmed.",
},
"adaptive-pricing": {
"category": "product",
"domain": "financials",
"secondary_domains": ["infotech", "agents"],
"capability_tags": ["pricing", "monetization", "lifecycle", "decision-support", "product-development"],
"business_stake": ["finance", "product", "sales", "intelligence", "automation"],
"business_mechanics": ["intention", "control", "adaptation"],
"notes": "Adaptive pricing product; standard §13.6 — human confirmed.",
},
"identity-canon": {
"category": "research",
"domain": "infotech",
"secondary_domains": ["government"],
"capability_tags": ["identity", "access-control", "terminology", "canon", "governance"],
"business_stake": ["technology", "legal", "operations", "intelligence"],
"business_mechanics": ["intention", "control", "adaptation"],
"notes": "Identity canon; standard §13.3 — human confirmed.",
},
"net-kingdom": {
"category": "product",
"domain": "infotech",
"secondary_domains": [],
"capability_tags": ["security", "identity", "platform", "operations", "access-control"],
"business_stake": ["technology", "operations", "legal", "automation"],
"business_mechanics": ["control", "operation", "adaptation"],
"notes": "NetKingdom security/identity platform; standard §13.4 — human confirmed.",
},
"audit-core": {
"category": "tooling",
"domain": "infotech",
"secondary_domains": [],
"capability_tags": ["audit", "traceability", "security", "governance", "operations"],
"business_stake": ["technology", "operations", "legal", "automation"],
"business_mechanics": ["control", "operation"],
"notes": "Multi-tenant audit emit capability; human confirmed.",
},
"key-cape": {
"category": "product",
"domain": "infotech",
"secondary_domains": ["communication"],
"capability_tags": ["identity", "access-control", "security", "platform", "operations"],
"business_stake": ["technology", "operations", "legal", "product"],
"business_mechanics": ["control", "operation", "adaptation"],
"notes": "NetKingdom IAM Profile lightweight mode (Authelia/LLDAP/privacyIDEA); human corrected domain from communication→infotech.",
},
"flex-auth": {
"category": "product",
"domain": "infotech",
"secondary_domains": ["government"],
"capability_tags": ["identity", "access-control", "policy", "governance", "audit"],
"business_stake": ["technology", "legal", "operations", "product"],
"business_mechanics": ["control", "coordination", "adaptation"],
"notes": "Policy-as-code authorization registry; human corrected domain from communication→infotech.",
},
"ops-hub": {
"category": "tooling",
"domain": "infotech",
"secondary_domains": [],
"capability_tags": ["operations", "platform", "observability", "coordination", "governance"],
"business_stake": ["operations", "technology", "automation"],
"business_mechanics": ["coordination", "operation", "control"],
"notes": "Inter-Hub operations extension (environments, incidents, runbooks); human corrected category project→tooling.",
},
"railiance-platform": {
"category": "tooling",
"domain": "financials",
"secondary_domains": ["infotech"],
"capability_tags": ["platform", "operations", "configuration", "governance"],
"business_stake": ["finance", "technology", "operations"],
"business_mechanics": ["control", "operation", "coordination"],
"notes": "Railiance platform substrate; human corrected category project→tooling.",
},
}
def build_block(slug: str, data: dict) -> dict:
notes = data.pop("notes", None)
block = {
"repo_classification": {
"standard": "Repo Classification Standard",
"version": "1.0",
"classified_at": "2026-06-22",
"classified_by": "human",
**data,
}
}
if notes:
block["repo_classification"]["notes"] = notes
return block
def main() -> int:
updated: list[str] = []
for slug, data in HUMAN_REVIEWS.items():
repo_path = HOME / slug
target = repo_path / ".repo-classification.yaml"
if not repo_path.is_dir():
print(f"skip {slug}: no checkout", file=sys.stderr)
continue
payload = build_block(slug, dict(data))
target.write_text(yaml.dump(payload, sort_keys=False, allow_unicode=True))
proc = subprocess.run([sys.executable, str(VALIDATOR), str(target)], capture_output=True, text=True)
if proc.returncode != 0:
print(proc.stdout, proc.stderr, file=sys.stderr)
return 1
subprocess.run(["git", "add", ".repo-classification.yaml"], cwd=repo_path, check=True)
diff = subprocess.run(["git", "diff", "--cached", "--quiet"], cwd=repo_path)
if diff.returncode != 0:
subprocess.run(
[
"git",
"commit",
"-m",
"Human-review .repo-classification.yaml (CUST-WP-0050 follow-up)",
],
cwd=repo_path,
check=True,
)
updated.append(slug)
print(f"Human-reviewed: {len(updated)}")
for slug in updated:
print(f"{slug}")
return 0
if __name__ == "__main__":
raise SystemExit(main())

View File

@@ -0,0 +1,45 @@
#!/usr/bin/env bash
# Push unpushed .repo-classification.yaml commits across local ecosystem repos.
set -euo pipefail
HOME_REPOS="${HOME}"
PUSHED=0
SKIPPED=0
FAILED=0
FAILED_NAMES=()
for dir in "$HOME_REPOS"/*/; do
[ -d "$dir/.git" ] || continue
[ -f "$dir/.repo-classification.yaml" ] || continue
name=$(basename "$dir")
cd "$dir"
if ! git rev-parse --abbrev-ref HEAD >/dev/null 2>&1; then
continue
fi
branch=$(git rev-parse --abbrev-ref HEAD)
ahead=$(git rev-list --count "@{u}..HEAD" 2>/dev/null || echo "no-upstream")
if [ "$ahead" = "no-upstream" ] || [ "$ahead" = "0" ]; then
SKIPPED=$((SKIPPED + 1))
continue
fi
echo "Pushing $name ($branch, $ahead commit(s))..."
if git push origin "$branch" 2>&1; then
PUSHED=$((PUSHED + 1))
else
FAILED=$((FAILED + 1))
FAILED_NAMES+=("$name")
fi
done
echo ""
echo "Summary: pushed=$PUSHED skipped=$SKIPPED failed=$FAILED"
if [ "${#FAILED_NAMES[@]}" -gt 0 ]; then
echo "Failed:"
printf ' %s\n' "${FAILED_NAMES[@]}"
exit 1
fi