#!/usr/bin/env python3 """Check ARIS skill inventory drift across mainline, Codex mirror, and docs.""" from __future__ import annotations import re import sys from pathlib import Path REPO_ROOT = Path(__file__).resolve().parents[1] SKILLS_ROOT = REPO_ROOT / "skills" CODEX_ROOT = SKILLS_ROOT / "skills-codex" CATALOG = REPO_ROOT / "docs" / "SKILLS_CATALOG.md" README = REPO_ROOT / "README.md" README_CN = REPO_ROOT / "README_CN.md" AGENT_GUIDE = REPO_ROOT / "AGENT_GUIDE.md" ARIS_INTRO = REPO_ROOT / "docs" / "ARIS_INTRO.md" ARIS_INTRO_HTML = REPO_ROOT / "docs" / "ARIS_INTRO.html" CODEX_README = CODEX_ROOT / "README.md" CODEX_README_CN = CODEX_ROOT / "README_CN.md" BOM = b"\xef\xbb\xbf" FORBIDDEN_CODEX_REVIEWER_STRINGS = ( "mcp__codex__codex", "codex-reply", "reviewer-continuation", "threadId", ) # Phase A (issue #240): cross-language anchor IDs that MUST exist as # explicit `` in both README.md and README_CN.md so that # cross-language hyperlinks resolve identically. Adding a new numbered # section means adding it to both READMEs AND extending this list. REQUIRED_README_ANCHORS = ( "contents", "more-than-just-a-prompt", "whats-new", "quick-start", "features", "score-progression", "community-showcase", "awesome-community-skills", "workflows", "skills-catalog", "setup", "customization", "alternative-model-combinations", "community", "citation", "star-history", "acknowledgements", "license", "prerequisites", "install-skills", "gpu-server-setup", "alt-a-glm--gpt", "-optional-gpt-54-pro-via-oracle", "-research-wiki--persistent-research-memory", ) def skill_names(root: Path) -> set[str]: return {path.parent.name for path in root.glob("*/SKILL.md")} def allowed_tools(text: str) -> list[str]: """Tokens on the frontmatter `allowed-tools:` line (empty if absent).""" match = re.search(r"^allowed-tools:\s*(.+)$", text, flags=re.MULTILINE) if not match: return [] return [tok.strip() for tok in match.group(1).split(",") if tok.strip()] def frontmatter_split(text: str) -> str: """Return the body after a leading YAML frontmatter block (whole text if no frontmatter). Anchors on the opening `---` fence and the first closing `---` fence, so `---` horizontal rules later in the body are not mistaken for the frontmatter boundary.""" match = re.match(r"^---\n.*?\n---\n", text, flags=re.DOTALL) return text[match.end():] if match else text def readme_anchors(text: str) -> set[str]: return set(re.findall(r'', text)) def numbered_h2_count(text: str) -> int: return len(re.findall(r"^## \d+\.\s", text, flags=re.MULTILINE)) def read(path: Path) -> str: return path.read_text(encoding="utf-8") def catalog_names() -> set[str]: text = read(CATALOG) return set(re.findall(r"\[`/([^`]+)`\]$\.\./skills/[^)]+/SKILL\.md$", text)) def require(condition: bool, message: str, failures: list[str]) -> None: if not condition: failures.append(message) def require_count(path: Path, text: str, pattern: str, expected_count: int, failures: list[str]) -> None: match = re.search(pattern, text) rel = path.relative_to(REPO_ROOT) if match is None: failures.append(f"{rel} is missing live count pattern: {pattern}") return actual = int(match.group("count")) if actual != expected_count: failures.append(f"{rel} reports {actual} skills; expected {expected_count}") def check_inventory() -> list[str]: failures: list[str] = [] main = skill_names(SKILLS_ROOT) codex = skill_names(CODEX_ROOT) catalog = catalog_names() missing_codex = sorted(main - codex) extra_codex = sorted(codex - main) missing_catalog = sorted(main - catalog) extra_catalog = sorted(catalog - main) require(not missing_codex, f"missing Codex mirrors: {', '.join(missing_codex)}", failures) require(not extra_codex, f"unexpected Codex-only skills: {', '.join(extra_codex)}", failures) require(not missing_catalog, f"missing catalog entries: {', '.join(missing_catalog)}", failures) require(not extra_catalog, f"catalog entries without mainline skills: {', '.join(extra_catalog)}", failures) catalog_text = read(CATALOG) readme = read(README) readme_cn = read(README_CN) agent_guide = read(AGENT_GUIDE) aris_intro = read(ARIS_INTRO) aris_intro_html = read(ARIS_INTRO_HTML) codex_readme = read(CODEX_README) codex_readme_cn = read(CODEX_README_CN) expected_count = len(main) count_checks = [ (CATALOG, catalog_text, r"\*\*(?P\d+) skills\*\*"), (README, readme, r"📊\s+\*\*(?P\d+) composable skills\*\*"), (README, readme, r"ARIS ships \*\*(?P\d+)\+ skills\*\*"), (README_CN, readme_cn, r"📊\s+\*\*(?P\d+) 个可组合 skill\*\*"), (README_CN, readme_cn, r"ARIS 现有 \*\*(?P\d+)\+ 个 skill\*\*"), (AGENT_GUIDE, agent_guide, r"Full catalog.*?\*\*(?P\d+) skills\*\*"), (ARIS_INTRO, aris_intro, r"collection of \*\*(?P\d+) composable Claude Code skills\*\*"), (ARIS_INTRO, aris_intro, r"## The (?P\d+) Skills"), (ARIS_INTRO, aris_intro, r"一组 (?P\d+) 个可组合的 Claude Code skills"), (ARIS_INTRO_HTML, aris_intro_html, r"collection of (?P\d+) composable Claude Code skills"), (ARIS_INTRO_HTML, aris_intro_html, r'id="the-(?P\d+)-skills"'), (ARIS_INTRO_HTML, aris_intro_html, r"一组 (?P\d+) 个可组合的 Claude Code skills"), (CODEX_README, codex_readme, r"all `(?P\d+)` mainline skills"), (CODEX_README_CN, codex_readme_cn, r"`(?P\d+)`[^\n]*skill"), ] for path, text, pattern in count_checks: require_count(path, text, pattern, expected_count, failures) for skill_file in sorted(CODEX_ROOT.glob("*/SKILL.md")): if skill_file.read_bytes().startswith(BOM): failures.append(f"{skill_file.relative_to(REPO_ROOT)} starts with UTF-8 BOM before frontmatter") text = read(skill_file) for forbidden in FORBIDDEN_CODEX_REVIEWER_STRINGS: if forbidden in text: failures.append(f"{skill_file.relative_to(REPO_ROOT)} contains forbidden reviewer string: {forbidden}") # README parity (EN ↔ CN) — Phase A invariant from #240 en_anchors = readme_anchors(readme) cn_anchors = readme_anchors(readme_cn) for required in REQUIRED_README_ANCHORS: if required not in en_anchors: failures.append(f"README.md missing required anchor: ") if required not in cn_anchors: failures.append(f"README_CN.md missing required anchor: ") en_h2 = numbered_h2_count(readme) cn_h2 = numbered_h2_count(readme_cn) require(en_h2 == 16, f"README.md has {en_h2} numbered H2 sections; expected 16 (Phase A)", failures) require(cn_h2 == 16, f"README_CN.md has {cn_h2} numbered H2 sections; expected 16 (Phase A)", failures) # Agent-grant hygiene (WB2): `Agent` in allowed-tools is the Tier-2 # fan-out capability gate. Per shared-references/fan-out-pattern.md it is # granted ONLY to skills that actually fan out, and such skills MUST cite # the convention doc in their body. A grant without that citation is a # vestigial/boilerplate grant and fails the drift check. for skill_file in sorted(SKILLS_ROOT.glob("*/SKILL.md")): text = read(skill_file) if "Agent" not in allowed_tools(text): continue if "fan-out-pattern.md" not in frontmatter_split(text): rel = skill_file.relative_to(REPO_ROOT) failures.append( f"{rel} grants `Agent` in allowed-tools but its body does not " f"cite fan-out-pattern.md — vestigial grant or undocumented " f"fan-out (see shared-references/fan-out-pattern.md)" ) # Watchdog 'loop' task type ⇔ its documented trigger (A2). Mirrors the Agent-grant⇒cite # rule above: a feature with no documented trigger is dead weight, a documented trigger # for a missing feature is a broken pointer. The loop type is a shipped feature, so BOTH # must be present. watchdog_py = read(REPO_ROOT / "tools" / "watchdog.py") ext_cadence = read(SKILLS_ROOT / "shared-references" / "external-cadence.md") tool_loop = bool(re.search(r"def check_loop\b", watchdog_py)) and bool(re.search(r'==\s*"loop"', watchdog_py)) doc_loop = bool(re.search(r'"type"\s*:\s*"loop"', ext_cadence)) require(tool_loop, "tools/watchdog.py must implement the loop-liveness check_loop (A2)", failures) require(doc_loop, "external-cadence.md must document registering a watchdog 'loop' task — its trigger (A2)", failures) # iteration_log.py (stall→pivot, B) must exist AND be both documented (the ladder with # both thresholds) and actually wired into a heartbeat consumer — else it is dead code. # Same dead-code guard as the Agent-grant⇒cite rule above. extc = read(SKILLS_ROOT / "shared-references" / "external-cadence.md") rp = read(SKILLS_ROOT / "research-pipeline" / "SKILL.md") tool_stall = (REPO_ROOT / "tools" / "iteration_log.py").is_file() doc_ladder = bool(re.search(r"forced structural pivot", extc, re.IGNORECASE)) and \ bool(re.search(r"stale_count`?\s*>=\s*2", extc)) and bool(re.search(r"stale_count`?\s*>=\s*4", extc)) # Prove the wiring is real (not a prose mention): resolver chain + note invocation + # both pivot branches handled in research-pipeline. wired = ('iteration_log.py' in rp and 'ITER_LOG' in rp and re.search(r'"\$ITER_LOG"\s+note', rp) is not None and 'pivot' in rp and 'structural' in rp and 'human' in rp) require(tool_stall, "tools/iteration_log.py (stall→pivot, B) must exist", failures) require(doc_ladder, "external-cadence.md must document the stall ladder with both thresholds (>=2 structural, >=4 human) (B)", failures) require(wired, "research-pipeline/SKILL.md must actually wire iteration_log.py (resolver + `$ITER_LOG note` + pivot handling) — not just mention it (B)", failures) # research_wiki.py add_claim (claim layer) ⇔ its documented birth trigger in # /proof-checker. add_claim is a writer; without a skill that calls it, the claim # layer is dead code (the exact orphan-writer trap). Same dead-code guard as above: # the writer and its single birth point must BOTH be present. rwiki = read(REPO_ROOT / "tools" / "research_wiki.py") pchk = read(SKILLS_ROOT / "proof-checker" / "SKILL.md") tool_claim = bool(re.search(r"def add_claim\b", rwiki)) and bool(re.search(r'add_parser\("add_claim"', rwiki)) # Prove the trigger is real (anchored to the actual command line, not a prose # mention or comment): proof-checker must literally invoke the resolved helper. born = re.search(r'python3\s+"\$WIKI_SCRIPT"\s+add_claim\b', pchk) is not None require(tool_claim, "tools/research_wiki.py must implement the add_claim claim-layer writer + its CLI", failures) require(born, "proof-checker/SKILL.md must invoke `add_claim` as the claim birth point — not just mention it (else add_claim is an orphan writer)", failures) # research_wiki.py upsert_idea (idea layer) ⇔ its documented write-back in # /idea-creator Phase 7. Same orphan-writer guard: the deterministic idea writer # and the skill that calls it must BOTH be present, anchored to the real command. icreator = read(SKILLS_ROOT / "idea-creator" / "SKILL.md") tool_idea = bool(re.search(r"def upsert_idea\b", rwiki)) and bool(re.search(r'add_parser\("upsert_idea"', rwiki)) idea_written = re.search(r'python3\s+"\$WIKI_SCRIPT"\s+upsert_idea\b', icreator) is not None require(tool_idea, "tools/research_wiki.py must implement the upsert_idea idea-layer writer + its CLI", failures) require(idea_written, "idea-creator/SKILL.md must invoke `upsert_idea` to record ideas (Phase 7) — not just mention it (else ideas are written freehand and skipped on re-gen)", failures) # research_wiki.py add_experiment (experiment layer) ⇔ its write-back in # /result-to-claim Step 5. Same orphan-writer guard; closes the last freehand # wiki layer so the supports/invalidates edges never dangle off a missing exp node. r2c = read(SKILLS_ROOT / "result-to-claim" / "SKILL.md") tool_exp = bool(re.search(r"def add_experiment\b", rwiki)) and bool(re.search(r'add_parser\("add_experiment"', rwiki)) exp_written = re.search(r'python3\s+"\$WIKI_SCRIPT"\s+add_experiment\b', r2c) is not None require(tool_exp, "tools/research_wiki.py must implement the add_experiment experiment-layer writer + its CLI", failures) require(exp_written, "result-to-claim/SKILL.md must invoke `add_experiment` to create the experiment node (Step 5) — not just mention it (else exp pages are freehand and supports/invalidates edges dangle)", failures) return failures def main() -> int: failures = check_inventory() if failures: print("ARIS skill inventory drift detected:", file=sys.stderr) for failure in failures: print(f"- {failure}", file=sys.stderr) return 1 print("ARIS skill inventory is consistent.") return 0 if __name__ == "__main__": raise SystemExit(main())