deer-flow/scripts/sync_labels.py
Xinmin Zeng aca7acc105
feat(ci): PR/issue auto-labeling + declarative label sync (#3360)
- .github/labels.yml: declarative source of truth (29 namespaced labels)
- scripts/sync_labels.py + label-sync.yml: idempotent label sync (self-bootstraps on merge)
- labeler.yml + pr-labeler.yml: area:* labels by changed path (actions/labeler)
- pr-triage.yml: size/*, risk:*, needs-validation, first-time-contributor, reviewing
- issue-triage.yml: needs-triage on new issues (self-healing)

All PR workflows use pull_request_target but never check out or run PR code
(read changed-file metadata via the API only).
2026-06-03 16:40:24 +08:00

94 lines
2.8 KiB
Python

#!/usr/bin/env python3
"""Sync GitHub labels from the declarative source of truth.
Reads ``.github/labels.yml`` and creates/updates each label via the GitHub CLI
(``gh label create --force``). Sync is additive/update-only: labels not listed
in the file are left untouched (never deleted).
Usage:
uv run --with pyyaml python scripts/sync_labels.py [--repo OWNER/NAME] [--dry-run]
Requires the ``gh`` CLI to be installed and authenticated (or ``GH_TOKEN`` set,
as in CI). When ``--repo`` is omitted, ``gh`` uses the current repository.
"""
from __future__ import annotations
import argparse
import subprocess
import sys
from pathlib import Path
try:
import yaml
except ModuleNotFoundError: # pragma: no cover - guidance for local runs
sys.exit(
"PyYAML is required. Run via:\n"
" uv run --with pyyaml python scripts/sync_labels.py"
)
LABELS_FILE = Path(__file__).resolve().parent.parent / ".github" / "labels.yml"
def load_labels(path: Path) -> list[dict[str, str]]:
data = yaml.safe_load(path.read_text(encoding="utf-8")) or {}
labels = data.get("labels")
if not isinstance(labels, list) or not labels:
sys.exit(f"No labels found in {path}")
for label in labels:
if not isinstance(label, dict) or "name" not in label:
sys.exit(f"Invalid label entry (missing 'name'): {label!r}")
return labels
def sync_label(label: dict[str, str], repo: str | None, dry_run: bool) -> bool:
name = str(label["name"])
color = str(label.get("color", "ededed")).lstrip("#")
description = str(label.get("description", ""))
cmd = ["gh", "label", "create", name, "--color", color, "--force"]
if description:
cmd += ["--description", description]
if repo:
cmd += ["--repo", repo]
if dry_run:
print(f"[dry-run] {' '.join(cmd)}")
return True
result = subprocess.run(cmd, capture_output=True, text=True)
if result.returncode != 0:
print(f"{name}: {result.stderr.strip()}", file=sys.stderr)
return False
print(f"{name}")
return True
def main() -> int:
parser = argparse.ArgumentParser(description=__doc__)
parser.add_argument("--repo", help="Target repository as OWNER/NAME")
parser.add_argument(
"--dry-run",
action="store_true",
help="Print the gh commands without executing them",
)
args = parser.parse_args()
labels = load_labels(LABELS_FILE)
target = args.repo or "(current repository)"
print(f"Syncing {len(labels)} labels to {target}")
failures = sum(
0 if sync_label(label, args.repo, args.dry_run) else 1 for label in labels
)
if failures:
print(f"\n{failures} label(s) failed to sync", file=sys.stderr)
return 1
print(f"\nDone — {len(labels)} labels in sync.")
return 0
if __name__ == "__main__":
raise SystemExit(main())