From ddc83582819bcee2a76912dfe39da34dc2aac6ba Mon Sep 17 00:00:00 2001 From: dangotbanned <125183946+dangotbanned@users.noreply.github.com> Date: Tue, 24 Dec 2024 19:41:38 +0000 Subject: [PATCH] ci: replace `sync_website.sh` with `.py` Decouples from `bash`, simplifies (https://github.com/vega/altair/issues/3577#issuecomment-2548280136) --- doc/sync_website.py | 125 ++++++++++++++++++++++++++++++++++++++++++++ doc/sync_website.sh | 27 ---------- pyproject.toml | 3 +- 3 files changed, 127 insertions(+), 28 deletions(-) create mode 100644 doc/sync_website.py delete mode 100644 doc/sync_website.sh diff --git a/doc/sync_website.py b/doc/sync_website.py new file mode 100644 index 000000000..5b7fd9bcf --- /dev/null +++ b/doc/sync_website.py @@ -0,0 +1,125 @@ +from __future__ import annotations + +import argparse +import datetime as dt +import os +import shutil +import subprocess +from pathlib import Path +from typing import TYPE_CHECKING + +if TYPE_CHECKING: + from typing import Literal + +DOC_REPO_ORG: Literal["altair-viz"] = "altair-viz" +GITHUB: Literal["github"] = "github" +WEBSITE: str = f"{DOC_REPO_ORG}.{GITHUB}.io" +DOC_REPO_URL: str = f"https://{GITHUB}.com/{DOC_REPO_ORG}/{WEBSITE}.git" + +WORKING_DIR: Path = Path(__file__).parent +DOC_BUILD_DIR: Path = WORKING_DIR / "_build" +DOC_REPO_DIR: Path = DOC_BUILD_DIR / WEBSITE +DOC_HTML_DIR: Path = DOC_BUILD_DIR / "html" + +DOC_BUILD_INFO: Path = DOC_HTML_DIR / ".buildinfo" + + +CMD_CLONE = f"git clone --filter=blob:none {DOC_REPO_URL}" +"""Partial clone, as we only keep ``./.git/**``.""" + +CMD_PULL = "git pull" +CMD_HEAD_HASH = "git rev-parse HEAD" +CMD_ADD = "git add . --all" +CMD_COMMIT = "git commit -m" +CMD_PUSH = "git push origin master" + +COMMIT_MSG_PREFIX = "doc build for commit" +UNTRACKED = ".git" + + +def _path_repr(fp: Path, /) -> str: + return f"{fp.relative_to(WORKING_DIR.parent).as_posix()!r}" + + +def clone_or_sync_repo() -> None: + os.chdir(DOC_BUILD_DIR) + if not DOC_REPO_DIR.exists(): + print(f"Cloning repo {WEBSITE!r}\n -> {_path_repr(DOC_REPO_DIR)}") + subprocess.run(CMD_CLONE, check=True) + else: + print(f"Using existing cloned altair directory {_path_repr(DOC_REPO_DIR)}") + os.chdir(DOC_REPO_DIR) + print(f"Syncing {WEBSITE!r}\n -> {_path_repr(DOC_REPO_DIR)} ...") + subprocess.run(CMD_PULL, check=True) + + +def remove_tracked_files() -> None: + os.chdir(DOC_REPO_DIR) + print(f"Removing all tracked files from {_path_repr(DOC_REPO_DIR)} ...") + for fp in DOC_REPO_DIR.iterdir(): + if fp.name == UNTRACKED: + continue + if fp.is_file(): + fp.unlink() + else: + shutil.rmtree(fp) + + +def sync_from_html_build() -> None: + print(f"Syncing files from {_path_repr(DOC_HTML_DIR)} ...") + copy_ret = shutil.copytree(DOC_HTML_DIR, DOC_REPO_DIR, dirs_exist_ok=True) + print(f"Successful copy to: {_path_repr(copy_ret)}") + + +def generate_commit_message() -> str: + os.chdir(DOC_REPO_DIR) + print("Generating commit message ...") + r = subprocess.run(CMD_HEAD_HASH, capture_output=True, check=True) + return f"{COMMIT_MSG_PREFIX} {r.stdout.decode().strip()}" + + +def add_commit_push_github(msg: str, /) -> None: + os.chdir(DOC_REPO_DIR) + print("Pushing ...") + subprocess.run(CMD_ADD, check=True) + subprocess.run(f"{CMD_COMMIT} {msg}", check=True) + subprocess.run(CMD_PUSH, check=True) + + +def ensure_build_html() -> None: + if not (DOC_HTML_DIR.exists() and DOC_HTML_DIR.is_dir()): + raise FileNotFoundError(DOC_HTML_DIR) + if not DOC_BUILD_INFO.exists(): + raise FileNotFoundError(DOC_BUILD_INFO) + mtime = DOC_BUILD_INFO.stat().st_mtime + modified = dt.datetime.fromtimestamp(mtime, dt.timezone.utc).isoformat( + " ", "seconds" + ) + print(f"Docs last build time: {modified!r}") + + +def main(*, no_commit: bool = False) -> None: + """ + Make sure these have been run first. + + Commands: + + hatch run doc:clean-all + hatch run doc:build-html + """ + ensure_build_html() + commit_message = generate_commit_message() + clone_or_sync_repo() + remove_tracked_files() + sync_from_html_build() + if no_commit: + print(f"Unused commit message:\n {commit_message!r}") + else: + add_commit_push_github(commit_message) + + +if __name__ == "__main__": + parser = argparse.ArgumentParser(prog="sync_website.py") + parser.add_argument("--no-commit", action="store_true") + args = parser.parse_args() + main(no_commit=args.no_commit) diff --git a/doc/sync_website.sh b/doc/sync_website.sh deleted file mode 100644 index fcb611ef5..000000000 --- a/doc/sync_website.sh +++ /dev/null @@ -1,27 +0,0 @@ -#!/bin/bash - -# get git hash for commit message -GITHASH=$(git rev-parse HEAD) -MSG="doc build for commit $GITHASH" -cd _build - -# clone the repo if needed -if test -d altair-viz.github.io; -then echo "using existing cloned altair directory"; -else git clone https://github.com/altair-viz/altair-viz.github.io.git; -fi - -# sync the website -cd altair-viz.github.io -git pull - -# remove all tracked files -git ls-files -z | xargs -0 rm -f - -# sync files from html build -rsync -r ../html/ ./ - -# add commit, and push to github -git add . --all -git commit -m "$MSG" -git push origin master diff --git a/pyproject.toml b/pyproject.toml index 52fb11b0c..0f96b3b68 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -189,10 +189,11 @@ build-html-win = [ doctest = "sphinx-build -b doctest -d doc/_build/doctrees doc doc/_build/doctest" coverage = "sphinx-build -b coverage -d doc/_build/doctrees doc doc/_build/coverage" serve = "(cd doc/_build/html && python -m http.server)" +publish = "python doc/sync_website.py --no-commit" publish-clean-build = [ "clean-all", "build-html", - "(cd doc && bash sync_website.sh)", + "publish" ] [tool.ruff]