""" Generate rippled release notes from GitHub commit history. Usage (from repo root): python3 tools/generate-release-notes.py --from release-3.0 --to release-3.1 [--date 2026-03-24] [--output path/to/file.md] Arguments: --from (required) Base ref — must match exact tag or branch to compare from. --to (required) Target ref — must match exact tag or branch to compare to. --date (optional) Release date in YYYY-MM-DD format. Defaults to today. --output (optional) Output file path. Defaults to blog//rippled-.md. Requires: gh CLI (authenticated) """ import argparse import base64 import json import os import re import subprocess import sys from datetime import date, datetime # Emails to exclude from credits (Ripple employees not using @ripple.com). # Commits from @ripple.com addresses are already filtered automatically. EXCLUDED_EMAILS = { "3maisons@gmail.com", # Luc des Trois Maisons "a1q123456@users.noreply.github.com", # Jingchen Wu "bthomee@users.noreply.github.com", # Bart Thomee "21219765+ckeshava@users.noreply.github.com", # Chenna Keshava B S "gregtatcam@users.noreply.github.com", # Gregory Tsipenyuk "kuzzz99@gmail.com", # Sergey Kuznetsov "legleux@users.noreply.github.com", # Michael Legleux "mathbunnyru@users.noreply.github.com", # Ayaz Salikhov "mvadari@gmail.com", # Mayukha Vadari "115580134+oleks-rip@users.noreply.github.com", # Oleksandr Pidskopnyi "3397372+pratikmankawde@users.noreply.github.com", # Pratik Mankawde "35279399+shawnxie999@users.noreply.github.com", # Shawn Xie "5780819+Tapanito@users.noreply.github.com", # Vito Tumas "13349202+vlntb@users.noreply.github.com", # Valentin Balaschenko "129996061+vvysokikh1@users.noreply.github.com", # Vladislav Vysokikh "vvysokikh@gmail.com", # Vladislav Vysokikh } # Pre-compiled patterns for skipping version commits SKIP_PATTERNS = [ re.compile(r"^Set version to", re.IGNORECASE), re.compile(r"^Version \d", re.IGNORECASE), re.compile(r"bump version to", re.IGNORECASE), re.compile(r"^Merge tag ", re.IGNORECASE), ] # --- API helpers --- def run_gh_rest(endpoint): """Run a gh api REST command and return parsed JSON.""" result = subprocess.run( ["gh", "api", endpoint], capture_output=True, text=True, ) if result.returncode != 0: print(f"Error running gh api: {result.stderr}", file=sys.stderr) sys.exit(1) return json.loads(result.stdout) def run_gh_graphql(query): """Run a gh api graphql command and return parsed JSON. Handles partial failures (e.g., missing PRs) by returning whatever data is available alongside errors. """ result = subprocess.run( ["gh", "api", "graphql", "-f", f"query={query}"], capture_output=True, text=True, ) try: return json.loads(result.stdout) except (json.JSONDecodeError, TypeError): print(f"Error running graphql: {result.stderr}", file=sys.stderr) sys.exit(1) def fetch_commit_files(sha): """Fetch list of files changed in a commit via REST API. Returns empty list on failure instead of exiting. """ result = subprocess.run( ["gh", "api", f"repos/XRPLF/rippled/commits/{sha}"], capture_output=True, text=True, ) if result.returncode != 0: print(f" Warning: Could not fetch files for commit {sha[:7]}", file=sys.stderr) return [] data = json.loads(result.stdout) return [f["filename"] for f in data.get("files", [])] # --- Data fetching --- def fetch_version_info(ref): """Fetch version string and version-setting commit info in a single GraphQL call. Returns (version_string, formatted_commit_block). """ data = run_gh_graphql(f""" {{ repository(owner: "XRPLF", name: "rippled") {{ file: object(expression: "{ref}:src/libxrpl/protocol/BuildInfo.cpp") {{ ... on Blob {{ text }} }} ref: object(expression: "{ref}") {{ ... on Commit {{ history(first: 1, path: "src/libxrpl/protocol/BuildInfo.cpp") {{ nodes {{ oid message author {{ name email date }} }} }} }} }} }} }} """) repo = data.get("data", {}).get("repository", {}) # Extract version string from BuildInfo.cpp file_text = (repo.get("file") or {}).get("text", "") match = re.search(r'versionString\s*=\s*"([^"]+)"', file_text) if not match: print("Warning: Could not find versionString in BuildInfo.cpp. Using placeholder.", file=sys.stderr) version = match.group(1) if match else "TODO" # Extract version commit info nodes = (repo.get("ref") or {}).get("history", {}).get("nodes", []) if not nodes: commit_block = "commit TODO\nAuthor: TODO\nDate: TODO\n\n Set version to TODO" else: commit = nodes[0] raw_date = commit["author"]["date"] try: dt = datetime.fromisoformat(raw_date) formatted_date = dt.strftime("%a %b %-d %H:%M:%S %Y %z") except ValueError: formatted_date = raw_date name = commit["author"]["name"] email = commit["author"]["email"] sha = commit["oid"] message = commit["message"].split("\n")[0] commit_block = f"commit {sha}\nAuthor: {name} <{email}>\nDate: {formatted_date}\n\n {message}" return version, commit_block def fetch_commits(from_ref, to_ref): """Fetch all commits between two refs using the GitHub compare API.""" commits = [] page = 1 while True: data = run_gh_rest( f"repos/XRPLF/rippled/compare/{from_ref}...{to_ref}?per_page=250&page={page}" ) batch = data.get("commits", []) commits.extend(batch) if len(batch) < 250: break page += 1 return commits def parse_features_macro(text): """Parse features.macro into {amendment_name: status_string} dict.""" results = {} for match in re.finditer( r'XRPL_(FEATURE|FIX)\s*$\s*(\w+)\s*,\s*Supported::(\w+)\s*,\s*VoteBehavior::(\w+)', text): macro_type, name, supported, vote = match.groups() key = f"fix{name}" if macro_type == "FIX" else name results[key] = f"{supported}, {vote}" for match in re.finditer(r'XRPL_RETIRE(?:_(FEATURE|FIX))?\s*\(\s*(\w+)\s*$', text): macro_type, name = match.groups() key = f"fix{name}" if macro_type == "FIX" else name results[key] = "retired" return results def fetch_amendment_diff(from_ref, to_ref): """Compare features.macro between two refs to find amendment changes. Returns (changes, unchanged) where: - changes: {name: True/False} for amendments that changed status - unchanged: {name: True/False} for amendments with no status change True = include; False = exclude """ macro_path = "repos/XRPLF/rippled/contents/include/xrpl/protocol/detail/features.macro" from_data = run_gh_rest(f"{macro_path}?ref={from_ref}") from_text = base64.b64decode(from_data["content"]).decode() from_amendments = parse_features_macro(from_text) to_data = run_gh_rest(f"{macro_path}?ref={to_ref}") to_text = base64.b64decode(to_data["content"]).decode() to_amendments = parse_features_macro(to_text) changes = {} for name, to_status in to_amendments.items(): if name not in from_amendments: # New amendment — include only if Supported::yes changes[name] = to_status.startswith("yes") elif from_amendments[name] != to_status: # Include if either old or new status involves yes (voting-ready) from_status = from_amendments[name] changes[name] = from_status.startswith("yes") or to_status.startswith("yes") # Removed amendments — include only if they were Supported::yes for name in from_amendments: if name not in to_amendments: changes[name] = from_amendments[name].startswith("yes") # Unchanged amendments to also exclude (unreleased work) unchanged = sorted( name for name, to_status in to_amendments.items() if name not in changes and to_status != "retired" and not to_status.startswith("yes") ) return changes, unchanged def fetch_prs_graphql(pr_numbers): """Fetch PR details in batches using GitHub GraphQL API. Falls back to issue lookup for numbers that aren't PRs. Returns a dict of {number: {title, body, labels, files, type}}. """ results = {} missing = [] batch_size = 50 pr_list = list(pr_numbers) # Fetch PRs for i in range(0, len(pr_list), batch_size): batch = pr_list[i:i + batch_size] fragments = [] for pr_num in batch: fragments.append(f""" pr{pr_num}: pullRequest(number: {pr_num}) {{ title body labels(first: 10) {{ nodes {{ name }} }} files(first: 100) {{ nodes {{ path }} }} }} """) query = f""" {{ repository(owner: "XRPLF", name: "rippled") {{ {"".join(fragments)} }} }} """ data = run_gh_graphql(query) repo_data = data.get("data", {}).get("repository", {}) for alias, pr_data in repo_data.items(): pr_num = int(alias.removeprefix("pr")) if pr_data: results[pr_num] = { "title": pr_data["title"], "body": clean_pr_body(pr_data.get("body") or ""), "labels": [l["name"] for l in pr_data.get("labels", {}).get("nodes", [])], "files": [f["path"] for f in pr_data.get("files", {}).get("nodes", [])], "type": "pull", } else: missing.append(pr_num) print(f" Fetched {min(i + batch_size, len(pr_list))}/{len(pr_list)} PRs...") # Fetch missing numbers as issues if missing: print(f" Looking up {len(missing)} missing PR numbers as Issues...") for i in range(0, len(missing), batch_size): batch = missing[i:i + batch_size] fragments = [] for num in batch: fragments.append(f""" issue{num}: issue(number: {num}) {{ title body labels(first: 10) {{ nodes {{ name }} }} }} """) query = f""" {{ repository(owner: "XRPLF", name: "rippled") {{ {"".join(fragments)} }} }} """ data = run_gh_graphql(query) repo_data = data.get("data", {}).get("repository", {}) for alias, issue_data in repo_data.items(): if issue_data: num = int(alias.removeprefix("issue")) results[num] = { "title": issue_data["title"], "body": clean_pr_body(issue_data.get("body") or ""), "labels": [l["name"] for l in issue_data.get("labels", {}).get("nodes", [])], "type": "issues", } return results # --- Utilities --- def clean_pr_body(text): """Strip HTML comments and PR template boilerplate from body text.""" # Remove HTML comments text = re.sub(r"", "", text, flags=re.DOTALL) # Remove unchecked checkbox lines, keep checked ones text = re.sub(r"^- \[ \] .+$", "", text, flags=re.MULTILINE) # Remove all markdown headings text = re.sub(r"^#{1,6} .+$", "", text, flags=re.MULTILINE) # Convert bare GitHub URLs to markdown links text = re.sub(r"(?") parts.append("\n".join(comment_lines) + "\n") for entry in amendment_entries: parts.append(entry) # Remaining empty subsection headings for manual/AI sorting sections = [ "Features", "Breaking Changes", "Bug Fixes", "Refactors", "Documentation", "Testing", "CI/Build", ] for section in sections: parts.append(f"\n### {section}\n") # Credits parts.append("\n\n## Credits\n") if authors: parts.append("The following RippleX teams and GitHub users contributed to this release:\n") else: parts.append("The following RippleX teams contributed to this release:\n") parts.append("- RippleX Engineering") parts.append("- RippleX Docs") parts.append("- RippleX Product") for author in sorted(authors): parts.append(f"- {author}") parts.append(""" ## Bug Bounties and Responsible Disclosures We welcome reviews of the `rippled` code and urge researchers to responsibly disclose any issues they may find. For more information, see: - [Ripple's Bug Bounty Program](https://ripple.com/legal/bug-bounty/) - [`rippled` Security Policy](https://github.com/XRPLF/rippled/blob/develop/SECURITY.md) """) # Unsorted entries with full context (after all published sections) parts.append("\n") for entry in entries: parts.append(entry) return "\n".join(parts) # --- Main --- def main(): parser = argparse.ArgumentParser(description="Generate rippled release notes") parser.add_argument("--from", dest="from_ref", required=True, help="Base ref (tag or branch)") parser.add_argument("--to", dest="to_ref", required=True, help="Target ref (tag or branch)") parser.add_argument("--date", help="Release date (YYYY-MM-DD). Defaults to today.") parser.add_argument("--output", help="Output file path (default: blog//rippled-.md)") args = parser.parse_args() args.date = args.date or date.today().isoformat() try: date.fromisoformat(args.date) except ValueError: print(f"Error: Invalid date format '{args.date}'. Use YYYY-MM-DD.", file=sys.stderr) sys.exit(1) print(f"Fetching version info from {args.to_ref}...") version, version_commit = fetch_version_info(args.to_ref) print(f"Version: {version}") year = args.date.split("-")[0] output_path = args.output or f"blog/{year}/rippled-{version}.md" print(f"Fetching commits: {args.from_ref}...{args.to_ref}") commits = fetch_commits(args.from_ref, args.to_ref) print(f"Found {len(commits)} commits") # Extract unique PR (in rare cases Issues) numbers and track authors pr_numbers = {} pr_shas = {} # PR/issue number → commit SHA (for file lookups on Issues) pr_bodies = {} # PR/issue number → commit body (for fallback descriptions) orphan_commits = [] # Commits with no PR/Issues link authors = set() for commit in commits: full_message = commit["commit"]["message"] message = full_message.split("\n")[0] body = "\n".join(full_message.split("\n")[1:]).strip() sha = commit["sha"] author = commit["commit"]["author"]["name"] email = commit["commit"]["author"].get("email", "") # Skip Ripple employees from credits login = (commit.get("author") or {}).get("login") if not email.lower().endswith("@ripple.com") and email not in EXCLUDED_EMAILS: if login: authors.add(f"@{login}") else: authors.add(author) if should_skip(message): continue pr_number = extract_pr_number(message) if pr_number: pr_numbers[pr_number] = message pr_shas[pr_number] = sha pr_bodies[pr_number] = body else: orphan_commits.append({"sha": sha, "message": message, "body": body}) print(f"Unique PRs after filtering: {len(pr_numbers)}") if orphan_commits: print(f"Commits without PR or Issue linked: {len(orphan_commits)}") # Fetch amendment diff between refs print(f"Comparing features.macro between {args.from_ref} and {args.to_ref}...") amendment_diff, amendment_unchanged = fetch_amendment_diff(args.from_ref, args.to_ref) if amendment_diff: for name, include in sorted(amendment_diff.items()): status = "include" if include else "exclude" print(f" Amendment {name}: {status}") else: print(" No amendment changes detected") print(f"Building changelog entries...") # Fetch all PR details in batches via GraphQL pr_details = fetch_prs_graphql(list(pr_numbers.keys())) # Build entries, sorting amendments automatically amendment_entries = [] entries = [] for pr_number, commit_msg in pr_numbers.items(): pr_data = pr_details.get(pr_number) if pr_data: title = pr_data["title"] body = pr_data.get("body", "") labels = pr_data.get("labels", []) files = pr_data.get("files", []) link_type = pr_data.get("type", "pull") # For issues (no files from GraphQL), fetch files from the commit if not files and pr_number in pr_shas: print(f" Building entry for Issue #{pr_number} via commit...") files = fetch_commit_files(pr_shas[pr_number]) if is_amendment(files) and amendment_diff: # Amendment entry — add to amendments section (AI will sort further) entry = format_uncategorized_entry(pr_number, title, labels, body, link_type=link_type) amendment_entries.append(entry) else: entry = format_uncategorized_entry(pr_number, title, labels, body, files, link_type) entries.append(entry) else: # Fallback to commit lookup for invalid PR and Issues link sha = pr_shas[pr_number] print(f" #{pr_number} not found as PR or Issue, building from commit {sha[:7]}...") files = fetch_commit_files(sha) if is_amendment(files) and amendment_diff: entry = format_commit_entry(sha, commit_msg, pr_bodies[pr_number]) amendment_entries.append(entry) else: entry = format_commit_entry(sha, commit_msg, pr_bodies[pr_number], files) entries.append(entry) # Build entries for orphan commits (no PR/Issue linked) for orphan in orphan_commits: sha = orphan["sha"] print(f" Building commit-only entry for {sha[:7]}...") files = fetch_commit_files(sha) if is_amendment(files) and amendment_diff: entry = format_commit_entry(sha, orphan["message"], orphan["body"]) amendment_entries.append(entry) else: entry = format_commit_entry(sha, orphan["message"], orphan["body"], files) entries.append(entry) # Generate markdown markdown = generate_markdown(version, args.date, amendment_diff, amendment_unchanged, amendment_entries, entries, authors, version_commit) # Write output os.makedirs(os.path.dirname(output_path), exist_ok=True) with open(output_path, "w") as f: f.write(markdown) print(f"\nRelease notes written to: {output_path}") # Update blog/sidebars.yaml sidebars_path = "blog/sidebars.yaml" # Derive sidebar path and year from actual output path relative_path = output_path.removeprefix("blog/") sidebar_year = relative_path.split("/")[0] new_entry = f" - page: {relative_path}" try: with open(sidebars_path, "r") as f: sidebar_content = f.read() if relative_path in sidebar_content: print(f"{sidebars_path} already contains {relative_path}") else: # Find the year group and insert at the top of its items year_marker = f" - group: '{sidebar_year}'" if year_marker not in sidebar_content: # Year group doesn't exist — find the right chronological position new_group = f" - group: '{sidebar_year}'\n expanded: false\n items:\n{new_entry}\n" # Find all existing year groups and insert before the first one with a smaller year year_groups = list(re.finditer(r" - group: '(\d{4})'", sidebar_content)) insert_pos = None for match in year_groups: existing_year = match.group(1) if int(sidebar_year) > int(existing_year): insert_pos = match.start() break if insert_pos is not None: sidebar_content = sidebar_content[:insert_pos] + new_group + sidebar_content[insert_pos:] else: # New year is older than all existing — append at the end sidebar_content = sidebar_content.rstrip() + "\n" + new_group else: # Insert after the year group's "items:" line year_idx = sidebar_content.index(year_marker) items_idx = sidebar_content.index(" items:", year_idx) insert_pos = items_idx + len(" items:\n") sidebar_content = sidebar_content[:insert_pos] + new_entry + "\n" + sidebar_content[insert_pos:] with open(sidebars_path, "w") as f: f.write(sidebar_content) print(f"Added {relative_path} to {sidebars_path}") except FileNotFoundError: print(f"Warning: {sidebars_path} not found, skipping sidebar update", file=sys.stderr) if __name__ == "__main__": main()