Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
34 commits
Select commit Hold shift + click to select a range
d128c07
ci: add breaking change detector
rluvaton Apr 9, 2026
968fc57
ci: run manually for now
rluvaton Apr 9, 2026
3500fee
add to existing ci job so i can test the workflow
rluvaton Apr 9, 2026
b0f7cdf
add permission
rluvaton Apr 9, 2026
dcb3cfc
try running
rluvaton Apr 9, 2026
8ec278a
fetch main
rluvaton Apr 9, 2026
e15d6a7
run on all branches
rluvaton Apr 9, 2026
129e180
run on changed crates
rluvaton Apr 9, 2026
0a863bd
only if changed
rluvaton Apr 9, 2026
b3b6dde
compare against last commit
rluvaton Apr 9, 2026
95189de
test: add temporary public function for semver breaking change testing
rluvaton Apr 9, 2026
97ee5b5
test: remove public function to trigger semver breaking change
rluvaton Apr 9, 2026
d5b1985
fix
rluvaton Apr 9, 2026
910501c
test: re-add temporary public function for semver testing
rluvaton Apr 9, 2026
f40c07a
test: remove public function to trigger semver breaking change
rluvaton Apr 9, 2026
65779f4
fix
rluvaton Apr 9, 2026
6de3a14
test: re-add temporary public function for semver testing
rluvaton Apr 9, 2026
1bd00c2
test: remove public function to trigger semver breaking change
rluvaton Apr 9, 2026
b3bf244
revert
rluvaton Apr 9, 2026
5286bab
Merge branch 'main' into automate-semver-breaking-api
rluvaton Apr 9, 2026
10847a0
add coments
rluvaton Apr 9, 2026
6d27da4
Merge remote-tracking branch 'origin/automate-semver-breaking-api' in…
rluvaton Apr 9, 2026
a903cae
add license
rluvaton Apr 9, 2026
83a2f39
Merge branch 'main' into automate-semver-breaking-api
rluvaton Apr 9, 2026
8d99fba
use script instead
rluvaton Apr 9, 2026
2d4a25a
update to use cargo metadata and fix cr
rluvaton Apr 27, 2026
2202336
make sure the output is live and move the responsibility of removing
rluvaton Apr 27, 2026
7f9d802
fix change detector
rluvaton Apr 27, 2026
e943add
add comments
rluvaton Apr 27, 2026
2b5e8d4
Merge branch 'main' into automate-semver-breaking-api
rluvaton Apr 27, 2026
e9654b2
Merge branch 'main' into automate-semver-breaking-api
mbutrovich Apr 27, 2026
31dade4
Merge branch 'main' into automate-semver-breaking-api
rluvaton Apr 28, 2026
1077e92
address review feedback
rluvaton Apr 28, 2026
fbb2566
Merge branch 'main' into automate-semver-breaking-api
rluvaton Apr 28, 2026
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
126 changes: 126 additions & 0 deletions .github/workflows/breaking_changes_detector.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,126 @@
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied. See the License for the
# specific language governing permissions and limitations
# under the License.

# Detect semver-incompatible (breaking) API changes in crates modified by a PR.
#
# Only public workspace crates that have file changes are checked.
# Internal crates (benchmarks, test-utils, sqllogictest, doc) are excluded.
#
# If breaking changes are found, a sticky comment is posted on the PR.
# The comment is removed automatically once the issues are resolved.

name: "Detect breaking changes"

# Runs on every pull request that targets `main`.
on:
  pull_request:
    branches:
      - main

# Least privilege by default; the commenting job widens this for itself only.
permissions:
  contents: read

jobs:
  # Runs cargo-semver-checks on the crates touched by the PR and exposes the
  # outcome (`result`) and the captured log (`logs`) as job outputs.
  check-semver:
    name: Check semver
    runs-on: ubuntu-latest
    outputs:
      logs: ${{ steps.check_semver.outputs.logs }}
      # Default to "success" so the comment job clears any stale comment
      # when the check step is skipped (e.g. no published crates changed).
      result: ${{ steps.check_semver.outputs.result || 'success' }}
    steps:
      - name: Checkout
        uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd # v6.0.2
        with:
          fetch-depth: 0

      # For fork PRs, `origin` points to the fork, not the upstream repo.
      # Explicitly fetch the base branch from the upstream repo so we have
      # a valid baseline ref for both diff and semver-checks.
      - name: Fetch base branch
        env:
          BASE_REF: ${{ github.base_ref }}
          REPO: ${{ github.repository }}
        run: git fetch "https://github.com/${REPO}.git" "${BASE_REF}:refs/remotes/origin/${BASE_REF}"

      - name: Determine changed crates
        id: changed_crates
        env:
          BASE_REF: ${{ github.base_ref }}
        run: |
          PACKAGES=$(ci/scripts/changed_crates.sh changed-crates "origin/${BASE_REF}")
          echo "packages=$PACKAGES" >> "$GITHUB_OUTPUT"
          echo "Changed crates: $PACKAGES"

      - name: Install cargo-semver-checks
        if: steps.changed_crates.outputs.packages != ''
        uses: taiki-e/install-action@94cb46f8d6e437890146ffbd78a778b78e623fb2 # v2.74.0
        with:
          tool: cargo-semver-checks

      - name: Run cargo-semver-checks
        id: check_semver
        if: steps.changed_crates.outputs.packages != ''
        env:
          BASE_REF: ${{ github.base_ref }}
          PACKAGES: ${{ steps.changed_crates.outputs.packages }}
        run: |
          set +e
          # PACKAGES is a space-separated list of crate names. Split it into
          # an array so each name is passed as its own argument without
          # exposing it to glob expansion.
          read -ra packages <<<"$PACKAGES"
          # Unpredictable temp file instead of a fixed path under /tmp.
          output_file=$(mktemp "${RUNNER_TEMP:-/tmp}/semver-output.XXXXXX")
          # `tee` lets cargo's output stream live into the Actions log
          # while we also keep a copy for the PR comment.
          ci/scripts/changed_crates.sh semver-check "origin/${BASE_REF}" "${packages[@]}" \
            2>&1 | tee "$output_file"
          EXIT_CODE=${PIPESTATUS[0]}
          # The log content is influenced by the PR under test, so use a
          # random delimiter: with a fixed one, a log line equal to the
          # delimiter would end the value early and let the remaining lines
          # be parsed as additional step outputs.
          delimiter="SEMVER_LOGS_$(od -An -N16 -tx1 /dev/urandom | tr -d ' \n')"
          {
            echo "logs<<${delimiter}"
            # Strip ANSI colour escape sequences so the PR comment is readable.
            sed 's/\x1b\[[0-9;]*m//g' "$output_file"
            echo "${delimiter}"
          } >> "$GITHUB_OUTPUT"
          # Pass the result through an output instead of failing the job:
          # a detected breaking change should surface as a PR comment, not a
          # red check, so PR authors aren't confused by an intentional break.
          if [ "$EXIT_CODE" -eq 0 ]; then
            echo "result=success" >> "$GITHUB_OUTPUT"
          else
            echo "result=failure" >> "$GITHUB_OUTPUT"
          fi

  # Post or remove a sticky comment on the PR based on the semver check result.
  comment-on-pr:
    name: Comment on pull request
    runs-on: ubuntu-latest
    needs: check-semver
    if: always()
    permissions:
      contents: read
      pull-requests: write
    steps:
      # Only the helper script is needed here, so check out just its directory.
      - name: Checkout
        uses: actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd # v6.0.2
        with:
          sparse-checkout: ci/scripts

      # Values are passed through `env` rather than interpolated into the
      # script text, so log content is never parsed as shell code.
      - name: Update PR comment
        env:
          GH_TOKEN: ${{ github.token }}
          REPO: ${{ github.repository }}
          PR_NUMBER: ${{ github.event.pull_request.number }}
          CHECK_RESULT: ${{ needs.check-semver.outputs.result }}
          SEMVER_LOGS: ${{ needs.check-semver.outputs.logs }}
        run: |
          ci/scripts/changed_crates.sh comment \
            "$REPO" "$PR_NUMBER" "$CHECK_RESULT" "$SEMVER_LOGS"
141 changes: 141 additions & 0 deletions ci/scripts/changed_crates.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1,141 @@
#!/usr/bin/env bash
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied. See the License for the
# specific language governing permissions and limitations
# under the License.

# Helper script for the breaking-changes-detector workflow.
#
# Subcommands:
# changed-crates <base_ref>
# Print space-separated list of crate names whose files changed vs base_ref.
# Only published workspace members (those without `publish = false`) are
# considered.
#
# semver-check <base_ref> <packages...>
# Run cargo-semver-checks for the given packages against base_ref.
# Output and exit code are passed through unchanged; the caller is
# responsible for capturing/formatting them.
#
# comment <repo> <pr_number> <check_result> [logs]
# Upsert or delete a sticky PR comment based on check_result.
# check_result: "success" deletes any existing comment,
# anything else upserts the comment with the provided logs.
# Requires GH_TOKEN to be set.

# Strict mode: abort on any failing command (-e), on use of an unset
# variable (-u), and when any stage of a pipeline fails (pipefail).
set -euo pipefail

# HTML comment embedded at the top of the PR comment body. The `comment`
# subcommand searches existing PR comments for this string to find the one
# it previously posted, so it can update or delete it instead of adding more.
MARKER="<!-- semver-check-comment -->"

# ── changed-crates ──────────────────────────────────────────────────
#######################################
# Print the publishable workspace crates that contain a file changed
# between <base_ref> and HEAD.
# Arguments: $1 - base ref to diff against (e.g. origin/main)
# Outputs:   one line on stdout with the matching crate names separated by
#            single spaces (an empty line when nothing matched)
# Returns:   non-zero if git, cargo or jq fails (under `set -e`)
#######################################
cmd_changed_crates() {
  local base_ref="${1:?Usage: changed_crates.sh changed-crates <base_ref>}"

  # 1. Files changed between the PR and the base branch. The three-dot form
  #    diffs against the merge base, so unrelated commits that landed on the
  #    base branch after the PR forked are not counted.
  local changed_files
  changed_files=$(git diff --name-only "${base_ref}...HEAD")

  # 2. Every publishable workspace member, one per line as
  #    "<crate-name> <crate-dir-prefix>". `publish = false` in Cargo.toml
  #    shows up as `"publish": []` in cargo metadata, so filtering on that
  #    excludes internal crates without a manual exclusion list.
  #    Stripping only the trailing "Cargo.toml" leaves a prefix that ends in
  #    "/" (e.g. "crates/foo/"), or an empty prefix for a package that lives
  #    at the workspace root.
  local crates
  crates=$(cargo metadata --no-deps --format-version 1 | jq -r '
    (.workspace_root + "/") as $root
    | .packages[]
    | select(.publish != [])
    | "\(.name) \(.manifest_path | ltrimstr($root) | rtrimstr("Cargo.toml"))"
  ')

  # 3. Keep crates whose directory contains a changed file. The comparison
  #    is a literal prefix match (the quoted left part of the pattern is not
  #    globbed), so characters such as "." in a directory name cannot match
  #    unrelated paths the way an interpolated regex would.
  local name prefix file matched=""
  while read -r name prefix; do
    [[ -n "$name" ]] || continue
    while IFS= read -r file; do
      # Skip the empty line a here-string yields when nothing changed;
      # otherwise an empty (root) prefix would match it.
      [[ -n "$file" ]] || continue
      if [[ "$file" == "$prefix"* ]]; then
        matched+="${matched:+ }${name}"
        break
      fi
    done <<<"$changed_files"
  done <<<"$crates"

  echo "$matched"
}

# ── semver-check ────────────────────────────────────────────────────
#######################################
# Run cargo-semver-checks for the given packages against a baseline revision.
# Arguments: $1  - git revision used as the baseline (e.g. origin/main)
#            $2+ - package names; each is passed as `--package <name>`.
#                  With no names, no `--package` flag is passed at all.
# Outputs:   whatever cargo-semver-checks prints, unchanged
# Returns:   the exit status of cargo-semver-checks
#######################################
cmd_semver_check() {
  local base_ref="${1:?Usage: changed_crates.sh semver-check <base_ref> <packages...>}"
  shift

  # `pkg` is declared local so the loop variable does not leak into the
  # caller's scope.
  local pkg
  local args=()
  for pkg in "$@"; do
    args+=(--package "$pkg")
  done

  # The `${args[@]+...}` form expands to nothing for an empty array instead
  # of tripping `set -u` on bash versions older than 4.4.
  cargo semver-checks --baseline-rev "$base_ref" ${args[@]+"${args[@]}"}
}

# ── comment ─────────────────────────────────────────────────────────
#######################################
# Upsert or delete the sticky semver comment on a pull request.
# Globals:   MARKER (read) - hidden marker identifying our comment
#            GH_TOKEN      - must be set for `gh` to authenticate
# Arguments: $1 - repository as "owner/name"
#            $2 - pull request number
#            $3 - check result; "success" deletes the comment, any other
#                 value creates or updates it
#            $4 - (optional) log text to embed in the comment
# Outputs:   progress messages on stdout
# Returns:   non-zero if a `gh api` call fails (under `set -e`)
#######################################
cmd_comment() {
  local repo="${1:?Usage: changed_crates.sh comment <repo> <pr_number> <check_result> [logs]}"
  local pr_number="${2:?}"
  local check_result="${3:?}"
  local logs="${4:-}"

  # Find existing comment with our marker. `--paginate` walks every page of
  # results; without it only the first page is searched, so on a busy PR the
  # sticky comment would be missed and a duplicate posted on every run.
  local comment_ids comment_id
  comment_ids=$(gh api --paginate "repos/${repo}/issues/${pr_number}/comments" \
    --jq ".[] | select(.body | contains(\"${MARKER}\")) | .id")
  # Keep the first id only. Done with parameter expansion rather than
  # `| head -1` so the pipeline cannot fail with SIGPIPE under `pipefail`.
  comment_id="${comment_ids%%$'\n'*}"

  echo "existing breaking change comment id $comment_id"

  if [ "$check_result" = "success" ]; then
    # Delete the comment if one exists
    if [ -n "$comment_id" ]; then
      echo "result is success, so deleting breaking change comment"
      gh api "repos/${repo}/issues/comments/${comment_id}" --method DELETE
    else
      echo "result is success and no previous comment to delete"
    fi
  else
    # GitHub rejects comment bodies longer than 65536 characters. Keep the
    # tail of the log (where the semver report ends up) and leave headroom
    # for the surrounding text.
    local -r max_log_chars=60000
    if (( ${#logs} > max_log_chars )); then
      logs="[... output truncated; see the workflow run for the full log ...]
${logs: -max_log_chars}"
    fi

    local body="${MARKER}
Thank you for opening this pull request!

Reviewer note: [cargo-semver-checks](https://github.com/obi1kenobi/cargo-semver-checks) reported the current version number is not SemVer-compatible with the changes in this pull request (compared against the base branch).

<details>
<summary>Details</summary>

\`\`\`
${logs}
\`\`\`

</details>"

    # `--raw-field` always sends the value as a plain string; `--field`
    # would apply type conversion and `@file` expansion to it.
    if [ -n "$comment_id" ]; then
      echo "comment already exists, updating content"
      gh api "repos/${repo}/issues/comments/${comment_id}" \
        --method PATCH --raw-field body="$body"
    else
      echo "no comment with breaking changes, creating a new one"
      gh api "repos/${repo}/issues/${pr_number}/comments" \
        --method POST --raw-field body="$body"
    fi
  fi
}

# ── main ────────────────────────────────────────────────────────────
# Entry point: the first argument names the subcommand, and everything after
# it is handed to that subcommand's handler untouched.
cmd="${1:?Usage: changed_crates.sh <changed-crates|semver-check|comment> [args...]}"
shift

case "$cmd" in
  changed-crates)
    cmd_changed_crates "$@"
    ;;
  semver-check)
    cmd_semver_check "$@"
    ;;
  comment)
    cmd_comment "$@"
    ;;
  *)
    # Anything else is a usage error: report on stderr and fail.
    echo "Unknown command: $cmd" >&2
    exit 1
    ;;
esac
Loading