de en es ja ko ru zh

mcp-run-python

Official

by pydantic

Overview Schema Related Servers Score Discussions

Python

Hybrid

pydantic-ai
scripts

gather-review-context.sh•12.4 KiB

#!/usr/bin/env bash
# Gather PR context for auto-review into .github/.review-context/
#
# Usage: scripts/gather-review-context.sh <pr-number> [repo]
#
# Examples:
#   scripts/gather-review-context.sh 4269
#   scripts/gather-review-context.sh 4269 pydantic/pydantic-ai
#
# Arguments:
#   <pr-number>  Numeric pull request number (required).
#   [repo]       OWNER/NAME; defaults to the repository `gh` resolves for the
#                current directory.
#
# Requires: gh, jq, git, awk, and a grep that supports -P (PCRE).
#
# Outputs (all under .github/.review-context/):
#   pr-details.json      PR metadata as returned by `gh pr view --json`
#   pr-comments.txt      Issue-level PR comments
#   review-comments.txt  Inline review threads (older/resolved ones compacted)
#   related-issues.txt   Issues referenced by closing keywords in the PR body
#   diff/*.diff          Per-file diffs annotated with NL:/OL: line numbers
#   changed-files.txt    All changed files with +/- counts and diff paths
#   agents-md.txt        Directory-specific AGENTS.md files for changed dirs

set -euo pipefail

PR_NUMBER="${1:?Usage: $0 <pr-number> [repo]}"
# PR_NUMBER is interpolated into REST paths and a GraphQL query below, so
# reject anything that is not a plain integer before making any API call.
if ! [[ "$PR_NUMBER" =~ ^[0-9]+$ ]]; then
  echo "Error: <pr-number> must be a positive integer, got '${PR_NUMBER}'" >&2
  exit 2
fi
REPO="${2:-$(gh repo view --json nameWithOwner --jq .nameWithOwner)}"
CTX=".github/.review-context"

mkdir -p "$CTX"

echo "Gathering context for PR #${PR_NUMBER} in ${REPO}..."

# PR details (title, body, author, labels)
echo " - PR details"
gh pr view "$PR_NUMBER" --repo "$REPO" \
  --json title,body,author,headRefName,baseRefName,additions,deletions,changedFiles,labels,isDraft,reviewDecision,state,createdAt,updatedAt,url \
  > "$CTX/pr-details.json"

# PR comments
echo " - PR comments"
gh api "repos/${REPO}/issues/${PR_NUMBER}/comments" --paginate \
  --jq '.[] | "### \(.user.login) (\(.author_association)) at \(.created_at)\n\(.body)\n"' \
  > "$CTX/pr-comments.txt"
[[ -s "$CTX/pr-comments.txt" ]] || echo "(No PR comments)" > "$CTX/pr-comments.txt"

# Inline review comments (with diff hunks and resolved state via GraphQL)
# Fetch all review threads first, then determine last auto-review timestamp, then format
echo " - Review comments"
OWNER="${REPO%%/*}"
REPO_NAME="${REPO##*/}"
CURSOR=""
THREADS_JSON=$(mktemp)
# Remove the scratch files on every exit path, including failures under set -e.
trap 'rm -f -- "$THREADS_JSON" "${THREADS_JSON}.tmp"' EXIT
echo '[]' > "$THREADS_JSON"

while true; do
  CURSOR_ARG=""
  if [[ -n "$CURSOR" ]]; then
    CURSOR_ARG=", after: \"$CURSOR\""
  fi

  RESULT=$(gh api graphql -f query="
    query {
      repository(owner: \"$OWNER\", name: \"$REPO_NAME\") {
        pullRequest(number: $PR_NUMBER) {
          reviewThreads(first: 100$CURSOR_ARG) {
            pageInfo { hasNextPage endCursor }
            nodes {
              id
              isResolved
              isOutdated
              comments(first: 50) {
                nodes {
                  id
                  databaseId
                  author { login }
                  authorAssociation
                  body
                  diffHunk
                  path
                  line
                  createdAt
                  replyTo { id }
                }
              }
            }
          }
        }
      }
    }
  ")

  # Accumulate thread nodes into temp file
  jq -s '.[0] + [.[1].data.repository.pullRequest.reviewThreads.nodes[]]' \
    "$THREADS_JSON" <(printf '%s\n' "$RESULT") > "${THREADS_JSON}.tmp"
  mv "${THREADS_JSON}.tmp" "$THREADS_JSON"

  # endCursor is only emitted while hasNextPage is true; empty means done.
  CURSOR=$(printf '%s\n' "$RESULT" \
    | jq -r '.data.repository.pullRequest.reviewThreads.pageInfo | select(.hasNextPage) | .endCursor')
  if [[ -z "$CURSOR" ]]; then
    break
  fi
done

# Find timestamp of last auto-review from both issue comments and inline review comments
echo " - Checking for previous auto-review"
LAST_ISSUE_COMMENT_TS=$(gh api "repos/${REPO}/issues/${PR_NUMBER}/comments" --paginate \
  | jq -s -r '[.[][] | select(.user.login == "github-actions" or .user.login == "github-actions[bot]") | .created_at] | sort | last // empty')

LAST_REVIEW_COMMENT_TS=$(jq -r '
  [.[] | .comments.nodes[]
    | select(.author.login == "github-actions" or .author.login == "github-actions[bot]")
    | .createdAt
  ] | sort | last // empty
' "$THREADS_JSON")

# Take the later of the two timestamps (compared as strings, which is how the
# original script orders these ISO-style values as well).
if [[ -n "$LAST_ISSUE_COMMENT_TS" && -n "$LAST_REVIEW_COMMENT_TS" ]]; then
  if [[ "$LAST_ISSUE_COMMENT_TS" > "$LAST_REVIEW_COMMENT_TS" ]]; then
    LAST_REVIEW_TS="$LAST_ISSUE_COMMENT_TS"
  else
    LAST_REVIEW_TS="$LAST_REVIEW_COMMENT_TS"
  fi
else
  LAST_REVIEW_TS="${LAST_ISSUE_COMMENT_TS:-$LAST_REVIEW_COMMENT_TS}"
fi

if [[ -n "$LAST_REVIEW_TS" ]]; then
  echo " Last auto-review: $LAST_REVIEW_TS"
else
  echo " No previous auto-review found"
fi

# Format review threads with compaction
jq -r --arg last_review "$LAST_REVIEW_TS" '
  def truncate:
    gsub("[\\r\\n]+"; " ") | if length > 200 then .[:200] + "..." else . end;

  [ .[] | {
      resolved: .isResolved,
      outdated: .isOutdated,
      state: (
        (if .isResolved then "RESOLVED" else "UNRESOLVED" end) +
        (if .isOutdated then ", OUTDATED" else "" end)
      ),
      first: .comments.nodes[0],
      lastCommentAt: (.comments.nodes | last | .createdAt),
      replies: [ .comments.nodes[1:][] | {
        author: .author.login,
        databaseId: .databaseId,
        body: .body,
        createdAt: .createdAt
      } ]
    }
  ] as $arr |
  range($arr | length) as $i |
  $arr[$i] as $t |
  $t.first as $first |
  # Compact if: (resolved AND outdated) OR (all comments predate last auto-review)
  (
    ($t.resolved and $t.outdated) or
    ($last_review != "" and $t.lastCommentAt < $last_review)
  ) as $compact |
  if $compact then
    "- [\($t.state)] \($first.author.login) at \($first.createdAt) on \($first.path)\(if $first.line then ":\($first.line)" else "" end) (comment \($first.databaseId)) — \($first.body | truncate)" +
    ([ $t.replies[] | "\n > \(.author) at \(.createdAt) (comment \(.databaseId)): \(.body | truncate)" ] | join(""))
  else
    (
      # Show the diff hunk only when it differs from the previous thread
      ($first.path + ":" + ($first.diffHunk | split("\n")[0])) as $hunkKey |
      (if $i > 0 then ($arr[$i - 1].first.path + ":" + ($arr[$i - 1].first.diffHunk | split("\n")[0])) else "" end) as $prevKey |
      (if $hunkKey != $prevKey then true else false end) as $showHunk |
      "### [\($t.state)] \($first.author.login) (\($first.authorAssociation)) at \($first.createdAt) on \($first.path)\(if $first.line then ":\($first.line)" else "" end) (comment \($first.databaseId))" +
      (if $showHunk then "\n```diff\n\($first.diffHunk)\n```" else "" end) +
      "\n\($first.body)\n" +
      ([ $t.replies[] | " > **\(.author)** at \(.createdAt) (comment \(.databaseId)): \(.body)\n" ] | join(""))
    )
  end
' "$THREADS_JSON" > "$CTX/review-comments.txt"
[[ -s "$CTX/review-comments.txt" ]] || echo "(No review comments)" > "$CTX/review-comments.txt"

# Related issues: extract issue numbers from PR body
echo " - Related issues"
# The body was already saved in pr-details.json; reuse it instead of a second API call.
PR_BODY=$(jq -r '.body // ""' "$CTX/pr-details.json")
# GitHub closing keywords: close/closes/closed, fix/fixes/fixed,
# resolve/resolves/resolved, optionally followed by a colon. \b stops words
# such as "prefix" from matching as "fix".
CLOSING_KEYWORDS='\b(?:close[sd]?|fix(?:e[sd])?|resolve[sd]?):?'
{
  printf '%s\n' "$PR_BODY" \
    | grep -oiP "${CLOSING_KEYWORDS}\s*#\K\d+" || true
  # Only accept issue URLs that point at $REPO: the number is looked up in
  # $REPO below, so a URL into another repository would fetch the wrong issue.
  printf '%s\n' "$PR_BODY" \
    | grep -oiP "${CLOSING_KEYWORDS}\s+https://github\.com/\Q${REPO}\E/issues/\K\d+" || true
} | sort -u | while IFS= read -r ISSUE_NUM; do
  echo "=== Issue #${ISSUE_NUM} ==="
  # Best effort: one unreadable or deleted issue must not abort the whole run.
  gh issue view "$ISSUE_NUM" --repo "$REPO" --json title,body,author,comments \
    --jq '"## \(.title)\nBy: \(.author.login)\n\(.body)\n\n### Comments:\n\(.comments | map("#### \(.author.login) (\(.authorAssociation))\n\(.body)\n") | join("\n"))"' \
    || echo "(Could not fetch issue #${ISSUE_NUM})"
done > "$CTX/related-issues.txt"
[[ -s "$CTX/related-issues.txt" ]] || echo "(No issues referenced in PR description)" > "$CTX/related-issues.txt"

# Fetch base branch for function-context diffs
# Always fetch from the target repo URL, not origin — for fork PRs, origin points to
# the fork (which may have an outdated base branch), causing incorrect merge bases
# and diffs that include unrelated changes from the base repo.
echo " - Fetching base branch for function-context diffs"
BASE_REF=$(jq -r '.baseRefName' "$CTX/pr-details.json")
MERGE_BASE=""
if [[ -n "$BASE_REF" ]]; then
  # Failures are deliberately tolerated here: the API diff is the fallback.
  if git fetch "https://github.com/${REPO}.git" "$BASE_REF" --quiet 2>/dev/null; then
    MERGE_BASE=$(git merge-base HEAD FETCH_HEAD 2>/dev/null || echo "")
  fi
fi

if [[ -n "$MERGE_BASE" ]]; then
  echo " Merge base: ${MERGE_BASE:0:12} (using function-context diffs)"
else
  echo " Could not determine merge base (falling back to API diff)"
fi

# Per-file diffs with function context (excluding generated files)
echo " - Per-file diffs (excluding generated files)"
# Start from an empty directory: diffs left over from an earlier run would
# otherwise be annotated a second time and counted in the summary.
rm -rf -- "${CTX:?}/diff"
mkdir -p "$CTX/diff"
if [[ -n "$MERGE_BASE" ]]; then
  # -W (--function-context) shows the full function body around each change,
  # so the reviewer can see the function signature and surrounding logic without
  # needing to read the full source file separately.
  git diff -W --no-color "$MERGE_BASE" HEAD
else
  gh pr diff "$PR_NUMBER" --repo "$REPO"
fi | awk -v dir="$CTX/diff" '
  /^diff --git/ {
    # Close previous file to avoid running out of file descriptors
    if (outfile) close(outfile)
    outfile = ""
    # Extract new (b/) filename from "diff --git a/path b/path"
    # Uses b/ side so renamed files match the GitHub API .filename field
    fname = $0
    sub(/^.* b\//, "", fname)
    skip = (fname ~ /uv\.lock/ || fname ~ /\/cassettes\//)
    if (!skip) {
      # Sanitize path: replace / with __, strip leading dots to avoid hidden files
      safe = fname
      gsub(/\//, "__", safe)
      sub(/^\.+/, "", safe)
      outfile = dir "/" safe ".diff"
    }
  }
  !skip && outfile { print > outfile }
'

# Annotate commentable diff lines with source line numbers (NL:/OL: prefixes)
# so the review bot can target inline comments without computing line numbers.
echo " - Annotating diffs with source line numbers"
for diff_file in "$CTX/diff/"*.diff; do
  [[ -f "$diff_file" ]] || continue
  awk '
    BEGIN { NEAR = 3; old_left = 0; new_left = 0 }

    # True while the current hunk still expects body lines according to the
    # counts in its @@ header. Needed because a removed line whose text starts
    # with "--" (or an added line starting with "++") looks exactly like a
    # "---" / "+++" file header.
    function in_hunk() { return (old_left > 0 || new_left > 0) }

    # Diff metadata: flush any buffered hunk, pass through
    /^diff --git/ || /^index / || (!in_hunk() && (/^---/ || /^\+\+\+/)) ||
    /^new file/ || /^deleted file/ || /^old mode/ || /^new mode/ ||
    /^rename / || /^similarity / || /^dissimilarity / || /^Binary / {
      flush_hunk()
      old_left = 0; new_left = 0
      print
      next
    }

    # Hunk header: flush previous hunk, parse start lines and line counts.
    # A missing count ("@@ -5 +5 @@") means exactly one line.
    /^@@ / {
      flush_hunk()
      k = split($2, _o, ","); old_num = substr(_o[1], 2) + 0
      old_left = (k > 1) ? _o[2] + 0 : 1
      k = split($3, _n, ","); new_num = substr(_n[1], 2) + 0
      new_left = (k > 1) ? _n[2] + 0 : 1
      hunk_hdr = $0
      n = 0
      next
    }

    # "\ No newline at end of file"
    /^\\/ {
      n++; lines[n] = $0; types[n] = "\\"; is_chg[n] = 0
      next
    }

    # Hunk body lines
    {
      n++; lines[n] = $0
      c = substr($0, 1, 1)
      if (c == "+") {
        types[n] = "+"; lnums[n] = new_num++; is_chg[n] = 1
        new_left--
      } else if (c == "-") {
        types[n] = "-"; lnums[n] = old_num++; is_chg[n] = 1
        old_left--
      } else {
        types[n] = " "; lnums[n] = new_num++; old_num++; is_chg[n] = 0
        old_left--; new_left--
      }
    }

    # Print the buffered hunk. Changed lines always get an NL:/OL: prefix;
    # context lines get NL: only when within NEAR lines of a change.
    function flush_hunk(    i, dist, min_d) {
      if (n == 0) return

      # Forward pass: context-line distance from nearest preceding change
      dist = NEAR + 1
      for (i = 1; i <= n; i++) {
        if (is_chg[i]) dist = 0
        else if (types[i] != "\\") { dist++; fwd[i] = dist }
      }

      # Backward pass: context-line distance from nearest following change
      dist = NEAR + 1
      for (i = n; i >= 1; i--) {
        if (is_chg[i]) dist = 0
        else if (types[i] != "\\") { dist++; bwd[i] = dist }
      }

      print hunk_hdr
      for (i = 1; i <= n; i++) {
        if (types[i] == "\\") {
          print lines[i]
        } else if (is_chg[i]) {
          if (types[i] == "+") printf "NL:%d %s\n", lnums[i], lines[i]
          else printf "OL:%d %s\n", lnums[i], lines[i]
        } else {
          min_d = fwd[i]; if (bwd[i] < min_d) min_d = bwd[i]
          if (min_d <= NEAR) printf "NL:%d %s\n", lnums[i], lines[i]
          else print lines[i]
        }
      }

      delete lines; delete types; delete lnums
      delete is_chg; delete fwd; delete bwd
      n = 0
    }

    END { flush_hunk() }
  ' "$diff_file" > "${diff_file}.tmp" && mv "${diff_file}.tmp" "$diff_file"
done

# List of ALL changed files with change counts + diff file paths
echo " - Changed files"
# Same exclusions as the per-file diff splitter above.
GENERATED_RE='uv\.lock|/cassettes/'
gh api "repos/${REPO}/pulls/${PR_NUMBER}/files" --paginate \
  --jq '.[] | "\(.filename)\t+\(.additions) -\(.deletions)\t\(.filename | gsub("/"; "__") | gsub("^\\.+"; "")).diff"' \
  | while IFS=$'\t' read -r fname counts diffname; do
      if [[ "$fname" =~ $GENERATED_RE ]]; then
        # Generated file: no per-file diff was written, so list it without a path.
        printf '%s\t%s\n' "$fname" "$counts"
      else
        printf '%s\t%s\tdiff/%s\n' "$fname" "$counts" "$diffname"
      fi
    done > "$CTX/changed-files.txt"

# Gather directory-specific AGENTS.md files for changed directories
echo " - Directory AGENTS.md files"
: > "$CTX/agents-md.txt"
for agents_file in docs/AGENTS.md pydantic_ai_slim/pydantic_ai/models/AGENTS.md tests/AGENTS.md; do
  dir=$(dirname "$agents_file")
  if grep -q "^${dir}/" "$CTX/changed-files.txt" 2>/dev/null && [[ -f "$agents_file" ]]; then
    echo "=== ${agents_file} ==="
    cat "$agents_file"
    echo ""
  fi
done >> "$CTX/agents-md.txt"
[[ -s "$CTX/agents-md.txt" ]] || echo "(No directory-specific AGENTS.md files for changed directories)" > "$CTX/agents-md.txt"

echo ""
echo "Context gathered in ${CTX}/:"
ls -lh "$CTX/"
# tr strips the left padding that BSD wc adds to its count.
DIFF_COUNT=$(find "$CTX/diff" -name '*.diff' 2>/dev/null | wc -l | tr -d '[:space:]')
echo " Per-file diffs: ${DIFF_COUNT} files in ${CTX}/diff/"

Loading blob content...

Latest Blog Posts

Redis vs ioredis vs valkey-glide
By punkpeye on January 26, 2026.
benchmark
Redis
valkey
Quickstart: Publish an MCP Server to the MCP Registry
By punkpeye on January 24, 2026.
mcp
official reference mirror
Official MCP Registry Server.json Requirements
By punkpeye on January 24, 2026.
mcp
official reference mirror

MCP directory API

We provide all the information about MCP servers via our MCP API.

curl -X GET 'https://glama.ai/api/mcp/v1/servers/pydantic/pydantic-ai'

If you have feedback or need assistance with the MCP directory API, please join our Discord server

gather-review-context.sh•12.4 KiB