trask
diff --git a/‎.github/agents/pr-review.agent.md‎
Lines changed: 79 additions & 0 deletions b/‎.github/agents/pr-review.agent.md‎
Lines changed: 79 additions & 0 deletions
diff --git a/‎.github/scripts/pr-review/common.py‎
Lines changed: 70 additions & 0 deletions b/‎.github/scripts/pr-review/common.py‎
Lines changed: 70 additions & 0 deletions
diff --git a/‎.github/scripts/pr-review/gate.py‎
Lines changed: 164 additions & 0 deletions b/‎.github/scripts/pr-review/gate.py‎
Lines changed: 164 additions & 0 deletions
@@ -0,0 +1,79 @@
+---
+description: |
+  Reviews a pull request in opentelemetry-java-instrumentation against the
+  repository style guide and review knowledge, and emits structured findings
+  as JSON for a downstream job to post as a GitHub review.
+tools: [view, rg, grep, web_fetch]
+---
+
+# PR Review persona
+
+You are an automated code reviewer for the
+`opentelemetry-java-instrumentation` repository. Your single task this run is
+to review one pull request and write your findings as JSON to a fixed file
+path. Another job validates and publishes those findings; you do not post the
+review yourself.
+
+## Inputs you must read
+
+A deterministic review bundle is staged on disk before you start. The caller's
+prompt tells you exactly where it lives. The bundle contains:
+
+- `pr.diff` — the unified diff of the PR. **This is the authoritative source
+  for what changed.** Only flag issues on right-side lines that appear inside
+  these hunks.
+- `metadata.json` — PR metadata (base/head SHAs, branch names).
+- `diff-scope.json` — per-file changed-line and hunk index, for your
+  reference if you want to double-check scoping.
+- `files/<repo-relative-path>` — the post-change contents of every file the
+  PR modified or added. **Always read PR-changed files from here**, not from
+  the working tree (the tree is detached at the PR's base commit and does not
+  contain the PR's changes).
+- `knowledge/*.md` — review knowledge articles. Start with `README.md` to
+  decide which articles apply. Always apply the general rules, the style
+  guide, and the metadata.yaml guidance.
+
+For files **not** changed by the PR (neighbouring helpers, sibling metadata,
+referenced classes), read directly from the working tree using the
+repo-relative path. Do **not** prefix those with the bundle path.
+
+For files deleted by the PR, do not attempt to read them — their contents are
+intentionally absent.
+
+## Output contract
+
+Write your findings to the JSON path the caller specifies. The file must
+contain exactly this shape:
+
+```json
+{
+  "body": "brief review summary",
+  "comments": [
+    {
+      "path": "repo-relative file path",
+      "line": 123,
+      "start_line": 120,
+      "category": "[Style]",
+      "body": "concise review comment",
+      "suggestion": "optional exact replacement text"
+    }
+  ]
+}
+```
+
+## Hard rules
+
+- Do not switch branches.
+- Do not edit any repository file. Your only write is the findings JSON.
+- Do not commit. Do not push.
+- Only flag issues on changed right-side lines that fall inside a diff hunk
+  in `pr.diff`. Findings outside the diff scope will be discarded by the
+  validator.
+- Do not flag non-capturing lambdas or method references as "unnecessary
+  allocations" — in practice the JVM links each such call site once and
+  reuses a single instance, so nothing is allocated per invocation.
+- Use `suggestion` text only when the replacement is exact and ready to apply
+  via GitHub's suggestion UI.
+- For a deletion suggestion, set `start_line` and `line` to span the lines to
+  remove and set `suggestion` to the empty string `""`.
+- Return no comments for uncertain or low-confidence observations. Silence is
+  better than noise.
@@ -0,0 +1,70 @@
+"""Shared helpers for the pr-review workflow scripts.
+
+Kept intentionally small: the full pr-triage `common` module includes
+branch-restoration, Copilot CLI handoff, and other helpers the review
+workflow does not need. This module covers only what the three review
+scripts in this directory actually use.
+"""
+
+from __future__ import annotations
+
+import json
+import shlex
+import subprocess
+import sys
+from dataclasses import dataclass, field
+from pathlib import Path
+from typing import Any
+
+
+# Force UTF-8 on parent stdout/stderr so unicode characters in subprocess
+# output don't crash the default cp1252 codec on Windows.
+for _stream in (sys.stdout, sys.stderr):
+    _reconfigure = getattr(_stream, "reconfigure", None)
+    if _reconfigure is not None:
+        _reconfigure(encoding="utf-8", errors="replace")
+
+
+@dataclass
+class Summary:
+    """Lightweight bag of side-effect results, threaded through helpers.
+
+    Only ``pr`` is required; the remaining fields default to ``None`` (or to
+    a fresh empty list for ``notes``). Field order is part of the positional
+    constructor signature, so new fields should be appended at the end.
+    """
+
+    # PR number — presumably the pull request being reviewed; confirm with callers.
+    pr: int
+    # NOTE(review): the fields below are not read anywhere in this module;
+    # their meanings are inferred from their names — confirm with the scripts
+    # that populate them.
+    pr_url: str | None = None
+    review_url: str | None = None
+    temp_dir: str | None = None
+    # default_factory gives every instance its own list instead of a shared one.
+    notes: list[str] = field(default_factory=list)
+
+
+def progress(message: str) -> None:
+    print(f"[review] {message}", flush=True)
+
+
+def _run(cmd: list[str], summary: Summary | None = None, check: bool = True) -> subprocess.CompletedProcess[str]:
+    if summary is not None:
+        progress("Running: " + " ".join(shlex.quote(part) for part in cmd))
+    return subprocess.run(
+        cmd,
+        capture_output=True,
+        text=True,
+        encoding="utf-8",
+        errors="replace",
+        check=check,
+    )
+
+
+def gh(args: list[str], summary: Summary | None = None, check: bool = True) -> subprocess.CompletedProcess[str]:
+    return _run(["gh", *args], summary, check)
+
+
+def gh_json(args: list[str], summary: Summary | None = None) -> Any:
+    result = gh(args, summary)
+    return json.loads(result.stdout or "null")
+
+
+def detect_repo(summary: Summary | None = None) -> str:
+    return gh(["repo", "view", "--json", "nameWithOwner", "-q", ".nameWithOwner"], summary).stdout.strip()
+
+
+def write_json(path: Path, value: Any) -> None:
+    path.write_text(json.dumps(value, indent=2, sort_keys=True) + "\n", encoding="utf-8")
@@ -0,0 +1,164 @@
+#!/usr/bin/env python3
+"""Gate the pr-review workflow: resolve trigger, validate, emit outputs.
+
+Reads trigger context from environment variables, decides whether the agent
+should run, and writes outputs to $GITHUB_OUTPUT:
+
+  should_run     - "true" if the agent should run, else "false"
+  pr_number      - PR number to review
+  model          - resolved Copilot model (default if override invalid)
+  model_warning  - human-readable warning if the requested model was rejected
+  triggered_by   - short string for the review-body footer
+  base_ref_oid   - PR base commit SHA, used by the agent's checkout step
+
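+Required env: GH_TOKEN, EVENT_NAME, DEFAULT_MODEL, ALLOWED_MODELS,
+GITHUB_REPOSITORY, plus the trigger-specific variables: PR_FROM_PR_EVENT for
+pull_request_target; PR_FROM_COMMENT, COMMENT_BODY and COMMENT_AUTHOR for
+issue_comment. GITHUB_OUTPUT is optional; without it outputs go to stdout.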
+"""
+
+from __future__ import annotations
+
+import os
+import re
+import sys
+from pathlib import Path
+
+from common import gh_json, progress
+
+
+# Matches a string that is exactly ``/review``, optionally followed by
+# whitespace and one whitespace-free token. Group 1 is that token (None when
+# absent); resolve_trigger treats it as the requested model name.
+REVIEW_RE = re.compile(r"^/review(?:\s+(\S+))?\s*$")
+
+
+def emit(outputs: dict[str, str]) -> None:
+    path = os.environ.get("GITHUB_OUTPUT")
+    if not path:
+        for key, value in outputs.items():
+            print(f"{key}={value}")
+        return
+    with Path(path).open("a", encoding="utf-8") as f:
+        for key, value in outputs.items():
+            if "\n" in value:
+                f.write(f"{key}<<__GATE_EOF__\n{value}\n__GATE_EOF__\n")
+            else:
+                f.write(f"{key}={value}\n")
+
+
+def skip(reason: str) -> int:
+    progress(f"Gate: {reason} - skipping run.")
+    emit(
+        {
+            "should_run": "false",
+            "pr_number": "",
+            "model": "",
+            "model_warning": "",
+            "triggered_by": "",
+            "base_ref_oid": "",
+        }
+    )
+    return 0
+
+
+def resolve_model(requested: str, default_model: str, allowed_models: str) -> tuple[str, str]:
+    if not requested:
+        return default_model, ""
+    allowed = {m.strip() for m in allowed_models.split(",") if m.strip()}
+    if requested in allowed:
+        return requested, ""
+    return (
+        default_model,
+        f"requested model `{requested}` is not in the allowlist; using default `{default_model}`.",
+    )
+
+
+def commenter_has_write_access(repo: str, login: str) -> bool:
+    # gh returns non-zero (404) for users without an explicit collaborator
+    # entry, which we treat the same as "no write access". This also denies
+    # on transient gh/API failures, which is the safer default for a gate
+    # that controls whether the reviewer agent runs.
+    try:
+        result = gh_json(
+            ["api", f"repos/{repo}/collaborators/{login}/permission", "-q", ".permission"],
+        )
+    except Exception:
+        return False
+    # gh_json returns parsed JSON; with -q the output is a bare string.
+    return result in {"admin", "write"}
+
+
+class SkipRun(Exception):
+    """Raised to abort the gate cleanly with a skip outcome.
+
+    The exception message is the human-readable skip reason; ``main`` passes
+    ``str(exc)`` to ``skip``.
+    """
+
+
+def resolve_trigger(env: dict[str, str]) -> tuple[str, str, str, str]:
+    """Return (pr, model, warning, triggered_by). Raises SkipRun to skip."""
+    event = env.get("EVENT_NAME", "")
+    default_model = env.get("DEFAULT_MODEL", "")
+    allowed_models = env.get("ALLOWED_MODELS", "")
+    repo = env.get("GITHUB_REPOSITORY", "")
+
+    if event == "pull_request_target":
+        pr = env.get("PR_FROM_PR_EVENT", "")
+        if not pr:
+            raise SkipRun("no PR number on pull_request_target event")
+        model, warning = resolve_model("", default_model, allowed_models)
+        return pr, model, warning, "ready_for_review"
+
+    if event == "issue_comment":
+        pr = env.get("PR_FROM_COMMENT", "")
+        if not pr:
+            raise SkipRun("no PR number on issue_comment event")
+        body = (env.get("COMMENT_BODY", "") or "").strip()
+        match = REVIEW_RE.match(body)
+        if not match:
+            raise SkipRun("comment body does not match /review[ <model>]")
+        author = env.get("COMMENT_AUTHOR", "")
+        if not author or not commenter_has_write_access(repo, author):
+            raise SkipRun(f"commenter @{author} lacks write permission")
+        requested_model = match.group(1) or ""
+        model, warning = resolve_model(requested_model, default_model, allowed_models)
+        return pr, model, warning, f"`/review` by @{author}"
+
+    raise SkipRun(f"unsupported event: {event}")
+
+
+def pr_state(repo: str, pr: str) -> dict | None:
+    try:
+        return gh_json(
+            ["pr", "view", pr, "--repo", repo, "--json", "state,baseRefOid,isDraft,number"],
+        )
+    except Exception:
+        return None
+
+
+def main() -> int:
+    env = os.environ
+    repo = env.get("GITHUB_REPOSITORY", "")
+
+    try:
+        pr, model, warning, triggered_by = resolve_trigger(env)
+        info = pr_state(repo, pr)
+        if not info:
+            raise SkipRun(f"PR #{pr} not found")
+        if info.get("state") != "OPEN":
+            raise SkipRun(f"PR #{pr} is not open (state={info.get('state')})")
+        if info.get("isDraft") and env.get("EVENT_NAME") != "issue_comment":
+            raise SkipRun(f"PR #{pr} is a draft and trigger is {env.get('EVENT_NAME')}")
+        base_ref_oid = info.get("baseRefOid", "")
+    except SkipRun as e:
+        return skip(str(e))
+
+    progress(f"Gate accepted: pr={pr} trigger={triggered_by} model={model}")
+    emit(
+        {
+            "should_run": "true",
+            "pr_number": str(pr),
+            "model": model,
+            "model_warning": warning,
+            "triggered_by": triggered_by,
+            "base_ref_oid": base_ref_oid,
+        }
+    )
+    return 0
+
+
+if __name__ == "__main__":
+    sys.exit(main())