Merge branch 'merge-upstream-batch2' into develop

yestion · yestion · commit 0f8c9353a4e7 · 2025-12-22T20:20:53.000+08:00
合并上游第二批特性： - PR sunmh207#130: 项目级别的 Prompt 模板配置 - PR sunmh207#148: 批量审查功能 主要功能： 1. 支持为不同项目设置专属的 prompt 模板文件 2. 批量审查：按文件分批次审查，避免上下文过长 3. 智能汇总：多批次审查结果自动汇总 4. 保留 Gitea 平台支持
diff --git a/biz/queue/worker.py b/biz/queue/worker.py
@@ -39,8 +39,10 @@ def handle_push_event(webhook_data: dict, gitlab_token: str, gitlab_url: str, gi
             review_result = "关注的文件没有修改"
 
             if len(changes) > 0:
+                project_name = webhook_data['project']['name']
                 commits_text = ';'.join(commit.get('message', '').strip() for commit in commits)
-                review_result = CodeReviewer().review_and_strip_code(str(changes), commits_text)
+                code_reviewer = CodeReviewer()
+                review_result = code_reviewer.review_changes_in_batches(changes, commits_text, project_name)
                 score = CodeReviewer.parse_review_score(review_text=review_result)
                 for item in changes:
                     additions += item['additions']
@@ -133,9 +135,11 @@ def handle_merge_request_event(webhook_data: dict, gitlab_token: str, gitlab_url
             logger.error('Failed to get commits')
             return
 
-        # review 代码
+        # review 代码 - 使用批量审查方法
+        project_name = webhook_data['project']['name']
         commits_text = ';'.join(commit['title'] for commit in commits)
-        review_result = CodeReviewer().review_and_strip_code(str(changes), commits_text)
+        code_reviewer = CodeReviewer()
+        review_result = code_reviewer.review_changes_in_batches(changes, commits_text, project_name)
 
         # 将review结果提交到Gitlab的 notes
         handler.add_merge_request_notes(f'Auto Review Result: \n{review_result}')
@@ -189,8 +193,10 @@ def handle_github_push_event(webhook_data: dict, github_token: str, github_url:
             review_result = "关注的文件没有修改"
 
             if len(changes) > 0:
+                project_name = webhook_data['repository']['name']
                 commits_text = ';'.join(commit.get('message', '').strip() for commit in commits)
-                review_result = CodeReviewer().review_and_strip_code(str(changes), commits_text)
+                code_reviewer = CodeReviewer()
+                review_result = code_reviewer.review_changes_in_batches(changes, commits_text, project_name)
                 score = CodeReviewer.parse_review_score(review_text=review_result)
                 for item in changes:
                     additions += item.get('additions', 0)
@@ -273,9 +279,11 @@ def handle_github_pull_request_event(webhook_data: dict, github_token: str, gith
             logger.error('Failed to get commits')
             return
 
-        # review 代码
+        # review 代码 - 使用批量审查方法
+        project_name = webhook_data['repository']['name']
         commits_text = ';'.join(commit['title'] for commit in commits)
-        review_result = CodeReviewer().review_and_strip_code(str(changes), commits_text)
+        code_reviewer = CodeReviewer()
+        review_result = code_reviewer.review_changes_in_batches(changes, commits_text, project_name)
 
         # 将review结果提交到GitHub的 notes
         handler.add_pull_request_notes(f'Auto Review Result: \n{review_result}')
@@ -328,8 +336,10 @@ def handle_gitea_push_event(webhook_data: dict, gitea_token: str, gitea_url: str
             review_result = "关注的文件没有修改"
 
             if len(changes) > 0:
+                project_name = webhook_data.get('repository', {}).get('name')
                 commits_text = ';'.join(commit.get('message', '').strip() for commit in commits)
-                review_result = CodeReviewer().review_and_strip_code(str(changes), commits_text)
+                code_reviewer = CodeReviewer()
+                review_result = code_reviewer.review_changes_in_batches(changes, commits_text, project_name)
                 score = CodeReviewer.parse_review_score(review_text=review_result)
                 for item in changes:
                     additions += item.get('additions', 0)
@@ -406,8 +416,10 @@ def handle_gitea_pull_request_event(webhook_data: dict, gitea_token: str, gitea_
             logger.error('Failed to get commits for Gitea pull request')
             return
 
+        project_name = webhook_data.get('repository', {}).get('name')
         commits_text = ';'.join(commit.get('title', '') for commit in commits)
-        review_result = CodeReviewer().review_and_strip_code(str(changes), commits_text)
+        code_reviewer = CodeReviewer()
+        review_result = code_reviewer.review_changes_in_batches(changes, commits_text, project_name)
 
         handler.add_pull_request_notes(f'Auto Review Result: \n{review_result}')
 
diff --git a/biz/utils/code_reviewer.py b/biz/utils/code_reviewer.py
@@ -1,7 +1,7 @@
 import abc
 import os
 import re
-from typing import Dict, Any, List
+from typing import Dict, Any, List, Optional
 
 import yaml
 from jinja2 import Template
@@ -16,11 +16,20 @@ class BaseReviewer(abc.ABC):
 
     def __init__(self, prompt_key: str):
         self.client = Factory().getClient()
-        self.prompts = self._load_prompts(prompt_key, os.getenv("REVIEW_STYLE", "professional"))
+        self.prompts = self._load_prompts(prompt_key)
 
-    def _load_prompts(self, prompt_key: str, style="professional") -> Dict[str, Any]:
+    def _load_prompts(
+        self, prompt_key: str, style: Optional[str] = None, prompt_templates_file: Optional[str] = None
+    ) -> Dict[str, Any]:
         """加载提示词配置"""
-        prompt_templates_file = "conf/prompt_templates.yml"
+        if not style:
+            # 如果未提供, 从环境变量中获取审查风格，默认为 "professional"
+            style = os.getenv("REVIEW_STYLE", "professional")
+
+        if not prompt_templates_file:
+            # 如果未提供, 使用默认的提示词配置文件路径
+            prompt_templates_file = "conf/prompt_templates.yml"
+
         try:
             # 在打开 YAML 文件时显式指定编码为 UTF-8，避免使用系统默认的 GBK 编码。
             with open(prompt_templates_file, "r", encoding="utf-8") as file:
@@ -60,12 +69,13 @@ class CodeReviewer(BaseReviewer):
     def __init__(self):
         super().__init__("code_review_prompt")
 
-    def review_and_strip_code(self, changes_text: str, commits_text: str = "") -> str:
+    def review_and_strip_code(self, changes_text: str, commits_text: str = "", project_name: str = "") -> str:
         """
         Review判断changes_text超出取前REVIEW_MAX_TOKENS个token，超出则截断changes_text，
         调用review_code方法，返回review_result，如果review_result是markdown格式，则去掉头尾的```
-        :param changes_text:
-        :param commits_text:
+        :param changes_text: 代码变更内容
+        :param commits_text: 提交信息
+        :param project_name: 项目名称
         :return:
         """
         # 如果超长，取前REVIEW_MAX_TOKENS个token
@@ -80,29 +90,152 @@ def review_and_strip_code(self, changes_text: str, commits_text: str = "") -> st
         if tokens_count > review_max_tokens:
             changes_text = truncate_text_by_tokens(changes_text, review_max_tokens)
 
-        review_result = self.review_code(changes_text, commits_text).strip()
+        review_result = self.review_code(changes_text, commits_text, project_name).strip()
         if review_result.startswith("```markdown") and review_result.endswith("```"):
             return review_result[11:-3].strip()
         return review_result
 
-    def review_code(self, diffs_text: str, commits_text: str = "") -> str:
+    def review_code(self, diffs_text: str, commits_text: str = "", project_name: str = "") -> str:
         """Review 代码并返回结果"""
+        # Per-project template path: env "<PROJECT>_PROMPT" ('-' -> '_', upper-cased). A None/empty project
+        # name (callers may pass None) skips the lookup instead of raising AttributeError on .upper().
+        project_prompts_path = os.getenv(f"{project_name.replace('-', '_').upper()}_PROMPT") if project_name else None
+        # Reloaded on every call so edits to a project-level prompt file take effect without a restart.
+        prompts = (
+            self._load_prompts(prompt_key="code_review_prompt", prompt_templates_file=project_prompts_path)
+            if project_prompts_path
+            else self.prompts
+        )
         messages = [
-            self.prompts["system_message"],
+            prompts["system_message"],
             {
                 "role": "user",
-                "content": self.prompts["user_message"]["content"].format(
-                    diffs_text=diffs_text, commits_text=commits_text
-                ),
+                "content": prompts["user_message"]["content"].format(diffs_text=diffs_text, commits_text=commits_text),
             },
         ]
         return self.call_llm(messages)
 
+    def review_changes_in_batches(self, changes: List[Dict[str, Any]], commits_text: str = "", project_name: str = "") -> str:
+        """
+        Review the changes in batches of files, then merge the partial reviews into one report.
+
+        Environment variables read here:
+        - BATCH_REVIEW_ENABLED: "1" (default) enables batching; any other value falls back to one-shot review
+        - BATCH_REVIEW_FILES_PER_BATCH: files per batch (default 1, clamped to at least 1)
+        - REVIEW_MAX_TOKENS: token budget per batch (default 10000); longer batch text is truncated
+
+        :param changes: list of change dicts; 'new_path' / 'old_path' are read to label each batch
+        :param commits_text: commit messages forwarded to the review prompt
+        :param project_name: project name forwarded to review_code / _summarize_reviews
+        :return: the lone batch's review, or the merged summary when there are several batches
+        """
+        if not changes:
+            logger.info("代码变更为空")
+            return "代码为空"
+
+        # Batching disabled: keep the original single-request review path.
+        if os.getenv("BATCH_REVIEW_ENABLED", "1") != "1":
+            logger.info("批量审查功能未启用，使用传统一次性审查方式")
+            return self.review_and_strip_code(str(changes), commits_text, project_name)
+
+        review_max_tokens = int(os.getenv("REVIEW_MAX_TOKENS", 10000))
+        # Clamp to >= 1: a step of 0 makes range() raise ValueError, a negative step yields no batches.
+        files_per_batch = max(1, int(os.getenv("BATCH_REVIEW_FILES_PER_BATCH", 1)))
+        logger.info(f"批量审查已启用，每批次审查 {files_per_batch} 个文件")
+
+        partial_reviews = []
+        total_files = len(changes)
+        # Ceiling division; loop-invariant, so computed once instead of per iteration.
+        total_batches = (total_files + files_per_batch - 1) // files_per_batch
+
+        for batch_num, batch_start in enumerate(range(0, total_files, files_per_batch), start=1):
+            batch_end = min(batch_start + files_per_batch, total_files)
+            batch_changes = changes[batch_start:batch_end]
+
+            logger.info(f"正在审查第 {batch_num}/{total_batches} 批次 (文件 {batch_start + 1}-{batch_end}/{total_files})")
+
+            # Label the batch with its file paths. Built before the try block so that a failed batch
+            # still says which files it covered; str()/'unknown' keep join() safe for missing paths.
+            batch_file_paths = [
+                str(change.get('new_path') or change.get('old_path') or 'unknown')
+                for change in batch_changes
+            ]
+            batch_header = f"### 批次 {batch_num} (文件: {', '.join(batch_file_paths)})\n"
+
+            # Serialize the batch and truncate it when it exceeds the token budget.
+            batch_text = str(batch_changes)
+            if count_tokens(batch_text) > review_max_tokens:
+                logger.warning(f"批次 {batch_num} 的变更超过 {review_max_tokens} tokens，将截断")
+                batch_text = truncate_text_by_tokens(batch_text, review_max_tokens)
+
+            # Best effort: a failing batch is recorded in the report and the remaining batches still run.
+            try:
+                review_result = self.review_code(batch_text, commits_text, project_name).strip()
+                # Unwrap a reply that is fenced as one ```markdown block.
+                if review_result.startswith("```markdown") and review_result.endswith("```"):
+                    review_result = review_result[11:-3].strip()
+
+                partial_reviews.append(f"{batch_header}{review_result}")
+                logger.info(f"批次 {batch_num} 审查完成")
+            except Exception as e:
+                logger.error(f"审查批次 {batch_num} 时出错: {e}")
+                # Keep the header on the failure entry so the report shows which files were not reviewed.
+                partial_reviews.append(f"{batch_header}审查失败: {str(e)}")
+
+        # A single batch needs no merge step: drop its header line and return the body.
+        if len(partial_reviews) == 1:
+            only_review = partial_reviews[0]
+            lines = only_review.split('\n', 1)
+            return lines[1] if len(lines) > 1 else only_review
+
+        # Several batches: merge the partial reviews into one report.
+        logger.info(f"开始汇总 {len(partial_reviews)} 个批次的审查结果")
+        summary_result = self._summarize_reviews(partial_reviews, project_name)
+        return summary_result
+
+    def _summarize_reviews(self, partial_reviews: List[str], project_name: str = "") -> str:
+        """
+        Merge several per-batch reviews into one report using the summary_merge_review_prompt templates.
+
+        :param partial_reviews: review text of each batch
+        :param project_name: project name; selects a project-level template file through the
+            "<PROJECT_NAME>_PROMPT" environment variable ('-' mapped to '_', upper-cased) when set
+        :return: the merged report, unwrapped from a surrounding ```markdown fence if present
+        """
+        # Guard against a None/empty project_name: calling .upper() on None would raise
+        # AttributeError here, outside any try/except, so the env lookup is skipped instead.
+        project_prompts_path = os.getenv(f"{project_name.replace('-', '_').upper()}_PROMPT") if project_name else None
+
+        # _load_prompts falls back to the default template file and to REVIEW_STYLE on its own when
+        # they are not supplied, so one call covers both the project-level and the default case.
+        summary_prompts = self._load_prompts(
+            prompt_key="summary_merge_review_prompt", prompt_templates_file=project_prompts_path
+        )
+
+        # Join the per-batch reviews, separated by a markdown horizontal rule.
+        partial_reviews_text = "\n\n---\n\n".join(partial_reviews)
+
+        messages = [
+            summary_prompts["system_message"],
+            {
+                "role": "user",
+                "content": summary_prompts["user_message"]["content"].format(
+                    partial_reviews_text=partial_reviews_text
+                ),
+            },
+        ]
+
+        summary_result = self.call_llm(messages).strip()
+        if summary_result.startswith("```markdown") and summary_result.endswith("```"):
+            summary_result = summary_result[11:-3].strip()
+
+        logger.info("审查结果汇总完成")
+        return summary_result
+
     @staticmethod
     def parse_review_score(review_text: str) -> int:
         """解析 AI 返回的 Review 结果，返回评分"""
         if not review_text:
             return 0
         match = re.search(r"总分[:：]\s*(\d+)分?", review_text)
         return int(match.group(1)) if match else 0
-
diff --git a/conf/prompt_templates.yml b/conf/prompt_templates.yml
@@ -41,3 +41,55 @@ code_review_prompt:
     
     提交历史(commits)：
     {commits_text}
+
+summary_merge_review_prompt:
+  system_prompt: |-
+    你是一位高级软件架构师，现在需要对多个分批完成的代码审查结果进行整合成一个完整的总审查报告。
+
+    你的职责：
+    1. 重新整合多个批次的审查结果，形成"统一评分的总报告"
+    2. 不得丢失开发者定位问题所需的"批次级详细描述"
+    3. 在顶层总结问题趋势及关键风险
+    4. 根据全量问题重新统一打分
+
+    ---
+
+    汇总结构必须包含以下 3 部分：
+
+    ### 第一部分：全局问题总结与优化建议（进行归类整合，去重问题）
+    - 从所有批次报告中抽取共性问题进行分类总结
+    - 以整体角度提出优化方向，而不是重复粘贴批次内容
+
+    ### 第二部分：分批次详细问题保留区（必须原样结构化保留）
+    你的任务是按以下格式保留批次细节，不得简化或省略：
+    ```
+    #### 批次 X（文件范围/来源说明）
+    <保留该批完整的"问题描述与评分明细"，不得删减内容>
+    ```
+
+    这样开发者能快速找到"哪个文件在哪个批次出了什么问题"。
+
+    ### 第三部分：统一评分明细与总分（你必须重新评分）
+    - 你需要结合多个批次的影响范围重新量化总评分，而不是平均或取最大值
+    - 格式如下：
+      ```
+      - 功能实现的正确性与健壮性：XX分
+      - 安全性与潜在风险：XX分
+      - 是否符合最佳实践：XX分
+      - 性能与资源效率：XX分
+      - 提交信息清晰性与准确性：XX分
+      ```
+
+    最后一行必须为：**总分:XX分**
+
+    ---
+
+    自检规则：
+    - 若未包含"分批次详细问题保留区"则需重新生成
+    - 若未重新统一评分，而直接引用批次数值，则需重新评分
+    - 若缺少"总分:XX分"，必须重新生成
+    - 若全局总结部分只是重复批次内容，必须进行整合后重新生成
+
+  user_prompt: |-
+    以下是分批次代码审查结果，请将其整合为一个完整的总审查报告，并统一量化评分：
+    {partial_reviews_text}