# CodeReview/backend/app/services/agent/agents/orchestrator.py

"""
Orchestrator Agent (编排层) - LLM 驱动版

LLM 是真正的大脑，全程参与决策！
- LLM 决定下一步做什么
- LLM 决定调度哪个子 Agent
- LLM 决定何时完成
- LLM 根据中间结果动态调整策略

类型: Autonomous Agent with Dynamic Planning
"""

import asyncio
import json
import logging
import os
import re
from typing import List, Dict, Any, Optional
from dataclasses import dataclass

from .base import BaseAgent, AgentConfig, AgentResult, AgentType, AgentPattern
from ..json_parser import AgentJsonParser
from ..prompts import MULTI_AGENT_RULES, CORE_SECURITY_PRINCIPLES

# Module-level logger, named after this module.
logger = logging.getLogger(__name__)


# System prompt sent to the orchestrator LLM as the first ("system") message.
# It lists the three sub-agents the LLM may dispatch (recon, analysis,
# verification), the three actions it may take (dispatch_agent, summarize,
# finish) and the "Thought / Action / Action Input" reply format that
# OrchestratorAgent._parse_llm_response extracts with regular expressions.
# NOTE: this is runtime text consumed by the LLM; it is intentionally kept in
# its original language and must not be edited for cosmetic reasons.
ORCHESTRATOR_SYSTEM_PROMPT = """你是 DeepAudit 的编排 Agent，负责**自主**协调整个安全审计流程。

## 你的角色
你是整个审计流程的**大脑**，不是一个机械执行者。你需要：
1. 自主思考和决策
2. 根据观察结果动态调整策略
3. 决定何时调用哪个子 Agent
4. 判断何时审计完成

## 你可以调度的子 Agent
1. **recon**: 信息收集 Agent - 分析项目结构、技术栈、入口点
2. **analysis**: 分析 Agent - 深度代码审计、漏洞检测
3. **verification**: 验证 Agent - 验证发现的漏洞、生成 PoC

## 你可以使用的操作

### 1. 调度子 Agent
```
Action: dispatch_agent
Action Input: {"agent": "recon|analysis|verification", "task": "具体任务描述", "context": "任务上下文"}
```

### 2. 汇总发现
```
Action: summarize
Action Input: {"findings": [...], "analysis": "你的分析"}
```

### 3. 完成审计
```
Action: finish
Action Input: {"conclusion": "审计结论", "findings": [...], "recommendations": [...]}
```

## 工作方式
每一步，你需要：

1. **Thought**: 分析当前状态，思考下一步应该做什么
   - 目前收集到了什么信息？
   - 还需要了解什么？
   - 应该深入分析哪些地方？
   - 有什么发现需要验证？

2. **Action**: 选择一个操作
3. **Action Input**: 提供操作参数

## 输出格式
每一步必须严格按照以下格式：

```
Thought: [你的思考过程]
Action: [dispatch_agent|summarize|finish]
Action Input: [JSON 参数]
```

## 审计策略建议
- 先用 recon Agent 了解项目全貌（只需调度一次）
- 根据 recon 结果，让 analysis Agent 重点审计高风险区域
- 发现可疑漏洞后，用 verification Agent 验证
- 随时根据新发现调整策略，不要机械执行
- 当你认为审计足够全面时，选择 finish

## 重要原则
1. **你是大脑，不是执行器** - 每一步都要思考
2. **动态调整** - 根据发现调整策略
3. **主动决策** - 不要等待，主动推进
4. **质量优先** - 宁可深入分析几个真实漏洞，不要浅尝辄止
5. **避免重复** - 每个 Agent 通常只需要调度一次，如果结果不理想，尝试其他 Agent 或直接完成审计

## 处理子 Agent 结果
- 子 Agent 返回的 Observation 包含它们的分析结果
- 即使结果看起来不完整，也要基于已有信息继续推进
- 不要反复调度同一个 Agent 期望得到不同结果
- 如果 recon 完成后，应该调度 analysis 进行深度分析
- 如果 analysis 完成后有发现，可以调度 verification 验证
- 如果没有更多工作要做，使用 finish 结束审计

现在，基于项目信息开始你的审计工作！"""


@dataclass
class AgentStep:
    """One orchestration step: the LLM's decision plus what came back from it."""
    # Text captured after "Thought:" in the LLM reply ("" when absent).
    thought: str
    # Identifier captured after "Action:"; the run loop handles
    # "dispatch_agent", "summarize" and "finish".
    action: str
    # Parsed "Action Input:" payload for the action.
    action_input: Dict[str, Any]
    # Observation text produced by executing the action; filled in by the
    # run loop after the step has been created.
    observation: Optional[str] = None
    # NOTE(review): not assigned anywhere in the visible part of this file;
    # presumably reserved for the raw sub-agent result - confirm against callers.
    sub_agent_result: Optional[AgentResult] = None


class OrchestratorAgent(BaseAgent):
    """
    编排 Agent - LLM 驱动版
    
    LLM 全程参与决策：
    1. LLM 思考当前状态
    2. LLM 决定下一步操作
    3. 执行操作，获取结果
    4. LLM 分析结果，决定下一步
    5. 重复直到 LLM 决定完成
    """
    
    def __init__(
        self,
        llm_service,
        tools: Dict[str, Any],
        event_emitter=None,
        sub_agents: Optional[Dict[str, BaseAgent]] = None,
        tracer=None,
    ):
        """
        Create the orchestrator and its per-run bookkeeping containers.

        Args:
            llm_service: LLM backend, forwarded to the base class.
            tools: Tool mapping, forwarded to the base class.
            event_emitter: Optional event sink, forwarded to the base class.
            sub_agents: Optional mapping of agent name -> sub-agent; an empty
                dict is used when omitted (or falsy).
            tracer: Optional telemetry tracer, stored as ``self.tracer``.
        """
        # System prompt = orchestrator prompt + core security principles +
        # multi-agent collaboration rules, separated by blank lines.
        combined_prompt = "{}\n\n{}\n\n{}".format(
            ORCHESTRATOR_SYSTEM_PROMPT,
            CORE_SECURITY_PRINCIPLES,
            MULTI_AGENT_RULES,
        )

        agent_config = AgentConfig(
            name="Orchestrator",
            agent_type=AgentType.ORCHESTRATOR,
            pattern=AgentPattern.REACT,
            max_iterations=20,
            system_prompt=combined_prompt,
        )
        super().__init__(agent_config, llm_service, tools, event_emitter)

        # Telemetry hook.
        self.tracer = tracer

        # Registered sub-agents, keyed by the name the LLM uses to dispatch them.
        self.sub_agents = sub_agents if sub_agents else {}

        # Conversation and decision trace of the current run.
        self._conversation_history: List[Dict[str, str]] = []
        self._steps: List[AgentStep] = []
        self._all_findings: List[Dict] = []

        # Runtime context (project info, config, ...) handed to sub-agents.
        self._runtime_context: Dict[str, Any] = {}

        # agent_name -> number of dispatches, used to limit repeated dispatching.
        self._dispatched_tasks: Dict[str, int] = {}

        # agent_name -> full result data, passed on to later sub-agents.
        self._agent_results: Dict[str, Dict[str, Any]] = {}
    
    def register_sub_agent(self, name: str, agent: BaseAgent):
        """注册子 Agent"""
        self.sub_agents[name] = agent
    
    def cancel(self):
        """
        取消执行 - 同时取消所有子 Agent
        
        重写父类方法，确保取消信号传播到所有子 Agent
        """
        self._cancelled = True
        logger.info(f"[{self.name}] Cancel requested, propagating to {len(self.sub_agents)} sub-agents")
        
        # 🔥 传播取消信号到所有子 Agent
        for name, agent in self.sub_agents.items():
            if hasattr(agent, 'cancel'):
                agent.cancel()
                logger.info(f"[{self.name}] Cancelled sub-agent: {name}")
    
    async def run(self, input_data: Dict[str, Any]) -> AgentResult:
        """
        执行编排任务 - LLM 全程参与！
        
        Args:
            input_data: {
                "project_info": 项目信息,
                "config": 审计配置,
                "project_root": 项目根目录,
                "task_id": 任务ID,
            }
        """
        import time
        start_time = time.time()
        
        project_info = input_data.get("project_info", {})
        config = input_data.get("config", {})
        
        # 🔥 保存运行时上下文，用于传递给子 Agent
        self._runtime_context = {
            "project_info": project_info,
            "config": config,
            "project_root": input_data.get("project_root", project_info.get("root", ".")),
            "task_id": input_data.get("task_id"),
        }
        
        # 构建初始消息
        initial_message = self._build_initial_message(project_info, config)
        
        # 初始化对话历史
        self._conversation_history = [
            {"role": "system", "content": self.config.system_prompt},
            {"role": "user", "content": initial_message},
        ]
        
        self._steps = []
        self._all_findings = []
        self._agent_results = {}  # 🔥 重置 Agent 结果缓存
        final_result = None
        error_message = None  # 🔥 跟踪错误信息
        
        await self.emit_thinking("🧠 Orchestrator Agent 启动，LLM 开始自主编排决策...")
        
        try:
            for iteration in range(self.config.max_iterations):
                if self.is_cancelled:
                    break
                
                self._iteration = iteration + 1
                
                # 🔥 再次检查取消标志（在LLM调用之前）
                if self.is_cancelled:
                    await self.emit_thinking("🛑 任务已取消，停止执行")
                    break
                
                # 调用 LLM 进行思考和决策（流式输出）
                try:
                    llm_output, tokens_this_round = await self.stream_llm_call(
                        self._conversation_history,
                        # 🔥 不传递 temperature 和 max_tokens，使用用户配置
                    )
                except asyncio.CancelledError:
                    logger.info(f"[{self.name}] LLM call cancelled")
                    break
                
                self._total_tokens += tokens_this_round
                
                # 🔥 检测空响应
                if not llm_output or not llm_output.strip():
                    logger.warning(f"[{self.name}] Empty LLM response")
                    empty_retry_count = getattr(self, '_empty_retry_count', 0) + 1
                    self._empty_retry_count = empty_retry_count
                    if empty_retry_count >= 5:  # 🔥 增加重试次数到5次
                        logger.error(f"[{self.name}] Too many empty responses, stopping")
                        error_message = "连续收到空响应，停止编排"
                        await self.emit_event("error", error_message)
                        break

                    # 🔥 添加短暂延迟，避免快速重试
                    await asyncio.sleep(1.0)

                    # 🔥 更详细的重试提示
                    retry_prompt = f"""收到空响应（第 {empty_retry_count} 次）。请严格按照以下格式输出你的决策：

Thought: [你对当前审计状态的思考]
Action: [dispatch_agent|summarize|finish]
Action Input: {{"参数": "值"}}

当前可调度的子 Agent: {list(self.sub_agents.keys())}
当前已收集发现: {len(self._all_findings)} 个

请立即输出你的下一步决策。"""

                    self._conversation_history.append({
                        "role": "user",
                        "content": retry_prompt,
                    })
                    continue
                
                # 重置空响应计数器
                self._empty_retry_count = 0

                # 🔥 检查是否是 API 错误（而非格式错误）
                if llm_output.startswith("[API_ERROR:"):
                    # 提取错误类型和消息
                    match = re.match(r"\[API_ERROR:(\w+)\]\s*(.*)", llm_output)
                    if match:
                        error_type = match.group(1)
                        error_message = match.group(2)

                        if error_type == "rate_limit":
                            # 速率限制 - 等待后重试
                            api_retry_count = getattr(self, '_api_retry_count', 0) + 1
                            self._api_retry_count = api_retry_count
                            if api_retry_count >= 3:
                                logger.error(f"[{self.name}] Too many rate limit errors, stopping")
                                await self.emit_event("error", f"API 速率限制重试次数过多: {error_message}")
                                break
                            logger.warning(f"[{self.name}] Rate limit hit, waiting before retry ({api_retry_count}/3)")
                            await self.emit_event("warning", f"API 速率限制，等待后重试 ({api_retry_count}/3)")
                            await asyncio.sleep(30)  # 等待 30 秒后重试
                            continue

                        elif error_type == "quota_exceeded":
                            # 配额用尽 - 终止任务
                            logger.error(f"[{self.name}] API quota exceeded: {error_message}")
                            await self.emit_event("error", f"API 配额已用尽: {error_message}")
                            break

                        elif error_type == "authentication":
                            # 认证错误 - 终止任务
                            logger.error(f"[{self.name}] API authentication error: {error_message}")
                            await self.emit_event("error", f"API 认证失败: {error_message}")
                            break

                        elif error_type == "connection":
                            # 连接错误 - 重试
                            api_retry_count = getattr(self, '_api_retry_count', 0) + 1
                            self._api_retry_count = api_retry_count
                            if api_retry_count >= 3:
                                logger.error(f"[{self.name}] Too many connection errors, stopping")
                                await self.emit_event("error", f"API 连接错误重试次数过多: {error_message}")
                                break
                            logger.warning(f"[{self.name}] Connection error, retrying ({api_retry_count}/3)")
                            await self.emit_event("warning", f"API 连接错误，重试中 ({api_retry_count}/3)")
                            await asyncio.sleep(5)  # 等待 5 秒后重试
                            continue

                        elif error_type == "server_error":
                            # 服务器错误 (5xx) - 重试
                            api_retry_count = getattr(self, '_api_retry_count', 0) + 1
                            self._api_retry_count = api_retry_count
                            if api_retry_count >= 3:
                                logger.error(f"[{self.name}] Too many server errors, stopping")
                                await self.emit_event("error", f"API 服务端错误重试次数过多: {error_message}")
                                break
                            logger.warning(f"[{self.name}] Server error, retrying ({api_retry_count}/3)")
                            await self.emit_event("warning", f"API 服务端繁忙或异常，重试中 ({api_retry_count}/3)")
                            await asyncio.sleep(10)  # 等待 10 秒后重试（服务端错误通常需要更久恢复）
                            continue

                # 重置 API 重试计数器（成功获取响应后）
                self._api_retry_count = 0

                # 解析 LLM 的决策
                step = self._parse_llm_response(llm_output)
                
                if not step:
                    # LLM 输出格式不正确，提示重试
                    format_retry_count = getattr(self, '_format_retry_count', 0) + 1
                    self._format_retry_count = format_retry_count
                    if format_retry_count >= 3:
                        logger.error(f"[{self.name}] Too many format errors, stopping")
                        error_message = "连续格式错误，停止编排"
                        await self.emit_event("error", error_message)
                        break
                    await self.emit_llm_decision("格式错误", "需要重新输出")
                    self._conversation_history.append({
                        "role": "assistant",
                        "content": llm_output,
                    })
                    self._conversation_history.append({
                        "role": "user",
                        "content": "请按照规定格式输出：Thought + Action + Action Input",
                    })
                    continue
                
                # 重置格式重试计数器
                self._format_retry_count = 0
                
                self._steps.append(step)
                
                # 🔥 发射 LLM 思考内容事件 - 展示编排决策的思考过程
                if step.thought:
                    await self.emit_llm_thought(step.thought, iteration + 1)
                
                # 添加 LLM 响应到历史
                self._conversation_history.append({
                    "role": "assistant",
                    "content": llm_output,
                })
                
                # 执行 LLM 决定的操作
                if step.action == "finish":
                    # 🔥 LLM 决定完成审计
                    await self.emit_llm_decision("完成审计", "LLM 判断审计已充分完成")
                    await self.emit_llm_complete(
                        f"编排完成，发现 {len(self._all_findings)} 个漏洞",
                        self._total_tokens
                    )
                    final_result = step.action_input
                    break
                
                elif step.action == "dispatch_agent":
                    # 🔥 LLM 决定调度子 Agent
                    agent_name = step.action_input.get("agent", "unknown")
                    task_desc = step.action_input.get("task", "")
                    await self.emit_llm_decision(
                        f"调度 {agent_name} Agent",
                        f"任务: {task_desc[:100]}"
                    )
                    await self.emit_llm_action("dispatch_agent", step.action_input)
                    
                    observation = await self._dispatch_agent(step.action_input)
                    step.observation = observation
                    
                    # 🔥 子 Agent 执行完成后检查取消状态
                    if self.is_cancelled:
                        logger.info(f"[{self.name}] Cancelled after sub-agent dispatch")
                        break
                    
                    # 🔥 发射观察事件
                    await self.emit_llm_observation(observation)
                    
                elif step.action == "summarize":
                    # LLM 要求汇总
                    await self.emit_llm_decision("汇总发现", "LLM 请求查看当前发现汇总")
                    observation = self._summarize_findings()
                    step.observation = observation
                    await self.emit_llm_observation(observation)
                    
                else:
                    observation = f"未知操作: {step.action}，可用操作: dispatch_agent, summarize, finish"
                    await self.emit_llm_decision("未知操作", observation)
                
                # 添加观察结果到历史
                self._conversation_history.append({
                    "role": "user",
                    "content": f"Observation:\n{step.observation}",
                })
            
            # 生成最终结果
            duration_ms = int((time.time() - start_time) * 1000)
            
            # 🔥 如果被取消，返回取消结果
            if self.is_cancelled:
                await self.emit_event(
                    "info",
                    f"🛑 Orchestrator 已取消: {len(self._all_findings)} 个发现, {self._iteration} 轮决策"
                )
                return AgentResult(
                    success=False,
                    error="任务已取消",
                    data={
                        "findings": self._all_findings,
                        "steps": [
                            {
                                "thought": s.thought,
                                "action": s.action,
                                "action_input": s.action_input,
                                "observation": s.observation[:500] if s.observation else None,
                            }
                            for s in self._steps
                        ],
                    },
                    iterations=self._iteration,
                    tool_calls=self._tool_calls,
                    tokens_used=self._total_tokens,
                    duration_ms=duration_ms,
                )
            
            # 🔥 如果有错误，返回失败结果
            if error_message:
                await self.emit_event(
                    "error",
                    f"❌ Orchestrator 失败: {error_message}"
                )
                return AgentResult(
                    success=False,
                    error=error_message,
                    data={
                        "findings": self._all_findings,
                        "steps": [
                            {
                                "thought": s.thought,
                                "action": s.action,
                                "action_input": s.action_input,
                                "observation": s.observation[:500] if s.observation else None,
                            }
                            for s in self._steps
                        ],
                    },
                    iterations=self._iteration,
                    tool_calls=self._tool_calls,
                    tokens_used=self._total_tokens,
                    duration_ms=duration_ms,
                )
            
            await self.emit_event(
                "info",
                f"🎯 Orchestrator 完成: {len(self._all_findings)} 个发现, {self._iteration} 轮决策"
            )

            # 🔥 CRITICAL: Log final findings count before returning
            logger.info(f"[Orchestrator] Final result: {len(self._all_findings)} findings collected")
            if len(self._all_findings) == 0:
                logger.warning(f"[Orchestrator] ⚠️ No findings collected! Dispatched agents: {list(self._dispatched_tasks.keys())}, Iterations: {self._iteration}")
            for i, f in enumerate(self._all_findings[:5]):  # Log first 5 for debugging
                logger.debug(f"[Orchestrator] Finding {i+1}: {f.get('title', 'N/A')} - {f.get('vulnerability_type', 'N/A')}")

            return AgentResult(
                success=True,
                data={
                    "findings": self._all_findings,
                    "summary": final_result or self._generate_default_summary(),
                    "steps": [
                        {
                            "thought": s.thought,
                            "action": s.action,
                            "action_input": s.action_input,
                            "observation": s.observation[:500] if s.observation else None,
                        }
                        for s in self._steps
                    ],
                },
                iterations=self._iteration,
                tool_calls=self._tool_calls,
                tokens_used=self._total_tokens,
                duration_ms=duration_ms,
            )
            
        except Exception as e:
            logger.error(f"Orchestrator failed: {e}", exc_info=True)
            return AgentResult(
                success=False,
                error=str(e),
            )
    
    def _build_initial_message(
        self,
        project_info: Dict[str, Any],
        config: Dict[str, Any],
    ) -> str:
        """构建初始消息"""
        structure = project_info.get('structure', {})
        
        # 🔥 检查是否是限定范围的审计
        scope_limited = structure.get('scope_limited', False)
        scope_message = structure.get('scope_message', '')
        
        msg = f"""请开始对以下项目进行安全审计。

## 项目信息
- 名称: {project_info.get('name', 'unknown')}
- 语言: {project_info.get('languages', [])}
- 文件数量: {project_info.get('file_count', 0)}
"""
        
        # 🔥 根据是否限定范围显示不同的结构信息
        if scope_limited:
            msg += f"""
## ⚠️ 审计范围限定
**{scope_message}**

### 目标文件列表
"""
            for f in structure.get('files', []):
                msg += f"- {f}\n"
            
            if structure.get('directories'):
                msg += f"""
### 相关目录
{structure.get('directories', [])}
"""
        else:
            msg += f"""
## 目录结构
{json.dumps(structure, ensure_ascii=False, indent=2)}
"""
        
        # 🔥 如果配置了 target_files，也明确显示
        target_files = config.get('target_files', [])
        if target_files:
            msg += f"""
## ⚠️ 重要提示
用户指定了 **{len(target_files)}** 个目标文件进行审计。
请确保你的分析集中在这些指定的文件上，不要浪费时间分析其他文件。
"""
        
        msg += f"""
## 用户配置
- 目标漏洞: {config.get('target_vulnerabilities', ['all'])}
- 验证级别: {config.get('verification_level', 'sandbox')}
- 排除模式: {config.get('exclude_patterns', [])}

## 可用子 Agent
{', '.join(self.sub_agents.keys()) if self.sub_agents else '(暂无子 Agent)'}

请开始你的审计工作。首先思考应该如何开展，然后决定第一步做什么。"""
        
        return msg
    
    def _parse_llm_response(self, response: str) -> Optional[AgentStep]:
        """
        Parse a ``Thought / Action / Action Input`` reply into an ``AgentStep``.

        Args:
            response: Raw text returned by the LLM.

        Returns:
            An ``AgentStep`` with the extracted thought, action name and action
            input, or ``None`` when no ``Action:`` or no ``Action Input:``
            section can be found. The action input is always a dict: if the
            payload does not parse to a dict it is wrapped as
            ``{"raw": <text>}``.
        """
        # The LLM sometimes emits bold labels ("**Action:**"); normalise them
        # to the plain form the patterns below expect.
        cleaned_response = response
        for label in ("Action", "Action Input", "Thought", "Observation"):
            cleaned_response = cleaned_response.replace(f"**{label}:**", f"{label}:")

        # Thought: everything up to the next "Action:" (or end of text).
        thought_match = re.search(r'Thought:\s*(.*?)(?=Action:|$)', cleaned_response, re.DOTALL)
        thought = thought_match.group(1).strip() if thought_match else ""

        # Action: a single identifier; mandatory.
        action_match = re.search(r'Action:\s*(\w+)', cleaned_response)
        if not action_match:
            return None
        action = action_match.group(1).strip()

        # Action Input: everything up to the next section label; mandatory.
        input_match = re.search(r'Action Input:\s*(.*?)(?=Thought:|Observation:|$)', cleaned_response, re.DOTALL)
        if not input_match:
            return None

        input_text = input_match.group(1).strip()
        # Strip markdown code fences around the JSON payload.
        input_text = re.sub(r'```json\s*', '', input_text)
        input_text = re.sub(r'```\s*', '', input_text)

        action_input = AgentJsonParser.parse(
            input_text,
            default={"raw": input_text}
        )
        # Callers use action_input.get(...); a JSON list/scalar would crash
        # them, so fall back to the same shape as the parser default.
        if not isinstance(action_input, dict):
            action_input = {"raw": input_text}

        return AgentStep(
            thought=thought,
            action=action,
            action_input=action_input,
        )
    
    async def _dispatch_agent(self, params: Dict[str, Any]) -> str:
        """调度子 Agent"""
        agent_name = params.get("agent", "")
        task = params.get("task", "")
        context = params.get("context", "")
        
        logger.debug(f"[Orchestrator] _dispatch_agent 被调用: agent_name='{agent_name}', task='{task[:50]}...'")
        
        # 🔥 尝试大小写不敏感匹配
        agent = self.sub_agents.get(agent_name)
        if not agent:
            # 尝试小写匹配
            agent_name_lower = agent_name.lower()
            agent = self.sub_agents.get(agent_name_lower)
            if agent:
                agent_name = agent_name_lower
                logger.debug(f"[Orchestrator] 使用小写匹配: {agent_name}")
        
        if not agent:
            available = list(self.sub_agents.keys())
            logger.warning(f"[Orchestrator] Agent '{agent_name}' 不存在，可用: {available}")
            return f"错误: Agent '{agent_name}' 不存在。可用的 Agent: {available}"
        
        # 🔥 检查是否重复调度同一个 Agent
        dispatch_count = self._dispatched_tasks.get(agent_name, 0)
        if dispatch_count >= 2:
            return f"""## ⚠️ 重复调度警告

你已经调度 {agent_name} Agent {dispatch_count} 次了。

如果之前的调度没有返回有用的结果，请考虑：
1. 尝试调度其他 Agent（如 analysis 或 verification）
2. 使用 finish 操作结束审计并汇总已有发现
3. 提供更具体的任务描述

当前已收集的发现数量: {len(self._all_findings)}
"""
        
        self._dispatched_tasks[agent_name] = dispatch_count + 1
        
        # 🔥 设置父 Agent ID 并注册到注册表（动态 Agent 树）
        logger.debug(f"[Orchestrator] 准备调度 {agent_name} Agent, agent._registered={agent._registered}")
        agent.set_parent_id(self._agent_id)
        logger.debug(f"[Orchestrator] 设置 parent_id 完成，准备注册 {agent_name}")
        agent._register_to_registry(task=task)
        logger.debug(f"[Orchestrator] {agent_name} 注册完成，agent._registered={agent._registered}")
        
        await self.emit_event(
            "dispatch",
            f"📤 调度 {agent_name} Agent: {task[:100]}...",
            agent=agent_name,
            task=task,
        )
        
        self._tool_calls += 1
        
        try:
            # 🔥 构建子 Agent 输入 - 传递完整的运行时上下文
            project_info = self._runtime_context.get("project_info", {}).copy()
            # 确保 project_info 包含 root 路径
            if "root" not in project_info:
                project_info["root"] = self._runtime_context.get("project_root", ".")

            # 🔥 FIX: 构建完整的 previous_results，包含所有已执行 Agent 的结果
            previous_results = {
                "findings": self._all_findings,  # 传递已收集的发现
            }

            # 🔥 将之前 Agent 的完整结果传递给后续 Agent
            for prev_agent, prev_data in self._agent_results.items():
                previous_results[prev_agent] = {"data": prev_data}

            sub_input = {
                "task": task,
                "task_context": context,
                "project_info": project_info,
                "config": self._runtime_context.get("config", {}),
                "project_root": self._runtime_context.get("project_root", "."),
                "previous_results": previous_results,
            }

            # 🔥 执行子 Agent 前检查取消状态
            if self.is_cancelled:
                return f"## {agent_name} Agent 执行取消\n\n任务已被用户取消"

            # 🔥 执行子 Agent - 支持取消和超时
            # 设置子 Agent 超时（根据 Agent 类型）
            agent_timeouts = {
                "recon": 300,        # 5 分钟
                "analysis": 600,     # 10 分钟
                "verification": 600, # 10 分钟
            }
            timeout = agent_timeouts.get(agent_name, 300)

            async def run_with_cancel_check():
                """包装子 Agent 执行，定期检查取消状态"""
                run_task = asyncio.create_task(agent.run(sub_input))
                try:
                    while not run_task.done():
                        if self.is_cancelled:
                            # 🔥 传播取消到子 Agent
                            logger.info(f"[{self.name}] Cancelling sub-agent {agent_name} due to parent cancel")
                            if hasattr(agent, 'cancel'):
                                agent.cancel()
                            run_task.cancel()
                            try:
                                await run_task
                            except asyncio.CancelledError:
                                pass
                            raise asyncio.CancelledError("任务已取消")

                        # Use asyncio.wait to poll without cancelling the task
                        done, pending = await asyncio.wait(
                            [run_task],
                            timeout=0.5,
                            return_when=asyncio.FIRST_COMPLETED
                        )
                        if run_task in done:
                            return run_task.result()
                        # If not done, continue loop
                        continue

                    return await run_task
                except asyncio.CancelledError:
                    # 🔥 确保子任务被取消
                    if not run_task.done():
                        if hasattr(agent, 'cancel'):
                            agent.cancel()
                        run_task.cancel()
                        try:
                            await run_task
                        except asyncio.CancelledError:
                            pass
                    raise

            try:
                result = await asyncio.wait_for(
                    run_with_cancel_check(),
                    timeout=timeout
                )
            except asyncio.TimeoutError:
                logger.warning(f"[{self.name}] Sub-agent {agent_name} timed out after {timeout}s")
                return f"## {agent_name} Agent 执行超时\n\n子 Agent 执行超过 {timeout} 秒，已强制终止。请尝试更具体的任务或使用其他 Agent。"
            except asyncio.CancelledError:
                logger.info(f"[{self.name}] Sub-agent {agent_name} was cancelled")
                return f"## {agent_name} Agent 执行取消\n\n任务已被用户取消"

            # 🔥 执行后再次检查取消状态
            if self.is_cancelled:
                return f"## {agent_name} Agent 执行中断\n\n任务已被用户取消"

            # 🔥 处理子 Agent 结果 - 不同 Agent 返回不同的数据结构
            # 🔥 DEBUG: 添加诊断日志
            logger.info(f"[Orchestrator] Processing {agent_name} result: success={result.success}, data_type={type(result.data).__name__}, data_keys={list(result.data.keys()) if isinstance(result.data, dict) else 'N/A'}")

            if result.success and result.data:
                data = result.data

                # 🔥 FIX: 保存 Agent 的完整结果，供后续 Agent 使用
                self._agent_results[agent_name] = data
                logger.info(f"[Orchestrator] Saved {agent_name} result with keys: {list(data.keys())}")

                # 🔥 CRITICAL FIX: 收集发现 - 支持多种字段名
                # findings 字段通常来自 Analysis/Verification Agent
                # initial_findings 来自 Recon Agent
                raw_findings = data.get("findings", [])
                logger.info(f"[Orchestrator] {agent_name} returned data with {len(raw_findings)} findings in 'findings' field")

                # 🔥 ENHANCED: Also check for initial_findings (from Recon) - 改进逻辑
                # 即使 findings 为空列表，也检查 initial_findings
                if "initial_findings" in data:
                    initial = data.get("initial_findings", [])
                    logger.info(f"[Orchestrator] {agent_name} has {len(initial)} initial_findings, types: {[type(f).__name__ for f in initial[:3]]}")
                    for f in initial:
                        if isinstance(f, dict):
                            # 🔥 Normalize finding format - 处理 Recon 返回的格式
                            normalized = self._normalize_finding(f)
                            if normalized not in raw_findings:
                                raw_findings.append(normalized)
                                logger.info(f"[Orchestrator] Added dict finding from initial_findings")
                        elif isinstance(f, str) and f.strip():
                            # 🔥 FIX: Convert string finding to dict format instead of skipping
                            # Recon Agent 有时候会返回字符串格式的发现
                            # 尝试从字符串中提取文件路径（格式如 "app.py:36 - 描述"）
                            file_path = ""
                            line_start = 0
                            if ":" in f:
                                parts = f.split(":", 1)
                                potential_file = parts[0].strip()
                                # 检查是否像文件路径
                                if "." in potential_file and "/" not in potential_file[:3]:
                                    file_path = potential_file
                                    # 尝试提取行号
                                    if len(parts) > 1:
                                        remaining = parts[1].strip()
                                        line_match = remaining.split()[0] if remaining else ""
                                        if line_match.isdigit():
                                            line_start = int(line_match)

                            string_finding = {
                                "title": f[:100] if len(f) > 100 else f,
                                "description": f,
                                "file_path": file_path,
                                "line_start": line_start,
                                "severity": "medium",  # 默认中等严重度，Analysis 会重新评估
                                "vulnerability_type": "potential_issue",
                                "source": "recon",
                                "needs_verification": True,
                                "confidence": 0.5,  # 较低置信度，需要进一步分析
                            }
                            logger.info(f"[Orchestrator] Converted string finding to dict: {f[:80]}... (file={file_path}, line={line_start})")
                            raw_findings.append(string_finding)
                else:
                    logger.info(f"[Orchestrator] {agent_name} has no 'initial_findings' key in data")

                # 🔥 Also check high_risk_areas from Recon for potential findings
                if agent_name == "recon" and "high_risk_areas" in data:
                    high_risk = data.get("high_risk_areas", [])
                    logger.info(f"[Orchestrator] {agent_name} identified {len(high_risk)} high risk areas")
                    # 🔥 FIX: 将 high_risk_areas 也转换为发现
                    for area in high_risk:
                        if isinstance(area, str) and area.strip():
                            # 尝试从描述中提取文件路径和漏洞类型
                            file_path = ""
                            line_start = 0
                            vuln_type = "potential_issue"

                            # 🔥 FIX: 改进文件路径提取逻辑
                            # 格式1: "file.py:36 - 描述" -> 提取 file.py 和 36
                            # 格式2: "描述性文本" -> 不提取文件路径
                            if ":" in area:
                                parts = area.split(":", 1)
                                potential_file = parts[0].strip()
                                # 只有当 parts[0] 看起来像文件路径时才提取
                                # 文件路径通常包含 . 且没有空格（或只在结尾有扩展名）
                                if ("." in potential_file and
                                    " " not in potential_file and
                                    len(potential_file) < 100 and
                                    any(potential_file.endswith(ext) for ext in ['.py', '.js', '.ts', '.java', '.go', '.php', '.rb', '.c', '.cpp', '.h'])):
                                    file_path = potential_file
                                    # 尝试提取行号
                                    if len(parts) > 1:
                                        remaining = parts[1].strip()
                                        line_match = remaining.split()[0] if remaining else ""
                                        if line_match.isdigit():
                                            line_start = int(line_match)

                            # 推断漏洞类型
                            area_lower = area.lower()
                            if "command" in area_lower or "命令" in area_lower or "subprocess" in area_lower:
                                vuln_type = "command_injection"
                            elif "sql" in area_lower:
                                vuln_type = "sql_injection"
                            elif "xss" in area_lower:
                                vuln_type = "xss"
                            elif "path" in area_lower or "traversal" in area_lower or "路径" in area_lower:
                                vuln_type = "path_traversal"
                            elif "ssrf" in area_lower:
                                vuln_type = "ssrf"
                            elif "secret" in area_lower or "密钥" in area_lower or "key" in area_lower:
                                vuln_type = "hardcoded_secret"

                            high_risk_finding = {
                                "title": area[:100] if len(area) > 100 else area,
                                "description": area,
                                "file_path": file_path,
                                "line_start": line_start,
                                "severity": "high",  # 高风险区域默认高严重度
                                "vulnerability_type": vuln_type,
                                "source": "recon_high_risk",
                                "needs_verification": True,
                                "confidence": 0.6,
                            }
                            raw_findings.append(high_risk_finding)
                            logger.info(f"[Orchestrator] Converted high_risk_area to finding: {area[:60]}... (file={file_path}, type={vuln_type})")

                # 🔥 初始化 valid_findings，确保后续代码可以访问
                valid_findings = []

                if raw_findings:
                    # 只添加字典格式的发现
                    valid_findings = [f for f in raw_findings if isinstance(f, dict)]

                    logger.info(f"[Orchestrator] {agent_name} returned {len(valid_findings)} valid findings")

                    # 🔥 ENHANCED: Merge findings with better deduplication
                    for new_f in valid_findings:
                        # Normalize the finding first
                        normalized_new = self._normalize_finding(new_f)
                        
                        # 🔥 FIX: Skip if normalization returned None (e.g., file path validation failed)
                        if normalized_new is None:
                            logger.debug(f"[Orchestrator] Skipping invalid finding: {new_f.get('title', 'N/A')[:50]}")
                            continue

                        # Create fingerprint for deduplication (file + description similarity)
                        new_file = normalized_new.get("file_path", "").lower().strip()
                        new_desc = (normalized_new.get("description", "") or "").lower()[:100]
                        new_type = (normalized_new.get("vulnerability_type", "") or "").lower()
                        new_line = normalized_new.get("line_start") or normalized_new.get("line", 0)

                        # Check if exists (more flexible matching)
                        found = False
                        for i, existing_f in enumerate(self._all_findings):
                            existing_file = (existing_f.get("file_path", "") or existing_f.get("file", "")).lower().strip()
                            existing_desc = (existing_f.get("description", "") or "").lower()[:100]
                            existing_type = (existing_f.get("vulnerability_type", "") or existing_f.get("type", "")).lower()
                            existing_line = existing_f.get("line_start") or existing_f.get("line", 0)

                            # Match if same file AND (same line OR similar description OR same vulnerability type)
                            same_file = new_file and existing_file and (
                                new_file == existing_file or
                                new_file.endswith(existing_file) or
                                existing_file.endswith(new_file)
                            )
                            same_line = new_line and existing_line and new_line == existing_line
                            similar_desc = new_desc and existing_desc and (
                                new_desc in existing_desc or existing_desc in new_desc
                            )
                            same_type = new_type and existing_type and (
                                new_type == existing_type or
                                (new_type in existing_type) or (existing_type in new_type)
                            )

                            if same_file and (same_line or similar_desc or same_type):
                                # Update existing with new info (e.g. verification results)
                                # 🔥 FIX: Smart merge - don't overwrite good data with empty values
                                merged = dict(existing_f)  # Start with existing data
                                for key, value in normalized_new.items():
                                    # Only overwrite if new value is meaningful
                                    if value is not None and value != "" and value != 0:
                                        merged[key] = value
                                    elif key not in merged or merged[key] is None:
                                        # Fill in missing fields even with empty values
                                        merged[key] = value

                                # Keep the better title
                                if normalized_new.get("title") and len(normalized_new.get("title", "")) > len(existing_f.get("title", "")):
                                    merged["title"] = normalized_new["title"]
                                # Keep verified status if either is verified
                                if existing_f.get("is_verified") or normalized_new.get("is_verified"):
                                    merged["is_verified"] = True
                                # 🔥 FIX: Preserve non-zero line numbers
                                if existing_f.get("line_start") and not normalized_new.get("line_start"):
                                    merged["line_start"] = existing_f["line_start"]
                                # 🔥 FIX: Preserve vulnerability_type
                                if existing_f.get("vulnerability_type") and not normalized_new.get("vulnerability_type"):
                                    merged["vulnerability_type"] = existing_f["vulnerability_type"]

                                self._all_findings[i] = merged
                                found = True
                                logger.info(f"[Orchestrator] Merged finding: {new_file}:{merged.get('line_start', 0)} ({merged.get('vulnerability_type', '')})")
                                break

                        if not found:
                            self._all_findings.append(normalized_new)
                            logger.info(f"[Orchestrator] Added new finding: {new_file}:{new_line} ({new_type})")

                    logger.info(f"[Orchestrator] Total findings now: {len(self._all_findings)}")
                else:
                    logger.info(f"[Orchestrator] {agent_name} returned no findings")
                
                await self.emit_event(
                    "dispatch_complete",
                    f"✅ {agent_name} Agent 完成",
                    agent=agent_name,
                    findings_count=len(self._all_findings),  # 🔥 Use total findings count
                )
                
                # 🔥 根据 Agent 类型构建不同的观察结果
                if agent_name == "recon":
                    # Recon Agent 返回项目信息
                    observation = f"""## Recon Agent 执行结果

**状态**: 成功
**迭代次数**: {result.iterations}
**耗时**: {result.duration_ms}ms

### 项目结构
{json.dumps(data.get('project_structure', {}), ensure_ascii=False, indent=2)}

### 技术栈
- 语言: {data.get('tech_stack', {}).get('languages', [])}
- 框架: {data.get('tech_stack', {}).get('frameworks', [])}
- 数据库: {data.get('tech_stack', {}).get('databases', [])}

### 入口点 ({len(data.get('entry_points', []))} 个)
"""
                    for i, ep in enumerate(data.get('entry_points', [])[:10]):
                        if isinstance(ep, dict):
                            observation += f"{i+1}. [{ep.get('type', 'unknown')}] {ep.get('file', '')}:{ep.get('line', '')}\n"
                    
                    observation += f"""
### 高风险区域
{data.get('high_risk_areas', [])}

### 初步发现 ({len(data.get('initial_findings', []))} 个)
"""
                    for finding in data.get('initial_findings', [])[:5]:
                        if isinstance(finding, str):
                            observation += f"- {finding}\n"
                        elif isinstance(finding, dict):
                            observation += f"- {finding.get('title', finding)}\n"
                    
                else:
                    # Analysis/Verification Agent 返回漏洞发现
                    observation = f"""## {agent_name} Agent 执行结果

**状态**: 成功
**发现数量**: {len(valid_findings)}
**迭代次数**: {result.iterations}
**耗时**: {result.duration_ms}ms

### 发现摘要
"""
                    for i, f in enumerate(valid_findings[:10]):
                        if not isinstance(f, dict):
                            continue
                        observation += f"""
{i+1}. [{f.get('severity', 'unknown')}] {f.get('title', 'Unknown')}
   - 类型: {f.get('vulnerability_type', 'unknown')}
   - 文件: {f.get('file_path', 'unknown')}
   - 描述: {f.get('description', '')[:200]}...
"""

                    if len(valid_findings) > 10:
                        observation += f"\n... 还有 {len(valid_findings) - 10} 个发现"
                
                if data.get("summary"):
                    observation += f"\n\n### Agent 总结\n{data['summary']}"
                
                return observation
            else:
                return f"## {agent_name} Agent 执行失败\n\n错误: {result.error}"
                
        except Exception as e:
            logger.error(f"Sub-agent dispatch failed: {e}", exc_info=True)
            return f"## 调度失败\n\n错误: {str(e)}"

    def _validate_file_path(self, file_path: str) -> bool:
        """
        🔥 v2.1: 验证文件路径是否真实存在

        Args:
            file_path: 相对或绝对文件路径（可能包含行号，如 "app.py:36"）

        Returns:
            bool: 文件是否存在
        """
        if not file_path or not file_path.strip():
            return False

        # 获取项目根目录
        project_root = self._runtime_context.get("project_root", "")
        if not project_root:
            # 没有项目根目录时，无法验证，返回 True 以避免误判
            return True

        # 清理路径（移除可能的行号）
        clean_path = file_path.split(":")[0].strip() if ":" in file_path else file_path.strip()

        # 尝试相对路径
        full_path = os.path.join(project_root, clean_path)
        if os.path.isfile(full_path):
            return True

        # 尝试绝对路径
        if os.path.isabs(clean_path) and os.path.isfile(clean_path):
            return True

        return False

    def _normalize_finding(self, finding: Dict[str, Any]) -> Optional[Dict[str, Any]]:
        """
        标准化发现格式

        不同 Agent 可能返回不同格式的发现，这个方法将它们标准化为统一格式

        🔥 v2.1: 添加文件路径验证，返回 None 表示发现无效（幻觉）
        """
        normalized = dict(finding)  # 复制原始数据

        # 🔥 处理 location 字段 -> file_path + line_start
        if "location" in normalized and "file_path" not in normalized:
            location = normalized["location"]
            if isinstance(location, str) and ":" in location:
                parts = location.split(":")
                normalized["file_path"] = parts[0]
                try:
                    normalized["line_start"] = int(parts[1])
                except (ValueError, IndexError):
                    pass
            elif isinstance(location, str):
                normalized["file_path"] = location

        # 🔥 处理 file 字段 -> file_path
        if "file" in normalized and "file_path" not in normalized:
            normalized["file_path"] = normalized["file"]

        # 🔥 处理 line 字段 -> line_start
        if "line" in normalized and "line_start" not in normalized:
            normalized["line_start"] = normalized["line"]

        # 🔥 处理 type 字段 -> vulnerability_type
        if "type" in normalized and "vulnerability_type" not in normalized:
            # 不是所有 type 都是漏洞类型，比如 "Vulnerability" 只是标记
            type_val = normalized["type"]
            if type_val and type_val.lower() not in ["vulnerability", "finding", "issue"]:
                normalized["vulnerability_type"] = type_val
            elif "description" in normalized:
                # 尝试从描述中推断漏洞类型
                desc = normalized["description"].lower()
                if "command injection" in desc or "rce" in desc or "system(" in desc:
                    normalized["vulnerability_type"] = "command_injection"
                elif "sql injection" in desc or "sqli" in desc:
                    normalized["vulnerability_type"] = "sql_injection"
                elif "xss" in desc or "cross-site scripting" in desc:
                    normalized["vulnerability_type"] = "xss"
                elif "path traversal" in desc or "directory traversal" in desc:
                    normalized["vulnerability_type"] = "path_traversal"
                elif "ssrf" in desc:
                    normalized["vulnerability_type"] = "ssrf"
                elif "xxe" in desc:
                    normalized["vulnerability_type"] = "xxe"
                else:
                    normalized["vulnerability_type"] = "other"

        # 🔥 确保 severity 字段存在且为小写
        if "severity" in normalized:
            normalized["severity"] = str(normalized["severity"]).lower()
        else:
            normalized["severity"] = "medium"

        # 🔥 处理 risk 字段 -> severity
        if "risk" in normalized and "severity" not in normalized:
            normalized["severity"] = str(normalized["risk"]).lower()

        # 🔥 生成 title 如果不存在
        if "title" not in normalized:
            vuln_type = normalized.get("vulnerability_type", "Unknown")
            file_path = normalized.get("file_path", "")
            if file_path:
                import os
                normalized["title"] = f"{vuln_type.replace('_', ' ').title()} in {os.path.basename(file_path)}"
            else:
                normalized["title"] = f"{vuln_type.replace('_', ' ').title()} Vulnerability"

        # 🔥 处理 code 字段 -> code_snippet
        if "code" in normalized and "code_snippet" not in normalized:
            normalized["code_snippet"] = normalized["code"]

        # 🔥 处理 recommendation -> suggestion
        if "recommendation" in normalized and "suggestion" not in normalized:
            normalized["suggestion"] = normalized["recommendation"]

        # 🔥 处理 impact -> 添加到 description
        if "impact" in normalized and normalized.get("description"):
            if "impact" not in normalized["description"].lower():
                normalized["description"] += f"\n\nImpact: {normalized['impact']}"

        # 🔥 v2.1: 验证文件路径存在性
        file_path = normalized.get("file_path", "")
        if file_path and not self._validate_file_path(file_path):
            logger.warning(
                f"[Orchestrator] 🚫 过滤幻觉发现: 文件不存在 '{file_path}' "
                f"(title: {normalized.get('title', 'N/A')[:50]})"
            )
            return None  # 返回 None 表示发现无效

        return normalized

    def _summarize_findings(self) -> str:
        """汇总当前发现"""
        if not self._all_findings:
            return "目前还没有发现任何漏洞。"
        
        # 统计
        severity_counts = {"critical": 0, "high": 0, "medium": 0, "low": 0}
        type_counts = {}
        
        for f in self._all_findings:
            if not isinstance(f, dict):
                continue
                
            sev = f.get("severity", "low")
            severity_counts[sev] = severity_counts.get(sev, 0) + 1
            
            vtype = f.get("vulnerability_type", "other")
            type_counts[vtype] = type_counts.get(vtype, 0) + 1
        
        summary = f"""## 当前发现汇总

**总计**: {len(self._all_findings)} 个漏洞

### 严重程度分布
- Critical: {severity_counts['critical']}
- High: {severity_counts['high']}
- Medium: {severity_counts['medium']}
- Low: {severity_counts['low']}

### 漏洞类型分布
"""
        for vtype, count in type_counts.items():
            summary += f"- {vtype}: {count}\n"
        
        summary += "\n### 详细列表\n"
        for i, f in enumerate(self._all_findings):
            if isinstance(f, dict):
                summary += f"{i+1}. [{f.get('severity')}] {f.get('title')} ({f.get('file_path')})\n"
        
        return summary
    
    def _generate_default_summary(self) -> Dict[str, Any]:
        """生成默认摘要"""
        severity_counts = {"critical": 0, "high": 0, "medium": 0, "low": 0}
        
        for f in self._all_findings:
            if isinstance(f, dict):
                sev = f.get("severity", "low")
                severity_counts[sev] = severity_counts.get(sev, 0) + 1
        
        return {
            "total_findings": len(self._all_findings),
            "severity_distribution": severity_counts,
            "conclusion": "审计完成（未通过 LLM 生成结论）",
        }
    
    def get_conversation_history(self) -> List[Dict[str, str]]:
        """Return the conversation history held by this agent.

        The stored list object itself is returned, not a copy.
        """
        history = self._conversation_history
        return history
    
    def get_steps(self) -> List[AgentStep]:
        """Return the execution steps recorded by this agent.

        The stored list object itself is returned, not a copy.
        """
        recorded_steps = self._steps
        return recorded_steps
-												feat(agent): implement Agent audit module with LangGraph integration

- Introduce new Agent audit functionality for autonomous code security analysis and vulnerability verification.
- Add API endpoints for managing Agent tasks and configurations.
- Implement UI components for Agent mode selection and embedding model configuration.
- Enhance the overall architecture with a focus on RAG (Retrieval-Augmented Generation) for improved code semantic search.
- Create a sandbox environment for secure execution of vulnerability tests.
- Update documentation to include details on the new Agent audit features and usage instructions.

											
										
										
											2025-12-11 19:09:10 +08:00
+								"""
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								Orchestrator Agent (编排层) - LLM 驱动版
-												feat(agent): implement Agent audit module with LangGraph integration

- Introduce new Agent audit functionality for autonomous code security analysis and vulnerability verification.
- Add API endpoints for managing Agent tasks and configurations.
- Implement UI components for Agent mode selection and embedding model configuration.
- Enhance the overall architecture with a focus on RAG (Retrieval-Augmented Generation) for improved code semantic search.
- Create a sandbox environment for secure execution of vulnerability tests.
- Update documentation to include details on the new Agent audit features and usage instructions.

											
										
										
											2025-12-11 19:09:10 +08:00
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								LLM 是真正的大脑，全程参与决策！
 								- LLM 决定下一步做什么
 								- LLM 决定调度哪个子 Agent
 								- LLM 决定何时完成
 								- LLM 根据中间结果动态调整策略
 								类型: Autonomous Agent with Dynamic Planning
-												feat(agent): implement Agent audit module with LangGraph integration

- Introduce new Agent audit functionality for autonomous code security analysis and vulnerability verification.
- Add API endpoints for managing Agent tasks and configurations.
- Implement UI components for Agent mode selection and embedding model configuration.
- Enhance the overall architecture with a focus on RAG (Retrieval-Augmented Generation) for improved code semantic search.
- Create a sandbox environment for secure execution of vulnerability tests.
- Update documentation to include details on the new Agent audit features and usage instructions.

											
										
										
											2025-12-11 19:09:10 +08:00
+								"""
 								import asyncio
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								import json
-												feat(agent): implement Agent audit module with LangGraph integration

- Introduce new Agent audit functionality for autonomous code security analysis and vulnerability verification.
- Add API endpoints for managing Agent tasks and configurations.
- Implement UI components for Agent mode selection and embedding model configuration.
- Enhance the overall architecture with a focus on RAG (Retrieval-Augmented Generation) for improved code semantic search.
- Create a sandbox environment for secure execution of vulnerability tests.
- Update documentation to include details on the new Agent audit features and usage instructions.

											
										
										
											2025-12-11 19:09:10 +08:00
+								import logging
-												feat(agent): 增强文件路径验证防止幻觉报告

添加文件路径验证规则和检查逻辑，确保漏洞报告中的文件真实存在
移除LLM响应中的Markdown格式标记，统一解析处理
更新报告工具和端点以支持项目根目录验证

											
										
										
											2025-12-19 19:08:36 +08:00
+								import os
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								import re
-												feat(agent): implement Agent audit module with LangGraph integration

- Introduce new Agent audit functionality for autonomous code security analysis and vulnerability verification.
- Add API endpoints for managing Agent tasks and configurations.
- Implement UI components for Agent mode selection and embedding model configuration.
- Enhance the overall architecture with a focus on RAG (Retrieval-Augmented Generation) for improved code semantic search.
- Create a sandbox environment for secure execution of vulnerability tests.
- Update documentation to include details on the new Agent audit features and usage instructions.

											
										
										
											2025-12-11 19:09:10 +08:00
+								from typing import List, Dict, Any, Optional
 								from dataclasses import dataclass
 								from .base import BaseAgent, AgentConfig, AgentResult, AgentType, AgentPattern
-												feat: Introduce structured agent collaboration with `TaskHandoff` and `analysis_v2` agent, updating core agent logic, tools, and audit UI.

											
										
										
											2025-12-11 23:29:04 +08:00
+								from ..json_parser import AgentJsonParser
-												feat: 新增安全工具集成和漏洞知识库扩展

- 添加 Bandit 和 Safety 安全工具到依赖项
- 新增 CSRF、业务逻辑和开放重定向漏洞知识文档
- 实现安全工具一键安装脚本和文档
- 改进模式匹配工具支持直接文件扫描
- 增强遥测模块和 Agent 审计功能
- 修复验证节点中 findings 合并逻辑
- 优化前端 Agent 审计界面和状态展示

											
										
										
											2025-12-13 12:35:03 +08:00
+								from ..prompts import MULTI_AGENT_RULES, CORE_SECURITY_PRINCIPLES
-												feat(agent): implement Agent audit module with LangGraph integration

- Introduce new Agent audit functionality for autonomous code security analysis and vulnerability verification.
- Add API endpoints for managing Agent tasks and configurations.
- Implement UI components for Agent mode selection and embedding model configuration.
- Enhance the overall architecture with a focus on RAG (Retrieval-Augmented Generation) for improved code semantic search.
- Create a sandbox environment for secure execution of vulnerability tests.
- Update documentation to include details on the new Agent audit features and usage instructions.

											
										
										
											2025-12-11 19:09:10 +08:00
 								logger = logging.getLogger(__name__)
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								ORCHESTRATOR_SYSTEM_PROMPT = """你是 DeepAudit 的编排 Agent，负责**自主**协调整个安全审计流程。
 								## 你的角色
 								你是整个审计流程的**大脑**，不是一个机械执行者。你需要：
 . 自主思考和决策
 . 根据观察结果动态调整策略
 . 决定何时调用哪个子 Agent
 . 判断何时审计完成
 								## 你可以调度的子 Agent
 . **recon**: 信息收集 Agent - 分析项目结构、技术栈、入口点
 . **analysis**: 分析 Agent - 深度代码审计、漏洞检测
 . **verification**: 验证 Agent - 验证发现的漏洞、生成 PoC
 								## 你可以使用的操作
 								### 1. 调度子 Agent
 								```
 								Action: dispatch_agent
 								Action Input: {"agent": "recon|analysis|verification", "task": "具体任务描述", "context": "任务上下文"}
 								```
 								### 2. 汇总发现
 								```
 								Action: summarize
 								Action Input: {"findings": [...], "analysis": "你的分析"}
 								```
 								### 3. 完成审计
 								```
 								Action: finish
 								Action Input: {"conclusion": "审计结论", "findings": [...], "recommendations": [...]}
 								```
 								## 工作方式
 								每一步，你需要：
 . **Thought**: 分析当前状态，思考下一步应该做什么
 								   - 目前收集到了什么信息？
 								   - 还需要了解什么？
 								   - 应该深入分析哪些地方？
 								   - 有什么发现需要验证？
 . **Action**: 选择一个操作
 . **Action Input**: 提供操作参数
-												feat(agent): implement Agent audit module with LangGraph integration

- Introduce new Agent audit functionality for autonomous code security analysis and vulnerability verification.
- Add API endpoints for managing Agent tasks and configurations.
- Implement UI components for Agent mode selection and embedding model configuration.
- Enhance the overall architecture with a focus on RAG (Retrieval-Augmented Generation) for improved code semantic search.
- Create a sandbox environment for secure execution of vulnerability tests.
- Update documentation to include details on the new Agent audit features and usage instructions.

											
										
										
											2025-12-11 19:09:10 +08:00
 								## 输出格式
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								每一步必须严格按照以下格式：
-												feat(agent): implement Agent audit module with LangGraph integration

- Introduce new Agent audit functionality for autonomous code security analysis and vulnerability verification.
- Add API endpoints for managing Agent tasks and configurations.
- Implement UI components for Agent mode selection and embedding model configuration.
- Enhance the overall architecture with a focus on RAG (Retrieval-Augmented Generation) for improved code semantic search.
- Create a sandbox environment for secure execution of vulnerability tests.
- Update documentation to include details on the new Agent audit features and usage instructions.

											
										
										
											2025-12-11 19:09:10 +08:00
+								```
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								Thought: [你的思考过程]
 								Action: [dispatch_agent|summarize|finish]
 								Action Input: [JSON 参数]
 								```
 								## 审计策略建议
-												feat(agent): implement comprehensive agent architecture with knowledge base and persistence layer

- Add database migrations for agent checkpoints and tree node tracking
- Implement core agent execution framework with executor, state management, and message handling
- Create knowledge base system with framework-specific modules (Django, FastAPI, Flask, Express, React, Supabase)
- Add vulnerability knowledge modules covering authentication, cryptography, injection, XSS, XXE, SSRF, path traversal, deserialization, and race conditions
- Introduce new agent tools: thinking tool, reporting tool, and agent-specific utilities
- Implement LLM memory compression and prompt caching for improved performance
- Add agent registry and persistence layer for checkpoint management
- Refactor agent implementations (analysis, recon, verification, orchestrator) with enhanced capabilities
- Remove legacy agent implementations (analysis_v2, react_agent)
- Update API endpoints for agent task creation and project management
- Add frontend components for agent task creation and enhanced audit UI
- Consolidate agent service architecture with improved separation of concerns
- This refactoring provides a scalable foundation for multi-agent collaboration with knowledge-driven decision making and state persistence

											
										
										
											2025-12-12 15:27:12 +08:00
+								- 先用 recon Agent 了解项目全貌（只需调度一次）
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								- 根据 recon 结果，让 analysis Agent 重点审计高风险区域
 								- 发现可疑漏洞后，用 verification Agent 验证
 								- 随时根据新发现调整策略，不要机械执行
 								- 当你认为审计足够全面时，选择 finish
 								## 重要原则
 								1. **你是大脑，不是执行器** - 每一步都要思考
 								2. **动态调整** - 根据发现调整策略
 								3. **主动决策** - 不要等待，主动推进
 								4. **质量优先** - 宁可深入分析几个真实漏洞，不要浅尝辄止
-												feat(agent): implement comprehensive agent architecture with knowledge base and persistence layer

- Add database migrations for agent checkpoints and tree node tracking
- Implement core agent execution framework with executor, state management, and message handling
- Create knowledge base system with framework-specific modules (Django, FastAPI, Flask, Express, React, Supabase)
- Add vulnerability knowledge modules covering authentication, cryptography, injection, XSS, XXE, SSRF, path traversal, deserialization, and race conditions
- Introduce new agent tools: thinking tool, reporting tool, and agent-specific utilities
- Implement LLM memory compression and prompt caching for improved performance
- Add agent registry and persistence layer for checkpoint management
- Refactor agent implementations (analysis, recon, verification, orchestrator) with enhanced capabilities
- Remove legacy agent implementations (analysis_v2, react_agent)
- Update API endpoints for agent task creation and project management
- Add frontend components for agent task creation and enhanced audit UI
- Consolidate agent service architecture with improved separation of concerns
- This refactoring provides a scalable foundation for multi-agent collaboration with knowledge-driven decision making and state persistence

											
										
										
											2025-12-12 15:27:12 +08:00
+								5. **避免重复** - 每个 Agent 通常只需要调度一次，如果结果不理想，尝试其他 Agent 或直接完成审计
 								## 处理子 Agent 结果
 								- 子 Agent 返回的 Observation 包含它们的分析结果
 								- 即使结果看起来不完整，也要基于已有信息继续推进
 								- 不要反复调度同一个 Agent 期望得到不同结果
 								- 如果 recon 完成后，应该调度 analysis 进行深度分析
 								- 如果 analysis 完成后有发现，可以调度 verification 验证
 								- 如果没有更多工作要做，使用 finish 结束审计
-												feat(agent): implement Agent audit module with LangGraph integration

- Introduce new Agent audit functionality for autonomous code security analysis and vulnerability verification.
- Add API endpoints for managing Agent tasks and configurations.
- Implement UI components for Agent mode selection and embedding model configuration.
- Enhance the overall architecture with a focus on RAG (Retrieval-Augmented Generation) for improved code semantic search.
- Create a sandbox environment for secure execution of vulnerability tests.
- Update documentation to include details on the new Agent audit features and usage instructions.

											
										
										
											2025-12-11 19:09:10 +08:00
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								现在，基于项目信息开始你的审计工作！"""
 								@dataclass
 								class AgentStep:
 								    """Execution step: one Thought / Action / Observation record of the orchestrator."""
 								    # Reasoning text for this step (the `Thought:` section of the prompt format).
 								    thought: str
 								    # Name of the chosen operation; the system prompt lists
 								    # dispatch_agent, summarize and finish.
 								    action: str
 								    # Parameters of the action (the `Action Input:` JSON of the prompt format).
 								    # NOTE(review): presumably already parsed into a dict by the caller - confirm.
 								    action_input: Dict[str, Any]
 								    # Observation text attached to the step; defaults to None.
 								    observation: Optional[str] = None
 								    # Result of a sub-agent associated with this step; defaults to None.
 								    # NOTE(review): where this gets populated is outside this chunk - confirm.
 								    sub_agent_result: Optional[AgentResult] = None
-												feat(agent): implement Agent audit module with LangGraph integration

- Introduce new Agent audit functionality for autonomous code security analysis and vulnerability verification.
- Add API endpoints for managing Agent tasks and configurations.
- Implement UI components for Agent mode selection and embedding model configuration.
- Enhance the overall architecture with a focus on RAG (Retrieval-Augmented Generation) for improved code semantic search.
- Create a sandbox environment for secure execution of vulnerability tests.
- Update documentation to include details on the new Agent audit features and usage instructions.

											
										
										
											2025-12-11 19:09:10 +08:00
 								class OrchestratorAgent(BaseAgent):
 								    """
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								    编排 Agent - LLM 驱动版
-												feat(agent): implement Agent audit module with LangGraph integration

- Introduce new Agent audit functionality for autonomous code security analysis and vulnerability verification.
- Add API endpoints for managing Agent tasks and configurations.
- Implement UI components for Agent mode selection and embedding model configuration.
- Enhance the overall architecture with a focus on RAG (Retrieval-Augmented Generation) for improved code semantic search.
- Create a sandbox environment for secure execution of vulnerability tests.
- Update documentation to include details on the new Agent audit features and usage instructions.

											
										
										
											2025-12-11 19:09:10 +08:00
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								    LLM 全程参与决策：
 								    1. LLM 思考当前状态
 								    2. LLM 决定下一步操作
 								    3. 执行操作，获取结果
 								    4. LLM 分析结果，决定下一步
 								    5. 重复直到 LLM 决定完成
-												feat(agent): implement Agent audit module with LangGraph integration

- Introduce new Agent audit functionality for autonomous code security analysis and vulnerability verification.
- Add API endpoints for managing Agent tasks and configurations.
- Implement UI components for Agent mode selection and embedding model configuration.
- Enhance the overall architecture with a focus on RAG (Retrieval-Augmented Generation) for improved code semantic search.
- Create a sandbox environment for secure execution of vulnerability tests.
- Update documentation to include details on the new Agent audit features and usage instructions.

											
										
										
											2025-12-11 19:09:10 +08:00
+								    """
 								    def __init__(
 								        self,
 								        llm_service,
 								        tools: Dict[str, Any],
 								        event_emitter=None,
 								        sub_agents: Optional[Dict[str, BaseAgent]] = None,
 								        tracer=None,
 								    ):
 								        """Configure the orchestrator and initialise its per-run bookkeeping.

 								        Args:
 								            llm_service: Forwarded unchanged to ``BaseAgent.__init__``.
 								            tools: Forwarded unchanged to ``BaseAgent.__init__``.
 								            event_emitter: Forwarded unchanged to ``BaseAgent.__init__``.
 								            sub_agents: Initial name -> agent mapping. Any falsy value
 								                (``None`` or an empty mapping) is replaced by a fresh dict.
 								            tracer: Optional telemetry tracer, stored on ``self.tracer``.
 								        """
 								        # Enhanced system prompt: the orchestrator prompt followed by the core
 								        # security principles and the multi-agent collaboration rules.
 								        full_system_prompt = f"{ORCHESTRATOR_SYSTEM_PROMPT}\n\n{CORE_SECURITY_PRINCIPLES}\n\n{MULTI_AGENT_RULES}"

 								        super().__init__(
 								            AgentConfig(
 								                name="Orchestrator",
 								                agent_type=AgentType.ORCHESTRATOR,
 								                pattern=AgentPattern.REACT,  # the orchestrator uses the ReAct pattern
 								                max_iterations=20,
 								                system_prompt=full_system_prompt,
 								            ),
 								            llm_service,
 								            tools,
 								            event_emitter,
 								        )

 								        # Collaborators.
 								        self.sub_agents = sub_agents if sub_agents else {}
 								        self.tracer = tracer  # telemetry support

 								        # State of the LLM-driven loop.
 								        self._conversation_history: List[Dict[str, str]] = []
 								        self._steps: List[AgentStep] = []
 								        self._all_findings: List[Dict] = []

 								        # Runtime context that is handed on to sub-agents.
 								        self._runtime_context: Dict[str, Any] = {}

 								        # Dispatch counter per agent name, kept to avoid repeated dispatching.
 								        self._dispatched_tasks: Dict[str, int] = {}

 								        # Full result data per agent name, kept so later agents can receive it.
 								        self._agent_results: Dict[str, Dict[str, Any]] = {}
-												feat(agent): implement Agent audit module with LangGraph integration

- Introduce new Agent audit functionality for autonomous code security analysis and vulnerability verification.
- Add API endpoints for managing Agent tasks and configurations.
- Implement UI components for Agent mode selection and embedding model configuration.
- Enhance the overall architecture with a focus on RAG (Retrieval-Augmented Generation) for improved code semantic search.
- Create a sandbox environment for secure execution of vulnerability tests.
- Update documentation to include details on the new Agent audit features and usage instructions.

											
										
										
											2025-12-11 19:09:10 +08:00
 								    def register_sub_agent(self, name: str, agent: BaseAgent):
 								        """Register ``agent`` as a sub-agent under the key ``name``.

 								        An entry already stored under the same name is overwritten.
 								        """
 								        registry = self.sub_agents
 								        registry[name] = agent
-												feat(agent): implement comprehensive agent architecture with knowledge base and persistence layer

- Add database migrations for agent checkpoints and tree node tracking
- Implement core agent execution framework with executor, state management, and message handling
- Create knowledge base system with framework-specific modules (Django, FastAPI, Flask, Express, React, Supabase)
- Add vulnerability knowledge modules covering authentication, cryptography, injection, XSS, XXE, SSRF, path traversal, deserialization, and race conditions
- Introduce new agent tools: thinking tool, reporting tool, and agent-specific utilities
- Implement LLM memory compression and prompt caching for improved performance
- Add agent registry and persistence layer for checkpoint management
- Refactor agent implementations (analysis, recon, verification, orchestrator) with enhanced capabilities
- Remove legacy agent implementations (analysis_v2, react_agent)
- Update API endpoints for agent task creation and project management
- Add frontend components for agent task creation and enhanced audit UI
- Consolidate agent service architecture with improved separation of concerns
- This refactoring provides a scalable foundation for multi-agent collaboration with knowledge-driven decision making and state persistence

											
										
										
											2025-12-12 15:27:12 +08:00
+								    def cancel(self):
 								        """
 								        取消执行 - 同时取消所有子 Agent
 								        重写父类方法，确保取消信号传播到所有子 Agent
 								        """
 								        self._cancelled = True
 								        logger.info(f"[{self.name}] Cancel requested, propagating to {len(self.sub_agents)} sub-agents")
 								        # 🔥 传播取消信号到所有子 Agent
 								        for name, agent in self.sub_agents.items():
 								            if hasattr(agent, 'cancel'):
 								                agent.cancel()
 								                logger.info(f"[{self.name}] Cancelled sub-agent: {name}")
-												feat(agent): implement Agent audit module with LangGraph integration

- Introduce new Agent audit functionality for autonomous code security analysis and vulnerability verification.
- Add API endpoints for managing Agent tasks and configurations.
- Implement UI components for Agent mode selection and embedding model configuration.
- Enhance the overall architecture with a focus on RAG (Retrieval-Augmented Generation) for improved code semantic search.
- Create a sandbox environment for secure execution of vulnerability tests.
- Update documentation to include details on the new Agent audit features and usage instructions.

											
										
										
											2025-12-11 19:09:10 +08:00
+								    async def run(self, input_data: Dict[str, Any]) -> AgentResult:
 								        """
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								        执行编排任务 - LLM 全程参与！
-												feat(agent): implement Agent audit module with LangGraph integration

- Introduce new Agent audit functionality for autonomous code security analysis and vulnerability verification.
- Add API endpoints for managing Agent tasks and configurations.
- Implement UI components for Agent mode selection and embedding model configuration.
- Enhance the overall architecture with a focus on RAG (Retrieval-Augmented Generation) for improved code semantic search.
- Create a sandbox environment for secure execution of vulnerability tests.
- Update documentation to include details on the new Agent audit features and usage instructions.

											
										
										
											2025-12-11 19:09:10 +08:00
 								        Args:
 								            input_data: {
 								                "project_info": 项目信息,
 								                "config": 审计配置,
-												feat(agent): implement comprehensive agent architecture with knowledge base and persistence layer

- Add database migrations for agent checkpoints and tree node tracking
- Implement core agent execution framework with executor, state management, and message handling
- Create knowledge base system with framework-specific modules (Django, FastAPI, Flask, Express, React, Supabase)
- Add vulnerability knowledge modules covering authentication, cryptography, injection, XSS, XXE, SSRF, path traversal, deserialization, and race conditions
- Introduce new agent tools: thinking tool, reporting tool, and agent-specific utilities
- Implement LLM memory compression and prompt caching for improved performance
- Add agent registry and persistence layer for checkpoint management
- Refactor agent implementations (analysis, recon, verification, orchestrator) with enhanced capabilities
- Remove legacy agent implementations (analysis_v2, react_agent)
- Update API endpoints for agent task creation and project management
- Add frontend components for agent task creation and enhanced audit UI
- Consolidate agent service architecture with improved separation of concerns
- This refactoring provides a scalable foundation for multi-agent collaboration with knowledge-driven decision making and state persistence

											
										
										
											2025-12-12 15:27:12 +08:00
+								                "project_root": 项目根目录,
 								                "task_id": 任务ID,
-												feat(agent): implement Agent audit module with LangGraph integration

- Introduce new Agent audit functionality for autonomous code security analysis and vulnerability verification.
- Add API endpoints for managing Agent tasks and configurations.
- Implement UI components for Agent mode selection and embedding model configuration.
- Enhance the overall architecture with a focus on RAG (Retrieval-Augmented Generation) for improved code semantic search.
- Create a sandbox environment for secure execution of vulnerability tests.
- Update documentation to include details on the new Agent audit features and usage instructions.

											
										
										
											2025-12-11 19:09:10 +08:00
+								            }
 								        """
 								        import time
 								        start_time = time.time()
 								        project_info = input_data.get("project_info", {})
 								        config = input_data.get("config", {})
-												feat(agent): implement comprehensive agent architecture with knowledge base and persistence layer

- Add database migrations for agent checkpoints and tree node tracking
- Implement core agent execution framework with executor, state management, and message handling
- Create knowledge base system with framework-specific modules (Django, FastAPI, Flask, Express, React, Supabase)
- Add vulnerability knowledge modules covering authentication, cryptography, injection, XSS, XXE, SSRF, path traversal, deserialization, and race conditions
- Introduce new agent tools: thinking tool, reporting tool, and agent-specific utilities
- Implement LLM memory compression and prompt caching for improved performance
- Add agent registry and persistence layer for checkpoint management
- Refactor agent implementations (analysis, recon, verification, orchestrator) with enhanced capabilities
- Remove legacy agent implementations (analysis_v2, react_agent)
- Update API endpoints for agent task creation and project management
- Add frontend components for agent task creation and enhanced audit UI
- Consolidate agent service architecture with improved separation of concerns
- This refactoring provides a scalable foundation for multi-agent collaboration with knowledge-driven decision making and state persistence

											
										
										
											2025-12-12 15:27:12 +08:00
+								        # 🔥 保存运行时上下文，用于传递给子 Agent
 								        self._runtime_context = {
 								            "project_info": project_info,
 								            "config": config,
 								            "project_root": input_data.get("project_root", project_info.get("root", ".")),
 								            "task_id": input_data.get("task_id"),
 								        }
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								        # 构建初始消息
 								        initial_message = self._build_initial_message(project_info, config)
 								        # 初始化对话历史
 								        self._conversation_history = [
 								            {"role": "system", "content": self.config.system_prompt},
 								            {"role": "user", "content": initial_message},
 								        ]
 								        self._steps = []
 								        self._all_findings = []
-												feat(agent): 新增多语言代码测试和漏洞验证工具并增强错误处理

新增 PHP、Python、JavaScript 等多语言代码测试工具和命令注入、SQL 注入等专用漏洞验证工具
优化错误处理逻辑，提供更详细的错误信息和堆栈跟踪
增强 JSON 解析器，优先使用 json-repair 库处理复杂格式
改进 Agent 响应解析逻辑，更健壮地提取思考内容和操作指令
完善沙箱管理器的初始化和错误处理机制

											
										
										
											2025-12-14 17:20:54 +08:00
+								        self._agent_results = {}  # 🔥 重置 Agent 结果缓存
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								        final_result = None
-												feat(agent): implement comprehensive agent architecture with knowledge base and persistence layer

- Add database migrations for agent checkpoints and tree node tracking
- Implement core agent execution framework with executor, state management, and message handling
- Create knowledge base system with framework-specific modules (Django, FastAPI, Flask, Express, React, Supabase)
- Add vulnerability knowledge modules covering authentication, cryptography, injection, XSS, XXE, SSRF, path traversal, deserialization, and race conditions
- Introduce new agent tools: thinking tool, reporting tool, and agent-specific utilities
- Implement LLM memory compression and prompt caching for improved performance
- Add agent registry and persistence layer for checkpoint management
- Refactor agent implementations (analysis, recon, verification, orchestrator) with enhanced capabilities
- Remove legacy agent implementations (analysis_v2, react_agent)
- Update API endpoints for agent task creation and project management
- Add frontend components for agent task creation and enhanced audit UI
- Consolidate agent service architecture with improved separation of concerns
- This refactoring provides a scalable foundation for multi-agent collaboration with knowledge-driven decision making and state persistence

											
										
										
											2025-12-12 15:27:12 +08:00
+								        error_message = None  # 🔥 跟踪错误信息
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
 								        await self.emit_thinking("🧠 Orchestrator Agent 启动，LLM 开始自主编排决策...")
-												feat(agent): implement Agent audit module with LangGraph integration

- Introduce new Agent audit functionality for autonomous code security analysis and vulnerability verification.
- Add API endpoints for managing Agent tasks and configurations.
- Implement UI components for Agent mode selection and embedding model configuration.
- Enhance the overall architecture with a focus on RAG (Retrieval-Augmented Generation) for improved code semantic search.
- Create a sandbox environment for secure execution of vulnerability tests.
- Update documentation to include details on the new Agent audit features and usage instructions.

											
										
										
											2025-12-11 19:09:10 +08:00
+								        try:
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								            for iteration in range(self.config.max_iterations):
-												feat(agent): implement Agent audit module with LangGraph integration

- Introduce new Agent audit functionality for autonomous code security analysis and vulnerability verification.
- Add API endpoints for managing Agent tasks and configurations.
- Implement UI components for Agent mode selection and embedding model configuration.
- Enhance the overall architecture with a focus on RAG (Retrieval-Augmented Generation) for improved code semantic search.
- Create a sandbox environment for secure execution of vulnerability tests.
- Update documentation to include details on the new Agent audit features and usage instructions.

											
										
										
											2025-12-11 19:09:10 +08:00
+								                if self.is_cancelled:
 								                    break
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								                self._iteration = iteration + 1
-												feat(agent): implement Agent audit module with LangGraph integration

- Introduce new Agent audit functionality for autonomous code security analysis and vulnerability verification.
- Add API endpoints for managing Agent tasks and configurations.
- Implement UI components for Agent mode selection and embedding model configuration.
- Enhance the overall architecture with a focus on RAG (Retrieval-Augmented Generation) for improved code semantic search.
- Create a sandbox environment for secure execution of vulnerability tests.
- Update documentation to include details on the new Agent audit features and usage instructions.

											
										
										
											2025-12-11 19:09:10 +08:00
-												feat: Introduce structured agent collaboration with `TaskHandoff` and `analysis_v2` agent, updating core agent logic, tools, and audit UI.

											
										
										
											2025-12-11 23:29:04 +08:00
+								                # 🔥 再次检查取消标志（在LLM调用之前）
 								                if self.is_cancelled:
 								                    await self.emit_thinking("🛑 任务已取消，停止执行")
 								                    break
-												feat(agent): implement Agent audit module with LangGraph integration

- Introduce new Agent audit functionality for autonomous code security analysis and vulnerability verification.
- Add API endpoints for managing Agent tasks and configurations.
- Implement UI components for Agent mode selection and embedding model configuration.
- Enhance the overall architecture with a focus on RAG (Retrieval-Augmented Generation) for improved code semantic search.
- Create a sandbox environment for secure execution of vulnerability tests.
- Update documentation to include details on the new Agent audit features and usage instructions.

											
										
										
											2025-12-11 19:09:10 +08:00
-												feat: Introduce structured agent collaboration with `TaskHandoff` and `analysis_v2` agent, updating core agent logic, tools, and audit UI.

											
										
										
											2025-12-11 23:29:04 +08:00
+								                # 调用 LLM 进行思考和决策（流式输出）
 								                try:
 								                    llm_output, tokens_this_round = await self.stream_llm_call(
 								                        self._conversation_history,
-												feat(agent): 使用用户配置的LLM参数替代硬编码值

重构所有Agent和LLM服务，移除硬编码的temperature和max_tokens参数
添加get_analysis_config函数统一处理分析配置
在LLM测试接口中显示用户保存的配置参数
前端调试面板默认显示LLM测试详细信息

											
										
										
											2025-12-19 16:08:26 +08:00
+								                        # 🔥 不传递 temperature 和 max_tokens，使用用户配置
-												feat: Introduce structured agent collaboration with `TaskHandoff` and `analysis_v2` agent, updating core agent logic, tools, and audit UI.

											
										
										
											2025-12-11 23:29:04 +08:00
+								                    )
 								                except asyncio.CancelledError:
 								                    logger.info(f"[{self.name}] LLM call cancelled")
 								                    break
-												feat(agent): implement Agent audit module with LangGraph integration

- Introduce new Agent audit functionality for autonomous code security analysis and vulnerability verification.
- Add API endpoints for managing Agent tasks and configurations.
- Implement UI components for Agent mode selection and embedding model configuration.
- Enhance the overall architecture with a focus on RAG (Retrieval-Augmented Generation) for improved code semantic search.
- Create a sandbox environment for secure execution of vulnerability tests.
- Update documentation to include details on the new Agent audit features and usage instructions.

											
										
										
											2025-12-11 19:09:10 +08:00
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								                self._total_tokens += tokens_this_round
-												feat(agent): implement Agent audit module with LangGraph integration

- Introduce new Agent audit functionality for autonomous code security analysis and vulnerability verification.
- Add API endpoints for managing Agent tasks and configurations.
- Implement UI components for Agent mode selection and embedding model configuration.
- Enhance the overall architecture with a focus on RAG (Retrieval-Augmented Generation) for improved code semantic search.
- Create a sandbox environment for secure execution of vulnerability tests.
- Update documentation to include details on the new Agent audit features and usage instructions.

											
										
										
											2025-12-11 19:09:10 +08:00
-												feat(agent): implement comprehensive agent architecture with knowledge base and persistence layer

- Add database migrations for agent checkpoints and tree node tracking
- Implement core agent execution framework with executor, state management, and message handling
- Create knowledge base system with framework-specific modules (Django, FastAPI, Flask, Express, React, Supabase)
- Add vulnerability knowledge modules covering authentication, cryptography, injection, XSS, XXE, SSRF, path traversal, deserialization, and race conditions
- Introduce new agent tools: thinking tool, reporting tool, and agent-specific utilities
- Implement LLM memory compression and prompt caching for improved performance
- Add agent registry and persistence layer for checkpoint management
- Refactor agent implementations (analysis, recon, verification, orchestrator) with enhanced capabilities
- Remove legacy agent implementations (analysis_v2, react_agent)
- Update API endpoints for agent task creation and project management
- Add frontend components for agent task creation and enhanced audit UI
- Consolidate agent service architecture with improved separation of concerns
- This refactoring provides a scalable foundation for multi-agent collaboration with knowledge-driven decision making and state persistence

											
										
										
											2025-12-12 15:27:12 +08:00
+								                # 🔥 检测空响应
 								                if not llm_output or not llm_output.strip():
 								                    logger.warning(f"[{self.name}] Empty LLM response")
 								                    empty_retry_count = getattr(self, '_empty_retry_count', 0) + 1
 								                    self._empty_retry_count = empty_retry_count
-												feat: 新增安全工具集成和漏洞知识库扩展

- 添加 Bandit 和 Safety 安全工具到依赖项
- 新增 CSRF、业务逻辑和开放重定向漏洞知识文档
- 实现安全工具一键安装脚本和文档
- 改进模式匹配工具支持直接文件扫描
- 增强遥测模块和 Agent 审计功能
- 修复验证节点中 findings 合并逻辑
- 优化前端 Agent 审计界面和状态展示

											
										
										
											2025-12-13 12:35:03 +08:00
+								                    if empty_retry_count >= 5:  # 🔥 增加重试次数到5次
-												feat(agent): implement comprehensive agent architecture with knowledge base and persistence layer

- Add database migrations for agent checkpoints and tree node tracking
- Implement core agent execution framework with executor, state management, and message handling
- Create knowledge base system with framework-specific modules (Django, FastAPI, Flask, Express, React, Supabase)
- Add vulnerability knowledge modules covering authentication, cryptography, injection, XSS, XXE, SSRF, path traversal, deserialization, and race conditions
- Introduce new agent tools: thinking tool, reporting tool, and agent-specific utilities
- Implement LLM memory compression and prompt caching for improved performance
- Add agent registry and persistence layer for checkpoint management
- Refactor agent implementations (analysis, recon, verification, orchestrator) with enhanced capabilities
- Remove legacy agent implementations (analysis_v2, react_agent)
- Update API endpoints for agent task creation and project management
- Add frontend components for agent task creation and enhanced audit UI
- Consolidate agent service architecture with improved separation of concerns
- This refactoring provides a scalable foundation for multi-agent collaboration with knowledge-driven decision making and state persistence

											
										
										
											2025-12-12 15:27:12 +08:00
+								                        logger.error(f"[{self.name}] Too many empty responses, stopping")
 								                        error_message = "连续收到空响应，停止编排"
 								                        await self.emit_event("error", error_message)
 								                        break
-												feat: 新增安全工具集成和漏洞知识库扩展

- 添加 Bandit 和 Safety 安全工具到依赖项
- 新增 CSRF、业务逻辑和开放重定向漏洞知识文档
- 实现安全工具一键安装脚本和文档
- 改进模式匹配工具支持直接文件扫描
- 增强遥测模块和 Agent 审计功能
- 修复验证节点中 findings 合并逻辑
- 优化前端 Agent 审计界面和状态展示

											
										
										
											2025-12-13 12:35:03 +08:00
 								                    # 🔥 添加短暂延迟，避免快速重试
 								                    await asyncio.sleep(1.0)
 								                    # 🔥 更详细的重试提示
 								                    retry_prompt = f"""收到空响应（第 {empty_retry_count} 次）。请严格按照以下格式输出你的决策：
 								Thought: [你对当前审计状态的思考]
 								Action: [dispatch_agent|summarize|finish]
 								Action Input: {{"参数": "值"}}
 								当前可调度的子 Agent: {list(self.sub_agents.keys())}
 								当前已收集发现: {len(self._all_findings)} 个
 								请立即输出你的下一步决策。"""
-												feat(agent): implement comprehensive agent architecture with knowledge base and persistence layer

- Add database migrations for agent checkpoints and tree node tracking
- Implement core agent execution framework with executor, state management, and message handling
- Create knowledge base system with framework-specific modules (Django, FastAPI, Flask, Express, React, Supabase)
- Add vulnerability knowledge modules covering authentication, cryptography, injection, XSS, XXE, SSRF, path traversal, deserialization, and race conditions
- Introduce new agent tools: thinking tool, reporting tool, and agent-specific utilities
- Implement LLM memory compression and prompt caching for improved performance
- Add agent registry and persistence layer for checkpoint management
- Refactor agent implementations (analysis, recon, verification, orchestrator) with enhanced capabilities
- Remove legacy agent implementations (analysis_v2, react_agent)
- Update API endpoints for agent task creation and project management
- Add frontend components for agent task creation and enhanced audit UI
- Consolidate agent service architecture with improved separation of concerns
- This refactoring provides a scalable foundation for multi-agent collaboration with knowledge-driven decision making and state persistence

											
										
										
											2025-12-12 15:27:12 +08:00
+								                    self._conversation_history.append({
 								                        "role": "user",
-												feat: 新增安全工具集成和漏洞知识库扩展

- 添加 Bandit 和 Safety 安全工具到依赖项
- 新增 CSRF、业务逻辑和开放重定向漏洞知识文档
- 实现安全工具一键安装脚本和文档
- 改进模式匹配工具支持直接文件扫描
- 增强遥测模块和 Agent 审计功能
- 修复验证节点中 findings 合并逻辑
- 优化前端 Agent 审计界面和状态展示

											
										
										
											2025-12-13 12:35:03 +08:00
+								                        "content": retry_prompt,
-												feat(agent): implement comprehensive agent architecture with knowledge base and persistence layer

- Add database migrations for agent checkpoints and tree node tracking
- Implement core agent execution framework with executor, state management, and message handling
- Create knowledge base system with framework-specific modules (Django, FastAPI, Flask, Express, React, Supabase)
- Add vulnerability knowledge modules covering authentication, cryptography, injection, XSS, XXE, SSRF, path traversal, deserialization, and race conditions
- Introduce new agent tools: thinking tool, reporting tool, and agent-specific utilities
- Implement LLM memory compression and prompt caching for improved performance
- Add agent registry and persistence layer for checkpoint management
- Refactor agent implementations (analysis, recon, verification, orchestrator) with enhanced capabilities
- Remove legacy agent implementations (analysis_v2, react_agent)
- Update API endpoints for agent task creation and project management
- Add frontend components for agent task creation and enhanced audit UI
- Consolidate agent service architecture with improved separation of concerns
- This refactoring provides a scalable foundation for multi-agent collaboration with knowledge-driven decision making and state persistence

											
										
										
											2025-12-12 15:27:12 +08:00
+								                    })
 								                    continue
 								                # 重置空响应计数器
 								                self._empty_retry_count = 0
-												feat(agent): 增强API错误处理机制

添加对API错误的分类处理，包括速率限制、配额用尽、认证和连接错误
在base.py中标记API错误前缀，orchestrator.py中实现重试逻辑
litellm_adapter.py中完善错误类型识别和用户友好提示

											
										
										
											2025-12-25 17:35:31 +08:00
 								                # 🔥 检查是否是 API 错误（而非格式错误）
 								                if llm_output.startswith("[API_ERROR:"):
 								                    # 提取错误类型和消息
 								                    match = re.match(r"\[API_ERROR:(\w+)\]\s*(.*)", llm_output)
 								                    if match:
 								                        error_type = match.group(1)
 								                        error_message = match.group(2)
 								                        if error_type == "rate_limit":
 								                            # 速率限制 - 等待后重试
 								                            api_retry_count = getattr(self, '_api_retry_count', 0) + 1
 								                            self._api_retry_count = api_retry_count
 								                            if api_retry_count >= 3:
 								                                logger.error(f"[{self.name}] Too many rate limit errors, stopping")
 								                                await self.emit_event("error", f"API 速率限制重试次数过多: {error_message}")
 								                                break
 								                            logger.warning(f"[{self.name}] Rate limit hit, waiting before retry ({api_retry_count}/3)")
 								                            await self.emit_event("warning", f"API 速率限制，等待后重试 ({api_retry_count}/3)")
 								                            await asyncio.sleep(30)  # 等待 30 秒后重试
 								                            continue
 								                        elif error_type == "quota_exceeded":
 								                            # 配额用尽 - 终止任务
 								                            logger.error(f"[{self.name}] API quota exceeded: {error_message}")
 								                            await self.emit_event("error", f"API 配额已用尽: {error_message}")
 								                            break
 								                        elif error_type == "authentication":
 								                            # 认证错误 - 终止任务
 								                            logger.error(f"[{self.name}] API authentication error: {error_message}")
 								                            await self.emit_event("error", f"API 认证失败: {error_message}")
 								                            break
 								                        elif error_type == "connection":
 								                            # 连接错误 - 重试
 								                            api_retry_count = getattr(self, '_api_retry_count', 0) + 1
 								                            self._api_retry_count = api_retry_count
 								                            if api_retry_count >= 3:
 								                                logger.error(f"[{self.name}] Too many connection errors, stopping")
 								                                await self.emit_event("error", f"API 连接错误重试次数过多: {error_message}")
 								                                break
 								                            logger.warning(f"[{self.name}] Connection error, retrying ({api_retry_count}/3)")
 								                            await self.emit_event("warning", f"API 连接错误，重试中 ({api_retry_count}/3)")
 								                            await asyncio.sleep(5)  # 等待 5 秒后重试
 								                            continue
-												feat: Implement incremental historical event loading and a centralized state synchronization mechanism, including stream reconnection, for the AgentAudit page.

											
										
										
											2026-01-29 14:51:48 +08:00
+								                        elif error_type == "server_error":
 								                            # 服务器错误 (5xx) - 重试
 								                            api_retry_count = getattr(self, '_api_retry_count', 0) + 1
 								                            self._api_retry_count = api_retry_count
 								                            if api_retry_count >= 3:
 								                                logger.error(f"[{self.name}] Too many server errors, stopping")
 								                                await self.emit_event("error", f"API 服务端错误重试次数过多: {error_message}")
 								                                break
 								                            logger.warning(f"[{self.name}] Server error, retrying ({api_retry_count}/3)")
 								                            await self.emit_event("warning", f"API 服务端繁忙或异常，重试中 ({api_retry_count}/3)")
 								                            await asyncio.sleep(10)  # 等待 10 秒后重试（服务端错误通常需要更久恢复）
 								                            continue
-												feat(agent): 增强API错误处理机制

添加对API错误的分类处理，包括速率限制、配额用尽、认证和连接错误
在base.py中标记API错误前缀，orchestrator.py中实现重试逻辑
litellm_adapter.py中完善错误类型识别和用户友好提示

											
										
										
											2025-12-25 17:35:31 +08:00
+								                # 重置 API 重试计数器（成功获取响应后）
 								                self._api_retry_count = 0
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								                # 解析 LLM 的决策
 								                step = self._parse_llm_response(llm_output)
-												feat(agent): implement Agent audit module with LangGraph integration

- Introduce new Agent audit functionality for autonomous code security analysis and vulnerability verification.
- Add API endpoints for managing Agent tasks and configurations.
- Implement UI components for Agent mode selection and embedding model configuration.
- Enhance the overall architecture with a focus on RAG (Retrieval-Augmented Generation) for improved code semantic search.
- Create a sandbox environment for secure execution of vulnerability tests.
- Update documentation to include details on the new Agent audit features and usage instructions.

											
										
										
											2025-12-11 19:09:10 +08:00
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								                if not step:
 								                    # LLM 输出格式不正确，提示重试
-												feat(agent): implement comprehensive agent architecture with knowledge base and persistence layer

- Add database migrations for agent checkpoints and tree node tracking
- Implement core agent execution framework with executor, state management, and message handling
- Create knowledge base system with framework-specific modules (Django, FastAPI, Flask, Express, React, Supabase)
- Add vulnerability knowledge modules covering authentication, cryptography, injection, XSS, XXE, SSRF, path traversal, deserialization, and race conditions
- Introduce new agent tools: thinking tool, reporting tool, and agent-specific utilities
- Implement LLM memory compression and prompt caching for improved performance
- Add agent registry and persistence layer for checkpoint management
- Refactor agent implementations (analysis, recon, verification, orchestrator) with enhanced capabilities
- Remove legacy agent implementations (analysis_v2, react_agent)
- Update API endpoints for agent task creation and project management
- Add frontend components for agent task creation and enhanced audit UI
- Consolidate agent service architecture with improved separation of concerns
- This refactoring provides a scalable foundation for multi-agent collaboration with knowledge-driven decision making and state persistence

											
										
										
											2025-12-12 15:27:12 +08:00
+								                    format_retry_count = getattr(self, '_format_retry_count', 0) + 1
 								                    self._format_retry_count = format_retry_count
 								                    if format_retry_count >= 3:
 								                        logger.error(f"[{self.name}] Too many format errors, stopping")
 								                        error_message = "连续格式错误，停止编排"
 								                        await self.emit_event("error", error_message)
 								                        break
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								                    await self.emit_llm_decision("格式错误", "需要重新输出")
 								                    self._conversation_history.append({
 								                        "role": "assistant",
 								                        "content": llm_output,
 								                    })
 								                    self._conversation_history.append({
 								                        "role": "user",
 								                        "content": "请按照规定格式输出：Thought + Action + Action Input",
 								                    })
 								                    continue
-												feat(agent): implement comprehensive agent architecture with knowledge base and persistence layer

- Add database migrations for agent checkpoints and tree node tracking
- Implement core agent execution framework with executor, state management, and message handling
- Create knowledge base system with framework-specific modules (Django, FastAPI, Flask, Express, React, Supabase)
- Add vulnerability knowledge modules covering authentication, cryptography, injection, XSS, XXE, SSRF, path traversal, deserialization, and race conditions
- Introduce new agent tools: thinking tool, reporting tool, and agent-specific utilities
- Implement LLM memory compression and prompt caching for improved performance
- Add agent registry and persistence layer for checkpoint management
- Refactor agent implementations (analysis, recon, verification, orchestrator) with enhanced capabilities
- Remove legacy agent implementations (analysis_v2, react_agent)
- Update API endpoints for agent task creation and project management
- Add frontend components for agent task creation and enhanced audit UI
- Consolidate agent service architecture with improved separation of concerns
- This refactoring provides a scalable foundation for multi-agent collaboration with knowledge-driven decision making and state persistence

											
										
										
											2025-12-12 15:27:12 +08:00
+								                # 重置格式重试计数器
 								                self._format_retry_count = 0
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								                self._steps.append(step)
 								                # 🔥 发射 LLM 思考内容事件 - 展示编排决策的思考过程
 								                if step.thought:
 								                    await self.emit_llm_thought(step.thought, iteration + 1)
 								                # 添加 LLM 响应到历史
 								                self._conversation_history.append({
 								                    "role": "assistant",
 								                    "content": llm_output,
 								                })
 								                # 执行 LLM 决定的操作
 								                if step.action == "finish":
 								                    # 🔥 LLM 决定完成审计
 								                    await self.emit_llm_decision("完成审计", "LLM 判断审计已充分完成")
 								                    await self.emit_llm_complete(
 								                        f"编排完成，发现 {len(self._all_findings)} 个漏洞",
 								                        self._total_tokens
 								                    )
 								                    final_result = step.action_input
 								                    break
 								                elif step.action == "dispatch_agent":
 								                    # 🔥 LLM 决定调度子 Agent
 								                    agent_name = step.action_input.get("agent", "unknown")
 								                    task_desc = step.action_input.get("task", "")
 								                    await self.emit_llm_decision(
 								                        f"调度 {agent_name} Agent",
 								                        f"任务: {task_desc[:100]}"
 								                    )
 								                    await self.emit_llm_action("dispatch_agent", step.action_input)
 								                    observation = await self._dispatch_agent(step.action_input)
 								                    step.observation = observation
-												feat(agent): implement comprehensive agent architecture with knowledge base and persistence layer

- Add database migrations for agent checkpoints and tree node tracking
- Implement core agent execution framework with executor, state management, and message handling
- Create knowledge base system with framework-specific modules (Django, FastAPI, Flask, Express, React, Supabase)
- Add vulnerability knowledge modules covering authentication, cryptography, injection, XSS, XXE, SSRF, path traversal, deserialization, and race conditions
- Introduce new agent tools: thinking tool, reporting tool, and agent-specific utilities
- Implement LLM memory compression and prompt caching for improved performance
- Add agent registry and persistence layer for checkpoint management
- Refactor agent implementations (analysis, recon, verification, orchestrator) with enhanced capabilities
- Remove legacy agent implementations (analysis_v2, react_agent)
- Update API endpoints for agent task creation and project management
- Add frontend components for agent task creation and enhanced audit UI
- Consolidate agent service architecture with improved separation of concerns
- This refactoring provides a scalable foundation for multi-agent collaboration with knowledge-driven decision making and state persistence

											
										
										
											2025-12-12 15:27:12 +08:00
+								                    # 🔥 子 Agent 执行完成后检查取消状态
 								                    if self.is_cancelled:
 								                        logger.info(f"[{self.name}] Cancelled after sub-agent dispatch")
 								                        break
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								                    # 🔥 发射观察事件
 								                    await self.emit_llm_observation(observation)
 								                elif step.action == "summarize":
 								                    # LLM 要求汇总
 								                    await self.emit_llm_decision("汇总发现", "LLM 请求查看当前发现汇总")
 								                    observation = self._summarize_findings()
 								                    step.observation = observation
 								                    await self.emit_llm_observation(observation)
 								                else:
 								                    observation = f"未知操作: {step.action}，可用操作: dispatch_agent, summarize, finish"
 								                    await self.emit_llm_decision("未知操作", observation)
 								                # 添加观察结果到历史
 								                self._conversation_history.append({
 								                    "role": "user",
 								                    "content": f"Observation:\n{step.observation}",
 								                })
-												feat(agent): implement Agent audit module with LangGraph integration

- Introduce new Agent audit functionality for autonomous code security analysis and vulnerability verification.
- Add API endpoints for managing Agent tasks and configurations.
- Implement UI components for Agent mode selection and embedding model configuration.
- Enhance the overall architecture with a focus on RAG (Retrieval-Augmented Generation) for improved code semantic search.
- Create a sandbox environment for secure execution of vulnerability tests.
- Update documentation to include details on the new Agent audit features and usage instructions.

											
										
										
											2025-12-11 19:09:10 +08:00
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								            # 生成最终结果
 								            duration_ms = int((time.time() - start_time) * 1000)
-												feat(agent): implement Agent audit module with LangGraph integration

- Introduce new Agent audit functionality for autonomous code security analysis and vulnerability verification.
- Add API endpoints for managing Agent tasks and configurations.
- Implement UI components for Agent mode selection and embedding model configuration.
- Enhance the overall architecture with a focus on RAG (Retrieval-Augmented Generation) for improved code semantic search.
- Create a sandbox environment for secure execution of vulnerability tests.
- Update documentation to include details on the new Agent audit features and usage instructions.

											
										
										
											2025-12-11 19:09:10 +08:00
-												feat(agent): implement comprehensive agent architecture with knowledge base and persistence layer

- Add database migrations for agent checkpoints and tree node tracking
- Implement core agent execution framework with executor, state management, and message handling
- Create knowledge base system with framework-specific modules (Django, FastAPI, Flask, Express, React, Supabase)
- Add vulnerability knowledge modules covering authentication, cryptography, injection, XSS, XXE, SSRF, path traversal, deserialization, and race conditions
- Introduce new agent tools: thinking tool, reporting tool, and agent-specific utilities
- Implement LLM memory compression and prompt caching for improved performance
- Add agent registry and persistence layer for checkpoint management
- Refactor agent implementations (analysis, recon, verification, orchestrator) with enhanced capabilities
- Remove legacy agent implementations (analysis_v2, react_agent)
- Update API endpoints for agent task creation and project management
- Add frontend components for agent task creation and enhanced audit UI
- Consolidate agent service architecture with improved separation of concerns
- This refactoring provides a scalable foundation for multi-agent collaboration with knowledge-driven decision making and state persistence

											
										
										
											2025-12-12 15:27:12 +08:00
+								            # 🔥 如果被取消，返回取消结果
 								            if self.is_cancelled:
 								                await self.emit_event(
 								                    "info",
 								                    f"🛑 Orchestrator 已取消: {len(self._all_findings)} 个发现, {self._iteration} 轮决策"
 								                )
 								                return AgentResult(
 								                    success=False,
 								                    error="任务已取消",
 								                    data={
 								                        "findings": self._all_findings,
 								                        "steps": [
 								                            {
 								                                "thought": s.thought,
 								                                "action": s.action,
 								                                "action_input": s.action_input,
 								                                "observation": s.observation[:500] if s.observation else None,
 								                            }
 								                            for s in self._steps
 								                        ],
 								                    },
 								                    iterations=self._iteration,
 								                    tool_calls=self._tool_calls,
 								                    tokens_used=self._total_tokens,
 								                    duration_ms=duration_ms,
 								                )
 								            # 🔥 如果有错误，返回失败结果
 								            if error_message:
 								                await self.emit_event(
 								                    "error",
 								                    f"❌ Orchestrator 失败: {error_message}"
 								                )
 								                return AgentResult(
 								                    success=False,
 								                    error=error_message,
 								                    data={
 								                        "findings": self._all_findings,
 								                        "steps": [
 								                            {
 								                                "thought": s.thought,
 								                                "action": s.action,
 								                                "action_input": s.action_input,
 								                                "observation": s.observation[:500] if s.observation else None,
 								                            }
 								                            for s in self._steps
 								                        ],
 								                    },
 								                    iterations=self._iteration,
 								                    tool_calls=self._tool_calls,
 								                    tokens_used=self._total_tokens,
 								                    duration_ms=duration_ms,
 								                )
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								            await self.emit_event(
 								                "info",
 								                f"🎯 Orchestrator 完成: {len(self._all_findings)} 个发现, {self._iteration} 轮决策"
-												feat(agent): implement Agent audit module with LangGraph integration

- Introduce new Agent audit functionality for autonomous code security analysis and vulnerability verification.
- Add API endpoints for managing Agent tasks and configurations.
- Implement UI components for Agent mode selection and embedding model configuration.
- Enhance the overall architecture with a focus on RAG (Retrieval-Augmented Generation) for improved code semantic search.
- Create a sandbox environment for secure execution of vulnerability tests.
- Update documentation to include details on the new Agent audit features and usage instructions.

											
										
										
											2025-12-11 19:09:10 +08:00
+								            )
-												feat: 新增安全工具集成和漏洞知识库扩展

- 添加 Bandit 和 Safety 安全工具到依赖项
- 新增 CSRF、业务逻辑和开放重定向漏洞知识文档
- 实现安全工具一键安装脚本和文档
- 改进模式匹配工具支持直接文件扫描
- 增强遥测模块和 Agent 审计功能
- 修复验证节点中 findings 合并逻辑
- 优化前端 Agent 审计界面和状态展示

											
										
										
											2025-12-13 12:35:03 +08:00
 								            # 🔥 CRITICAL: Log final findings count before returning
 								            logger.info(f"[Orchestrator] Final result: {len(self._all_findings)} findings collected")
-												feat(agent): 增强漏洞发现处理流程和前端兼容性

- 后端添加对旧事件类型'finding'的兼容支持
- 改进漏洞发现标准化和去重逻辑
- 新增PoC生成要求和相关字段
- 优化沙箱配置初始化流程
- 前端添加ADD_FINDING操作和状态管理
- 增强事件流处理和序列号过滤
- 改进历史事件加载和SSE连接逻辑
- 添加漏洞验证状态和PoC信息到报告

											
										
										
											2025-12-13 18:45:05 +08:00
+								            if len(self._all_findings) == 0:
 								                logger.warning(f"[Orchestrator] ⚠️ No findings collected! Dispatched agents: {list(self._dispatched_tasks.keys())}, Iterations: {self._iteration}")
-												feat: 新增安全工具集成和漏洞知识库扩展

- 添加 Bandit 和 Safety 安全工具到依赖项
- 新增 CSRF、业务逻辑和开放重定向漏洞知识文档
- 实现安全工具一键安装脚本和文档
- 改进模式匹配工具支持直接文件扫描
- 增强遥测模块和 Agent 审计功能
- 修复验证节点中 findings 合并逻辑
- 优化前端 Agent 审计界面和状态展示

											
										
										
											2025-12-13 12:35:03 +08:00
+								            for i, f in enumerate(self._all_findings[:5]):  # Log first 5 for debugging
 								                logger.debug(f"[Orchestrator] Finding {i+1}: {f.get('title', 'N/A')} - {f.get('vulnerability_type', 'N/A')}")
-												feat(agent): implement Agent audit module with LangGraph integration

- Introduce new Agent audit functionality for autonomous code security analysis and vulnerability verification.
- Add API endpoints for managing Agent tasks and configurations.
- Implement UI components for Agent mode selection and embedding model configuration.
- Enhance the overall architecture with a focus on RAG (Retrieval-Augmented Generation) for improved code semantic search.
- Create a sandbox environment for secure execution of vulnerability tests.
- Update documentation to include details on the new Agent audit features and usage instructions.

											
										
										
											2025-12-11 19:09:10 +08:00
+								            return AgentResult(
 								                success=True,
 								                data={
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								                    "findings": self._all_findings,
 								                    "summary": final_result or self._generate_default_summary(),
 								                    "steps": [
 								                        {
 								                            "thought": s.thought,
 								                            "action": s.action,
 								                            "action_input": s.action_input,
 								                            "observation": s.observation[:500] if s.observation else None,
 								                        }
 								                        for s in self._steps
 								                    ],
-												feat(agent): implement Agent audit module with LangGraph integration

- Introduce new Agent audit functionality for autonomous code security analysis and vulnerability verification.
- Add API endpoints for managing Agent tasks and configurations.
- Implement UI components for Agent mode selection and embedding model configuration.
- Enhance the overall architecture with a focus on RAG (Retrieval-Augmented Generation) for improved code semantic search.
- Create a sandbox environment for secure execution of vulnerability tests.
- Update documentation to include details on the new Agent audit features and usage instructions.

											
										
										
											2025-12-11 19:09:10 +08:00
+								                },
 								                iterations=self._iteration,
 								                tool_calls=self._tool_calls,
 								                tokens_used=self._total_tokens,
 								                duration_ms=duration_ms,
 								            )
 								        except Exception as e:
 								            logger.error(f"Orchestrator failed: {e}", exc_info=True)
 								            return AgentResult(
 								                success=False,
 								                error=str(e),
 								            )
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								    def _build_initial_message(
-												feat(agent): implement Agent audit module with LangGraph integration

- Introduce new Agent audit functionality for autonomous code security analysis and vulnerability verification.
- Add API endpoints for managing Agent tasks and configurations.
- Implement UI components for Agent mode selection and embedding model configuration.
- Enhance the overall architecture with a focus on RAG (Retrieval-Augmented Generation) for improved code semantic search.
- Create a sandbox environment for secure execution of vulnerability tests.
- Update documentation to include details on the new Agent audit features and usage instructions.

											
										
										
											2025-12-11 19:09:10 +08:00
+								        self,
 								        project_info: Dict[str, Any],
 								        config: Dict[str, Any],
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								    ) -> str:
 								        """构建初始消息"""
-												feat(agent): enhance error handling and project scope filtering

- Downgrade Python version from 3.13 to 3.11.12 for compatibility
- Improve empty LLM response handling with better diagnostics and retry logic in AnalysisAgent
- Add detailed logging for empty response retries with token count and iteration tracking
- Implement fallback result generation instead of immediate failure on consecutive empty responses
- Enhance stream error handling with partial content recovery and error message propagation
- Add comprehensive exception handling in stream_llm_call to prevent error suppression
- Implement project scope filtering to ensure consistent filtered views across Orchestrator and sub-agents
- Track filtered files and directories separately when target_files are specified
- Add scope_limited flag and scope_message to project structure for transparency
- Remove manual progress_percentage setting and rely on computed property for COMPLETED status
- Improve code comments with diagnostic markers (🔥) for critical sections

											
										
										
											2025-12-12 16:36:39 +08:00
+								        structure = project_info.get('structure', {})
 								        # 🔥 检查是否是限定范围的审计
 								        scope_limited = structure.get('scope_limited', False)
 								        scope_message = structure.get('scope_message', '')
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								        msg = f"""请开始对以下项目进行安全审计。
-												feat(agent): implement Agent audit module with LangGraph integration

- Introduce new Agent audit functionality for autonomous code security analysis and vulnerability verification.
- Add API endpoints for managing Agent tasks and configurations.
- Implement UI components for Agent mode selection and embedding model configuration.
- Enhance the overall architecture with a focus on RAG (Retrieval-Augmented Generation) for improved code semantic search.
- Create a sandbox environment for secure execution of vulnerability tests.
- Update documentation to include details on the new Agent audit features and usage instructions.

											
										
										
											2025-12-11 19:09:10 +08:00
 								## 项目信息
 								- 名称: {project_info.get('name', 'unknown')}
 								- 语言: {project_info.get('languages', [])}
 								- 文件数量: {project_info.get('file_count', 0)}
-												feat(agent): enhance error handling and project scope filtering

- Downgrade Python version from 3.13 to 3.11.12 for compatibility
- Improve empty LLM response handling with better diagnostics and retry logic in AnalysisAgent
- Add detailed logging for empty response retries with token count and iteration tracking
- Implement fallback result generation instead of immediate failure on consecutive empty responses
- Enhance stream error handling with partial content recovery and error message propagation
- Add comprehensive exception handling in stream_llm_call to prevent error suppression
- Implement project scope filtering to ensure consistent filtered views across Orchestrator and sub-agents
- Track filtered files and directories separately when target_files are specified
- Add scope_limited flag and scope_message to project structure for transparency
- Remove manual progress_percentage setting and rely on computed property for COMPLETED status
- Improve code comments with diagnostic markers (🔥) for critical sections

											
										
										
											2025-12-12 16:36:39 +08:00
+								"""
 								        # 🔥 根据是否限定范围显示不同的结构信息
 								        if scope_limited:
 								            msg += f"""
 								## ⚠️ 审计范围限定
 								**{scope_message}**
-												feat(agent): implement Agent audit module with LangGraph integration

- Introduce new Agent audit functionality for autonomous code security analysis and vulnerability verification.
- Add API endpoints for managing Agent tasks and configurations.
- Implement UI components for Agent mode selection and embedding model configuration.
- Enhance the overall architecture with a focus on RAG (Retrieval-Augmented Generation) for improved code semantic search.
- Create a sandbox environment for secure execution of vulnerability tests.
- Update documentation to include details on the new Agent audit features and usage instructions.

											
										
										
											2025-12-11 19:09:10 +08:00
-												feat(agent): enhance error handling and project scope filtering

- Downgrade Python version from 3.13 to 3.11.12 for compatibility
- Improve empty LLM response handling with better diagnostics and retry logic in AnalysisAgent
- Add detailed logging for empty response retries with token count and iteration tracking
- Implement fallback result generation instead of immediate failure on consecutive empty responses
- Enhance stream error handling with partial content recovery and error message propagation
- Add comprehensive exception handling in stream_llm_call to prevent error suppression
- Implement project scope filtering to ensure consistent filtered views across Orchestrator and sub-agents
- Track filtered files and directories separately when target_files are specified
- Add scope_limited flag and scope_message to project structure for transparency
- Remove manual progress_percentage setting and rely on computed property for COMPLETED status
- Improve code comments with diagnostic markers (🔥) for critical sections

											
										
										
											2025-12-12 16:36:39 +08:00
+								### 目标文件列表
 								"""
 								            for f in structure.get('files', []):
 								                msg += f"- {f}\n"
 								            if structure.get('directories'):
 								                msg += f"""
 								### 相关目录
 								{structure.get('directories', [])}
 								"""
 								        else:
 								            msg += f"""
 								## 目录结构
 								{json.dumps(structure, ensure_ascii=False, indent=2)}
 								"""
 								        # 🔥 如果配置了 target_files，也明确显示
 								        target_files = config.get('target_files', [])
 								        if target_files:
 								            msg += f"""
 								## ⚠️ 重要提示
 								用户指定了 **{len(target_files)}** 个目标文件进行审计。
 								请确保你的分析集中在这些指定的文件上，不要浪费时间分析其他文件。
 								"""
 								        msg += f"""
-												feat(agent): implement Agent audit module with LangGraph integration

- Introduce new Agent audit functionality for autonomous code security analysis and vulnerability verification.
- Add API endpoints for managing Agent tasks and configurations.
- Implement UI components for Agent mode selection and embedding model configuration.
- Enhance the overall architecture with a focus on RAG (Retrieval-Augmented Generation) for improved code semantic search.
- Create a sandbox environment for secure execution of vulnerability tests.
- Update documentation to include details on the new Agent audit features and usage instructions.

											
										
										
											2025-12-11 19:09:10 +08:00
+								## 用户配置
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								- 目标漏洞: {config.get('target_vulnerabilities', ['all'])}
-												feat(agent): implement Agent audit module with LangGraph integration

- Introduce new Agent audit functionality for autonomous code security analysis and vulnerability verification.
- Add API endpoints for managing Agent tasks and configurations.
- Implement UI components for Agent mode selection and embedding model configuration.
- Enhance the overall architecture with a focus on RAG (Retrieval-Augmented Generation) for improved code semantic search.
- Create a sandbox environment for secure execution of vulnerability tests.
- Update documentation to include details on the new Agent audit features and usage instructions.

											
										
										
											2025-12-11 19:09:10 +08:00
+								- 验证级别: {config.get('verification_level', 'sandbox')}
 								- 排除模式: {config.get('exclude_patterns', [])}
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								## 可用子 Agent
 								{', '.join(self.sub_agents.keys()) if self.sub_agents else '(暂无子 Agent)'}
 								请开始你的审计工作。首先思考应该如何开展，然后决定第一步做什么。"""
 								        return msg
 								    def _parse_llm_response(self, response: str) -> Optional[AgentStep]:
 								        """Parse one LLM reply into an ``AgentStep``.

 								        The reply is expected to carry ``Thought:``, ``Action:`` and
 								        ``Action Input:`` sections. Bold Markdown labels such as
 								        ``**Action:**`` are rewritten to their plain form before matching.

 								        Args:
 								            response: Raw text returned by the LLM.

 								        Returns:
 								            An ``AgentStep`` built from the extracted thought, action name and
 								            parsed action input, or ``None`` when either the ``Action:`` or
 								            the ``Action Input:`` section cannot be found.
 								        """
 								        # v2.1 pre-processing: the LLM sometimes emits **Action:** instead of
 								        # Action:. Substitutions run one after another, in this exact order.
 								        bold_label_rewrites = (
 								            (r'\*\*Action:\*\*', 'Action:'),
 								            (r'\*\*Action Input:\*\*', 'Action Input:'),
 								            (r'\*\*Thought:\*\*', 'Thought:'),
 								            (r'\*\*Observation:\*\*', 'Observation:'),
 								        )
 								        text = response
 								        for bold_pattern, plain_label in bold_label_rewrites:
 								            text = re.sub(bold_pattern, plain_label, text)

 								        # An action name is mandatory; without one there is no step.
 								        action_found = re.search(r'Action:\s*(\w+)', text)
 								        if action_found is None:
 								            return None

 								        # The action input runs until the next Thought:/Observation: label
 								        # or the end of the reply.
 								        payload_found = re.search(
 								            r'Action Input:\s*(.*?)(?=Thought:|Observation:|$)',
 								            text,
 								            re.DOTALL,
 								        )
 								        if payload_found is None:
 								            return None

 								        # The thought is optional and falls back to an empty string.
 								        thought_found = re.search(r'Thought:\s*(.*?)(?=Action:|$)', text, re.DOTALL)
 								        if thought_found:
 								            thought_text = thought_found.group(1).strip()
 								        else:
 								            thought_text = ""

 								        # Strip Markdown code fences (```json first, then any bare ```).
 								        payload = payload_found.group(1).strip()
 								        payload = re.sub(r'```\s*', '', re.sub(r'```json\s*', '', payload))

 								        # Hand the cleaned text to the JSON parser, passing the raw text
 								        # wrapped in a dict as its ``default``.
 								        parsed_payload = AgentJsonParser.parse(payload, default={"raw": payload})

 								        return AgentStep(
 								            thought=thought_text,
 								            action=action_found.group(1).strip(),
 								            action_input=parsed_payload,
 								        )
 								    async def _dispatch_agent(self, params: Dict[str, Any]) -> str:
 								        """调度子 Agent"""
 								        agent_name = params.get("agent", "")
 								        task = params.get("task", "")
 								        context = params.get("context", "")
-												chore: reduce logging verbosity and clean up file formatting

- Change logger.info to logger.debug in agent_tasks.py streaming and tree endpoints
- Disable SQLAlchemy echo mode in database session configuration
- Suppress uvicorn access logs and LiteLLM INFO level logging in main application
- Remove LogViewer component and LogsPage from frontend
- Add trailing newlines to multiple backend configuration and model files
- Update frontend routing to remove logs page reference
- Improve application startup logging clarity by filtering verbose third-party logs

											
										
										
											2025-12-12 15:50:48 +08:00
+								        logger.debug(f"[Orchestrator] _dispatch_agent 被调用: agent_name='{agent_name}', task='{task[:50]}...'")
 								        # 🔥 尝试大小写不敏感匹配
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								        agent = self.sub_agents.get(agent_name)
-												chore: reduce logging verbosity and clean up file formatting

- Change logger.info to logger.debug in agent_tasks.py streaming and tree endpoints
- Disable SQLAlchemy echo mode in database session configuration
- Suppress uvicorn access logs and LiteLLM INFO level logging in main application
- Remove LogViewer component and LogsPage from frontend
- Add trailing newlines to multiple backend configuration and model files
- Update frontend routing to remove logs page reference
- Improve application startup logging clarity by filtering verbose third-party logs

											
										
										
											2025-12-12 15:50:48 +08:00
+								        if not agent:
 								            # 尝试小写匹配
 								            agent_name_lower = agent_name.lower()
 								            agent = self.sub_agents.get(agent_name_lower)
 								            if agent:
 								                agent_name = agent_name_lower
 								                logger.debug(f"[Orchestrator] 使用小写匹配: {agent_name}")
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
 								        if not agent:
 								            available = list(self.sub_agents.keys())
-												chore: reduce logging verbosity and clean up file formatting

- Change logger.info to logger.debug in agent_tasks.py streaming and tree endpoints
- Disable SQLAlchemy echo mode in database session configuration
- Suppress uvicorn access logs and LiteLLM INFO level logging in main application
- Remove LogViewer component and LogsPage from frontend
- Add trailing newlines to multiple backend configuration and model files
- Update frontend routing to remove logs page reference
- Improve application startup logging clarity by filtering verbose third-party logs

											
										
										
											2025-12-12 15:50:48 +08:00
+								            logger.warning(f"[Orchestrator] Agent '{agent_name}' 不存在，可用: {available}")
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								            return f"错误: Agent '{agent_name}' 不存在。可用的 Agent: {available}"
-												feat(agent): implement comprehensive agent architecture with knowledge base and persistence layer

- Add database migrations for agent checkpoints and tree node tracking
- Implement core agent execution framework with executor, state management, and message handling
- Create knowledge base system with framework-specific modules (Django, FastAPI, Flask, Express, React, Supabase)
- Add vulnerability knowledge modules covering authentication, cryptography, injection, XSS, XXE, SSRF, path traversal, deserialization, and race conditions
- Introduce new agent tools: thinking tool, reporting tool, and agent-specific utilities
- Implement LLM memory compression and prompt caching for improved performance
- Add agent registry and persistence layer for checkpoint management
- Refactor agent implementations (analysis, recon, verification, orchestrator) with enhanced capabilities
- Remove legacy agent implementations (analysis_v2, react_agent)
- Update API endpoints for agent task creation and project management
- Add frontend components for agent task creation and enhanced audit UI
- Consolidate agent service architecture with improved separation of concerns
- This refactoring provides a scalable foundation for multi-agent collaboration with knowledge-driven decision making and state persistence

											
										
										
											2025-12-12 15:27:12 +08:00
+								        # 🔥 检查是否重复调度同一个 Agent
 								        dispatch_count = self._dispatched_tasks.get(agent_name, 0)
 								        if dispatch_count >= 2:
 								            return f"""## ⚠️ 重复调度警告
 								你已经调度 {agent_name} Agent {dispatch_count} 次了。
 								如果之前的调度没有返回有用的结果，请考虑：
 . 尝试调度其他 Agent（如 analysis 或 verification）
 . 使用 finish 操作结束审计并汇总已有发现
 . 提供更具体的任务描述
 								当前已收集的发现数量: {len(self._all_findings)}
 								"""
 								        self._dispatched_tasks[agent_name] = dispatch_count + 1
 								        # 🔥 设置父 Agent ID 并注册到注册表（动态 Agent 树）
-												chore: reduce logging verbosity and clean up file formatting

- Change logger.info to logger.debug in agent_tasks.py streaming and tree endpoints
- Disable SQLAlchemy echo mode in database session configuration
- Suppress uvicorn access logs and LiteLLM INFO level logging in main application
- Remove LogViewer component and LogsPage from frontend
- Add trailing newlines to multiple backend configuration and model files
- Update frontend routing to remove logs page reference
- Improve application startup logging clarity by filtering verbose third-party logs

											
										
										
											2025-12-12 15:50:48 +08:00
+								        logger.debug(f"[Orchestrator] 准备调度 {agent_name} Agent, agent._registered={agent._registered}")
-												feat(agent): implement comprehensive agent architecture with knowledge base and persistence layer

- Add database migrations for agent checkpoints and tree node tracking
- Implement core agent execution framework with executor, state management, and message handling
- Create knowledge base system with framework-specific modules (Django, FastAPI, Flask, Express, React, Supabase)
- Add vulnerability knowledge modules covering authentication, cryptography, injection, XSS, XXE, SSRF, path traversal, deserialization, and race conditions
- Introduce new agent tools: thinking tool, reporting tool, and agent-specific utilities
- Implement LLM memory compression and prompt caching for improved performance
- Add agent registry and persistence layer for checkpoint management
- Refactor agent implementations (analysis, recon, verification, orchestrator) with enhanced capabilities
- Remove legacy agent implementations (analysis_v2, react_agent)
- Update API endpoints for agent task creation and project management
- Add frontend components for agent task creation and enhanced audit UI
- Consolidate agent service architecture with improved separation of concerns
- This refactoring provides a scalable foundation for multi-agent collaboration with knowledge-driven decision making and state persistence

											
										
										
											2025-12-12 15:27:12 +08:00
+								        agent.set_parent_id(self._agent_id)
-												chore: reduce logging verbosity and clean up file formatting

- Change logger.info to logger.debug in agent_tasks.py streaming and tree endpoints
- Disable SQLAlchemy echo mode in database session configuration
- Suppress uvicorn access logs and LiteLLM INFO level logging in main application
- Remove LogViewer component and LogsPage from frontend
- Add trailing newlines to multiple backend configuration and model files
- Update frontend routing to remove logs page reference
- Improve application startup logging clarity by filtering verbose third-party logs

											
										
										
											2025-12-12 15:50:48 +08:00
+								        logger.debug(f"[Orchestrator] 设置 parent_id 完成，准备注册 {agent_name}")
-												feat(agent): implement comprehensive agent architecture with knowledge base and persistence layer

- Add database migrations for agent checkpoints and tree node tracking
- Implement core agent execution framework with executor, state management, and message handling
- Create knowledge base system with framework-specific modules (Django, FastAPI, Flask, Express, React, Supabase)
- Add vulnerability knowledge modules covering authentication, cryptography, injection, XSS, XXE, SSRF, path traversal, deserialization, and race conditions
- Introduce new agent tools: thinking tool, reporting tool, and agent-specific utilities
- Implement LLM memory compression and prompt caching for improved performance
- Add agent registry and persistence layer for checkpoint management
- Refactor agent implementations (analysis, recon, verification, orchestrator) with enhanced capabilities
- Remove legacy agent implementations (analysis_v2, react_agent)
- Update API endpoints for agent task creation and project management
- Add frontend components for agent task creation and enhanced audit UI
- Consolidate agent service architecture with improved separation of concerns
- This refactoring provides a scalable foundation for multi-agent collaboration with knowledge-driven decision making and state persistence

											
										
										
											2025-12-12 15:27:12 +08:00
+								        agent._register_to_registry(task=task)
-												chore: reduce logging verbosity and clean up file formatting

- Change logger.info to logger.debug in agent_tasks.py streaming and tree endpoints
- Disable SQLAlchemy echo mode in database session configuration
- Suppress uvicorn access logs and LiteLLM INFO level logging in main application
- Remove LogViewer component and LogsPage from frontend
- Add trailing newlines to multiple backend configuration and model files
- Update frontend routing to remove logs page reference
- Improve application startup logging clarity by filtering verbose third-party logs

											
										
										
											2025-12-12 15:50:48 +08:00
+								        logger.debug(f"[Orchestrator] {agent_name} 注册完成，agent._registered={agent._registered}")
-												feat(agent): implement comprehensive agent architecture with knowledge base and persistence layer

- Add database migrations for agent checkpoints and tree node tracking
- Implement core agent execution framework with executor, state management, and message handling
- Create knowledge base system with framework-specific modules (Django, FastAPI, Flask, Express, React, Supabase)
- Add vulnerability knowledge modules covering authentication, cryptography, injection, XSS, XXE, SSRF, path traversal, deserialization, and race conditions
- Introduce new agent tools: thinking tool, reporting tool, and agent-specific utilities
- Implement LLM memory compression and prompt caching for improved performance
- Add agent registry and persistence layer for checkpoint management
- Refactor agent implementations (analysis, recon, verification, orchestrator) with enhanced capabilities
- Remove legacy agent implementations (analysis_v2, react_agent)
- Update API endpoints for agent task creation and project management
- Add frontend components for agent task creation and enhanced audit UI
- Consolidate agent service architecture with improved separation of concerns
- This refactoring provides a scalable foundation for multi-agent collaboration with knowledge-driven decision making and state persistence

											
										
										
											2025-12-12 15:27:12 +08:00
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								        await self.emit_event(
 								            "dispatch",
 								            f"📤 调度 {agent_name} Agent: {task[:100]}...",
 								            agent=agent_name,
 								            task=task,
 								        )
 								        self._tool_calls += 1
 								        try:
-												feat(agent): implement comprehensive agent architecture with knowledge base and persistence layer

- Add database migrations for agent checkpoints and tree node tracking
- Implement core agent execution framework with executor, state management, and message handling
- Create knowledge base system with framework-specific modules (Django, FastAPI, Flask, Express, React, Supabase)
- Add vulnerability knowledge modules covering authentication, cryptography, injection, XSS, XXE, SSRF, path traversal, deserialization, and race conditions
- Introduce new agent tools: thinking tool, reporting tool, and agent-specific utilities
- Implement LLM memory compression and prompt caching for improved performance
- Add agent registry and persistence layer for checkpoint management
- Refactor agent implementations (analysis, recon, verification, orchestrator) with enhanced capabilities
- Remove legacy agent implementations (analysis_v2, react_agent)
- Update API endpoints for agent task creation and project management
- Add frontend components for agent task creation and enhanced audit UI
- Consolidate agent service architecture with improved separation of concerns
- This refactoring provides a scalable foundation for multi-agent collaboration with knowledge-driven decision making and state persistence

											
										
										
											2025-12-12 15:27:12 +08:00
+								            # 🔥 构建子 Agent 输入 - 传递完整的运行时上下文
 								            project_info = self._runtime_context.get("project_info", {}).copy()
 								            # 确保 project_info 包含 root 路径
 								            if "root" not in project_info:
 								                project_info["root"] = self._runtime_context.get("project_root", ".")
-												feat(agent): 新增多语言代码测试和漏洞验证工具并增强错误处理

新增 PHP、Python、JavaScript 等多语言代码测试工具和命令注入、SQL 注入等专用漏洞验证工具
优化错误处理逻辑，提供更详细的错误信息和堆栈跟踪
增强 JSON 解析器，优先使用 json-repair 库处理复杂格式
改进 Agent 响应解析逻辑，更健壮地提取思考内容和操作指令
完善沙箱管理器的初始化和错误处理机制

											
										
										
											2025-12-14 17:20:54 +08:00
 								            # 🔥 FIX: 构建完整的 previous_results，包含所有已执行 Agent 的结果
 								            previous_results = {
 								                "findings": self._all_findings,  # 传递已收集的发现
 								            }
 								            # 🔥 将之前 Agent 的完整结果传递给后续 Agent
 								            for prev_agent, prev_data in self._agent_results.items():
 								                previous_results[prev_agent] = {"data": prev_data}
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								            sub_input = {
 								                "task": task,
 								                "task_context": context,
-												feat(agent): implement comprehensive agent architecture with knowledge base and persistence layer

- Add database migrations for agent checkpoints and tree node tracking
- Implement core agent execution framework with executor, state management, and message handling
- Create knowledge base system with framework-specific modules (Django, FastAPI, Flask, Express, React, Supabase)
- Add vulnerability knowledge modules covering authentication, cryptography, injection, XSS, XXE, SSRF, path traversal, deserialization, and race conditions
- Introduce new agent tools: thinking tool, reporting tool, and agent-specific utilities
- Implement LLM memory compression and prompt caching for improved performance
- Add agent registry and persistence layer for checkpoint management
- Refactor agent implementations (analysis, recon, verification, orchestrator) with enhanced capabilities
- Remove legacy agent implementations (analysis_v2, react_agent)
- Update API endpoints for agent task creation and project management
- Add frontend components for agent task creation and enhanced audit UI
- Consolidate agent service architecture with improved separation of concerns
- This refactoring provides a scalable foundation for multi-agent collaboration with knowledge-driven decision making and state persistence

											
										
										
											2025-12-12 15:27:12 +08:00
+								                "project_info": project_info,
 								                "config": self._runtime_context.get("config", {}),
 								                "project_root": self._runtime_context.get("project_root", "."),
-												feat(agent): 新增多语言代码测试和漏洞验证工具并增强错误处理

新增 PHP、Python、JavaScript 等多语言代码测试工具和命令注入、SQL 注入等专用漏洞验证工具
优化错误处理逻辑，提供更详细的错误信息和堆栈跟踪
增强 JSON 解析器，优先使用 json-repair 库处理复杂格式
改进 Agent 响应解析逻辑，更健壮地提取思考内容和操作指令
完善沙箱管理器的初始化和错误处理机制

											
										
										
											2025-12-14 17:20:54 +08:00
+								                "previous_results": previous_results,
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								            }
-												feat(agent): 实现任务取消和超时处理机制

添加对Agent任务的取消和超时处理支持，包括：
- 在工具执行、子Agent运行和项目初始化阶段检查取消状态
- 为不同工具和Agent类型设置合理的超时时间
- 使用asyncio实现取消检查和超时控制
- 优化取消响应速度，减少资源浪费

											
										
										
											2025-12-16 17:31:29 +08:00
-												feat(agent): implement comprehensive agent architecture with knowledge base and persistence layer

- Add database migrations for agent checkpoints and tree node tracking
- Implement core agent execution framework with executor, state management, and message handling
- Create knowledge base system with framework-specific modules (Django, FastAPI, Flask, Express, React, Supabase)
- Add vulnerability knowledge modules covering authentication, cryptography, injection, XSS, XXE, SSRF, path traversal, deserialization, and race conditions
- Introduce new agent tools: thinking tool, reporting tool, and agent-specific utilities
- Implement LLM memory compression and prompt caching for improved performance
- Add agent registry and persistence layer for checkpoint management
- Refactor agent implementations (analysis, recon, verification, orchestrator) with enhanced capabilities
- Remove legacy agent implementations (analysis_v2, react_agent)
- Update API endpoints for agent task creation and project management
- Add frontend components for agent task creation and enhanced audit UI
- Consolidate agent service architecture with improved separation of concerns
- This refactoring provides a scalable foundation for multi-agent collaboration with knowledge-driven decision making and state persistence

											
										
										
											2025-12-12 15:27:12 +08:00
+								            # 🔥 执行子 Agent 前检查取消状态
 								            if self.is_cancelled:
 								                return f"## {agent_name} Agent 执行取消\n\n任务已被用户取消"
-												feat(agent): 实现任务取消和超时处理机制

添加对Agent任务的取消和超时处理支持，包括：
- 在工具执行、子Agent运行和项目初始化阶段检查取消状态
- 为不同工具和Agent类型设置合理的超时时间
- 使用asyncio实现取消检查和超时控制
- 优化取消响应速度，减少资源浪费

											
										
										
											2025-12-16 17:31:29 +08:00
 								            # 🔥 执行子 Agent - 支持取消和超时
 								            # 设置子 Agent 超时（根据 Agent 类型）
 								            agent_timeouts = {
 								                "recon": 300,        # 5 分钟
 								                "analysis": 600,     # 10 分钟
-												feat: enhance Gitea support and merge upstream v3.0.0

- Merge upstream v3.0.0 changes
- Fix security vulnerabilities (SSRF, Path Traversal) by introducing `parse_repository_url` utility
- Fix token leakage and handling in `scanner.py` and `projects.py`
- Fix `NameError` in `scanner.py`
- Fix `frontend/docker-entrypoint.sh` API URL escaping
- Standardize Gitea token naming to `gitea_token`

											
										
										
											2025-12-17 11:02:42 +08:00
+								                "verification": 600, # 10 分钟
-												feat(agent): 实现任务取消和超时处理机制

添加对Agent任务的取消和超时处理支持，包括：
- 在工具执行、子Agent运行和项目初始化阶段检查取消状态
- 为不同工具和Agent类型设置合理的超时时间
- 使用asyncio实现取消检查和超时控制
- 优化取消响应速度，减少资源浪费

											
										
										
											2025-12-16 17:31:29 +08:00
+								            }
 								            timeout = agent_timeouts.get(agent_name, 300)
 								            async def run_with_cancel_check():
 								                """包装子 Agent 执行，定期检查取消状态"""
 								                run_task = asyncio.create_task(agent.run(sub_input))
 								                try:
 								                    while not run_task.done():
 								                        if self.is_cancelled:
-												feat: enhance Gitea support and merge upstream v3.0.0

- Merge upstream v3.0.0 changes
- Fix security vulnerabilities (SSRF, Path Traversal) by introducing `parse_repository_url` utility
- Fix token leakage and handling in `scanner.py` and `projects.py`
- Fix `NameError` in `scanner.py`
- Fix `frontend/docker-entrypoint.sh` API URL escaping
- Standardize Gitea token naming to `gitea_token`

											
										
										
											2025-12-17 11:02:42 +08:00
+								                            # 🔥 传播取消到子 Agent
 								                            logger.info(f"[{self.name}] Cancelling sub-agent {agent_name} due to parent cancel")
-												feat(agent): 实现任务取消和超时处理机制

添加对Agent任务的取消和超时处理支持，包括：
- 在工具执行、子Agent运行和项目初始化阶段检查取消状态
- 为不同工具和Agent类型设置合理的超时时间
- 使用asyncio实现取消检查和超时控制
- 优化取消响应速度，减少资源浪费

											
										
										
											2025-12-16 17:31:29 +08:00
+								                            if hasattr(agent, 'cancel'):
 								                                agent.cancel()
 								                            run_task.cancel()
 								                            try:
 								                                await run_task
 								                            except asyncio.CancelledError:
 								                                pass
 								                            raise asyncio.CancelledError("任务已取消")
-												feat: enhance Gitea support and merge upstream v3.0.0

- Merge upstream v3.0.0 changes
- Fix security vulnerabilities (SSRF, Path Traversal) by introducing `parse_repository_url` utility
- Fix token leakage and handling in `scanner.py` and `projects.py`
- Fix `NameError` in `scanner.py`
- Fix `frontend/docker-entrypoint.sh` API URL escaping
- Standardize Gitea token naming to `gitea_token`

											
										
										
											2025-12-17 11:02:42 +08:00
+								                        # Use asyncio.wait to poll without cancelling the task
 								                        done, pending = await asyncio.wait(
 								                            [run_task],
 								                            timeout=0.5,
 								                            return_when=asyncio.FIRST_COMPLETED
 								                        )
 								                        if run_task in done:
 								                            return run_task.result()
 								                        # If not done, continue loop
 								                        continue
-												feat(agent): 实现任务取消和超时处理机制

添加对Agent任务的取消和超时处理支持，包括：
- 在工具执行、子Agent运行和项目初始化阶段检查取消状态
- 为不同工具和Agent类型设置合理的超时时间
- 使用asyncio实现取消检查和超时控制
- 优化取消响应速度，减少资源浪费

											
										
										
											2025-12-16 17:31:29 +08:00
 								                    return await run_task
 								                except asyncio.CancelledError:
-												feat: enhance Gitea support and merge upstream v3.0.0

- Merge upstream v3.0.0 changes
- Fix security vulnerabilities (SSRF, Path Traversal) by introducing `parse_repository_url` utility
- Fix token leakage and handling in `scanner.py` and `projects.py`
- Fix `NameError` in `scanner.py`
- Fix `frontend/docker-entrypoint.sh` API URL escaping
- Standardize Gitea token naming to `gitea_token`

											
										
										
											2025-12-17 11:02:42 +08:00
+								                    # 🔥 确保子任务被取消
-												feat(agent): 实现任务取消和超时处理机制

添加对Agent任务的取消和超时处理支持，包括：
- 在工具执行、子Agent运行和项目初始化阶段检查取消状态
- 为不同工具和Agent类型设置合理的超时时间
- 使用asyncio实现取消检查和超时控制
- 优化取消响应速度，减少资源浪费

											
										
										
											2025-12-16 17:31:29 +08:00
+								                    if not run_task.done():
-												feat: enhance Gitea support and merge upstream v3.0.0

- Merge upstream v3.0.0 changes
- Fix security vulnerabilities (SSRF, Path Traversal) by introducing `parse_repository_url` utility
- Fix token leakage and handling in `scanner.py` and `projects.py`
- Fix `NameError` in `scanner.py`
- Fix `frontend/docker-entrypoint.sh` API URL escaping
- Standardize Gitea token naming to `gitea_token`

											
										
										
											2025-12-17 11:02:42 +08:00
+								                        if hasattr(agent, 'cancel'):
 								                            agent.cancel()
-												feat(agent): 实现任务取消和超时处理机制

添加对Agent任务的取消和超时处理支持，包括：
- 在工具执行、子Agent运行和项目初始化阶段检查取消状态
- 为不同工具和Agent类型设置合理的超时时间
- 使用asyncio实现取消检查和超时控制
- 优化取消响应速度，减少资源浪费

											
										
										
											2025-12-16 17:31:29 +08:00
+								                        run_task.cancel()
-												feat: enhance Gitea support and merge upstream v3.0.0

- Merge upstream v3.0.0 changes
- Fix security vulnerabilities (SSRF, Path Traversal) by introducing `parse_repository_url` utility
- Fix token leakage and handling in `scanner.py` and `projects.py`
- Fix `NameError` in `scanner.py`
- Fix `frontend/docker-entrypoint.sh` API URL escaping
- Standardize Gitea token naming to `gitea_token`

											
										
										
											2025-12-17 11:02:42 +08:00
+								                        try:
 								                            await run_task
 								                        except asyncio.CancelledError:
 								                            pass
-												feat(agent): 实现任务取消和超时处理机制

添加对Agent任务的取消和超时处理支持，包括：
- 在工具执行、子Agent运行和项目初始化阶段检查取消状态
- 为不同工具和Agent类型设置合理的超时时间
- 使用asyncio实现取消检查和超时控制
- 优化取消响应速度，减少资源浪费

											
										
										
											2025-12-16 17:31:29 +08:00
+								                    raise
 								            try:
 								                result = await asyncio.wait_for(
 								                    run_with_cancel_check(),
 								                    timeout=timeout
 								                )
 								            except asyncio.TimeoutError:
 								                logger.warning(f"[{self.name}] Sub-agent {agent_name} timed out after {timeout}s")
 								                return f"## {agent_name} Agent 执行超时\n\n子 Agent 执行超过 {timeout} 秒，已强制终止。请尝试更具体的任务或使用其他 Agent。"
 								            except asyncio.CancelledError:
 								                logger.info(f"[{self.name}] Sub-agent {agent_name} was cancelled")
 								                return f"## {agent_name} Agent 执行取消\n\n任务已被用户取消"
-												feat(agent): implement comprehensive agent architecture with knowledge base and persistence layer

- Add database migrations for agent checkpoints and tree node tracking
- Implement core agent execution framework with executor, state management, and message handling
- Create knowledge base system with framework-specific modules (Django, FastAPI, Flask, Express, React, Supabase)
- Add vulnerability knowledge modules covering authentication, cryptography, injection, XSS, XXE, SSRF, path traversal, deserialization, and race conditions
- Introduce new agent tools: thinking tool, reporting tool, and agent-specific utilities
- Implement LLM memory compression and prompt caching for improved performance
- Add agent registry and persistence layer for checkpoint management
- Refactor agent implementations (analysis, recon, verification, orchestrator) with enhanced capabilities
- Remove legacy agent implementations (analysis_v2, react_agent)
- Update API endpoints for agent task creation and project management
- Add frontend components for agent task creation and enhanced audit UI
- Consolidate agent service architecture with improved separation of concerns
- This refactoring provides a scalable foundation for multi-agent collaboration with knowledge-driven decision making and state persistence

											
										
										
											2025-12-12 15:27:12 +08:00
+								            # 🔥 执行后再次检查取消状态
 								            if self.is_cancelled:
 								                return f"## {agent_name} Agent 执行中断\n\n任务已被用户取消"
-												feat(agent): 新增多语言代码测试和漏洞验证工具并增强错误处理

新增 PHP、Python、JavaScript 等多语言代码测试工具和命令注入、SQL 注入等专用漏洞验证工具
优化错误处理逻辑，提供更详细的错误信息和堆栈跟踪
增强 JSON 解析器，优先使用 json-repair 库处理复杂格式
改进 Agent 响应解析逻辑，更健壮地提取思考内容和操作指令
完善沙箱管理器的初始化和错误处理机制

											
										
										
											2025-12-14 17:20:54 +08:00
-												feat(agent): implement comprehensive agent architecture with knowledge base and persistence layer

- Add database migrations for agent checkpoints and tree node tracking
- Implement core agent execution framework with executor, state management, and message handling
- Create knowledge base system with framework-specific modules (Django, FastAPI, Flask, Express, React, Supabase)
- Add vulnerability knowledge modules covering authentication, cryptography, injection, XSS, XXE, SSRF, path traversal, deserialization, and race conditions
- Introduce new agent tools: thinking tool, reporting tool, and agent-specific utilities
- Implement LLM memory compression and prompt caching for improved performance
- Add agent registry and persistence layer for checkpoint management
- Refactor agent implementations (analysis, recon, verification, orchestrator) with enhanced capabilities
- Remove legacy agent implementations (analysis_v2, react_agent)
- Update API endpoints for agent task creation and project management
- Add frontend components for agent task creation and enhanced audit UI
- Consolidate agent service architecture with improved separation of concerns
- This refactoring provides a scalable foundation for multi-agent collaboration with knowledge-driven decision making and state persistence

											
										
										
											2025-12-12 15:27:12 +08:00
+								            # 🔥 处理子 Agent 结果 - 不同 Agent 返回不同的数据结构
-												feat(agent): 新增多语言代码测试和漏洞验证工具并增强错误处理

新增 PHP、Python、JavaScript 等多语言代码测试工具和命令注入、SQL 注入等专用漏洞验证工具
优化错误处理逻辑，提供更详细的错误信息和堆栈跟踪
增强 JSON 解析器，优先使用 json-repair 库处理复杂格式
改进 Agent 响应解析逻辑，更健壮地提取思考内容和操作指令
完善沙箱管理器的初始化和错误处理机制

											
										
										
											2025-12-14 17:20:54 +08:00
+								            # 🔥 DEBUG: 添加诊断日志
 								            logger.info(f"[Orchestrator] Processing {agent_name} result: success={result.success}, data_type={type(result.data).__name__}, data_keys={list(result.data.keys()) if isinstance(result.data, dict) else 'N/A'}")
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								            if result.success and result.data:
-												feat(agent): implement comprehensive agent architecture with knowledge base and persistence layer

- Add database migrations for agent checkpoints and tree node tracking
- Implement core agent execution framework with executor, state management, and message handling
- Create knowledge base system with framework-specific modules (Django, FastAPI, Flask, Express, React, Supabase)
- Add vulnerability knowledge modules covering authentication, cryptography, injection, XSS, XXE, SSRF, path traversal, deserialization, and race conditions
- Introduce new agent tools: thinking tool, reporting tool, and agent-specific utilities
- Implement LLM memory compression and prompt caching for improved performance
- Add agent registry and persistence layer for checkpoint management
- Refactor agent implementations (analysis, recon, verification, orchestrator) with enhanced capabilities
- Remove legacy agent implementations (analysis_v2, react_agent)
- Update API endpoints for agent task creation and project management
- Add frontend components for agent task creation and enhanced audit UI
- Consolidate agent service architecture with improved separation of concerns
- This refactoring provides a scalable foundation for multi-agent collaboration with knowledge-driven decision making and state persistence

											
										
										
											2025-12-12 15:27:12 +08:00
+								                data = result.data
-												feat: 新增安全工具集成和漏洞知识库扩展

- 添加 Bandit 和 Safety 安全工具到依赖项
- 新增 CSRF、业务逻辑和开放重定向漏洞知识文档
- 实现安全工具一键安装脚本和文档
- 改进模式匹配工具支持直接文件扫描
- 增强遥测模块和 Agent 审计功能
- 修复验证节点中 findings 合并逻辑
- 优化前端 Agent 审计界面和状态展示

											
										
										
											2025-12-13 12:35:03 +08:00
-												feat(agent): 新增多语言代码测试和漏洞验证工具并增强错误处理

新增 PHP、Python、JavaScript 等多语言代码测试工具和命令注入、SQL 注入等专用漏洞验证工具
优化错误处理逻辑，提供更详细的错误信息和堆栈跟踪
增强 JSON 解析器，优先使用 json-repair 库处理复杂格式
改进 Agent 响应解析逻辑，更健壮地提取思考内容和操作指令
完善沙箱管理器的初始化和错误处理机制

											
										
										
											2025-12-14 17:20:54 +08:00
+								                # 🔥 FIX: 保存 Agent 的完整结果，供后续 Agent 使用
 								                self._agent_results[agent_name] = data
 								                logger.info(f"[Orchestrator] Saved {agent_name} result with keys: {list(data.keys())}")
-												feat: 新增安全工具集成和漏洞知识库扩展

- 添加 Bandit 和 Safety 安全工具到依赖项
- 新增 CSRF、业务逻辑和开放重定向漏洞知识文档
- 实现安全工具一键安装脚本和文档
- 改进模式匹配工具支持直接文件扫描
- 增强遥测模块和 Agent 审计功能
- 修复验证节点中 findings 合并逻辑
- 优化前端 Agent 审计界面和状态展示

											
										
										
											2025-12-13 12:35:03 +08:00
+								                # 🔥 CRITICAL FIX: 收集发现 - 支持多种字段名
 								                # findings 字段通常来自 Analysis/Verification Agent
 								                # initial_findings 来自 Recon Agent
 								                raw_findings = data.get("findings", [])
-												feat(agent): 增强漏洞发现处理流程和前端兼容性

- 后端添加对旧事件类型'finding'的兼容支持
- 改进漏洞发现标准化和去重逻辑
- 新增PoC生成要求和相关字段
- 优化沙箱配置初始化流程
- 前端添加ADD_FINDING操作和状态管理
- 增强事件流处理和序列号过滤
- 改进历史事件加载和SSE连接逻辑
- 添加漏洞验证状态和PoC信息到报告

											
										
										
											2025-12-13 18:45:05 +08:00
+								                logger.info(f"[Orchestrator] {agent_name} returned data with {len(raw_findings)} findings in 'findings' field")
-												feat: 新增安全工具集成和漏洞知识库扩展

- 添加 Bandit 和 Safety 安全工具到依赖项
- 新增 CSRF、业务逻辑和开放重定向漏洞知识文档
- 实现安全工具一键安装脚本和文档
- 改进模式匹配工具支持直接文件扫描
- 增强遥测模块和 Agent 审计功能
- 修复验证节点中 findings 合并逻辑
- 优化前端 Agent 审计界面和状态展示

											
										
										
											2025-12-13 12:35:03 +08:00
-												feat(agent): 增强漏洞发现处理流程和前端兼容性

- 后端添加对旧事件类型'finding'的兼容支持
- 改进漏洞发现标准化和去重逻辑
- 新增PoC生成要求和相关字段
- 优化沙箱配置初始化流程
- 前端添加ADD_FINDING操作和状态管理
- 增强事件流处理和序列号过滤
- 改进历史事件加载和SSE连接逻辑
- 添加漏洞验证状态和PoC信息到报告

											
										
										
											2025-12-13 18:45:05 +08:00
+								                # 🔥 ENHANCED: Also check for initial_findings (from Recon) - 改进逻辑
 								                # 即使 findings 为空列表，也检查 initial_findings
 								                if "initial_findings" in data:
-												feat: 新增安全工具集成和漏洞知识库扩展

- 添加 Bandit 和 Safety 安全工具到依赖项
- 新增 CSRF、业务逻辑和开放重定向漏洞知识文档
- 实现安全工具一键安装脚本和文档
- 改进模式匹配工具支持直接文件扫描
- 增强遥测模块和 Agent 审计功能
- 修复验证节点中 findings 合并逻辑
- 优化前端 Agent 审计界面和状态展示

											
										
										
											2025-12-13 12:35:03 +08:00
+								                    initial = data.get("initial_findings", [])
-												feat(agent): 新增多语言代码测试和漏洞验证工具并增强错误处理

新增 PHP、Python、JavaScript 等多语言代码测试工具和命令注入、SQL 注入等专用漏洞验证工具
优化错误处理逻辑，提供更详细的错误信息和堆栈跟踪
增强 JSON 解析器，优先使用 json-repair 库处理复杂格式
改进 Agent 响应解析逻辑，更健壮地提取思考内容和操作指令
完善沙箱管理器的初始化和错误处理机制

											
										
										
											2025-12-14 17:20:54 +08:00
+								                    logger.info(f"[Orchestrator] {agent_name} has {len(initial)} initial_findings, types: {[type(f).__name__ for f in initial[:3]]}")
-												feat: 新增安全工具集成和漏洞知识库扩展

- 添加 Bandit 和 Safety 安全工具到依赖项
- 新增 CSRF、业务逻辑和开放重定向漏洞知识文档
- 实现安全工具一键安装脚本和文档
- 改进模式匹配工具支持直接文件扫描
- 增强遥测模块和 Agent 审计功能
- 修复验证节点中 findings 合并逻辑
- 优化前端 Agent 审计界面和状态展示

											
										
										
											2025-12-13 12:35:03 +08:00
+								                    for f in initial:
 								                        if isinstance(f, dict):
-												feat(agent): 增强漏洞发现处理流程和前端兼容性

- 后端添加对旧事件类型'finding'的兼容支持
- 改进漏洞发现标准化和去重逻辑
- 新增PoC生成要求和相关字段
- 优化沙箱配置初始化流程
- 前端添加ADD_FINDING操作和状态管理
- 增强事件流处理和序列号过滤
- 改进历史事件加载和SSE连接逻辑
- 添加漏洞验证状态和PoC信息到报告

											
										
										
											2025-12-13 18:45:05 +08:00
+								                            # 🔥 Normalize finding format - 处理 Recon 返回的格式
 								                            normalized = self._normalize_finding(f)
 								                            if normalized not in raw_findings:
 								                                raw_findings.append(normalized)
-												feat(agent): 新增多语言代码测试和漏洞验证工具并增强错误处理

新增 PHP、Python、JavaScript 等多语言代码测试工具和命令注入、SQL 注入等专用漏洞验证工具
优化错误处理逻辑，提供更详细的错误信息和堆栈跟踪
增强 JSON 解析器，优先使用 json-repair 库处理复杂格式
改进 Agent 响应解析逻辑，更健壮地提取思考内容和操作指令
完善沙箱管理器的初始化和错误处理机制

											
										
										
											2025-12-14 17:20:54 +08:00
+								                                logger.info(f"[Orchestrator] Added dict finding from initial_findings")
 								                        elif isinstance(f, str) and f.strip():
 								                            # 🔥 FIX: Convert string finding to dict format instead of skipping
 								                            # Recon Agent 有时候会返回字符串格式的发现
 								                            # 尝试从字符串中提取文件路径（格式如 "app.py:36 - 描述"）
 								                            file_path = ""
 								                            line_start = 0
 								                            if ":" in f:
 								                                parts = f.split(":", 1)
 								                                potential_file = parts[0].strip()
 								                                # 检查是否像文件路径
 								                                if "." in potential_file and "/" not in potential_file[:3]:
 								                                    file_path = potential_file
 								                                    # 尝试提取行号
 								                                    if len(parts) > 1:
 								                                        remaining = parts[1].strip()
 								                                        line_match = remaining.split()[0] if remaining else ""
 								                                        if line_match.isdigit():
 								                                            line_start = int(line_match)
 								                            string_finding = {
 								                                "title": f[:100] if len(f) > 100 else f,
 								                                "description": f,
 								                                "file_path": file_path,
 								                                "line_start": line_start,
 								                                "severity": "medium",  # 默认中等严重度，Analysis 会重新评估
 								                                "vulnerability_type": "potential_issue",
 								                                "source": "recon",
 								                                "needs_verification": True,
 								                                "confidence": 0.5,  # 较低置信度，需要进一步分析
 								                            }
 								                            logger.info(f"[Orchestrator] Converted string finding to dict: {f[:80]}... (file={file_path}, line={line_start})")
 								                            raw_findings.append(string_finding)
 								                else:
 								                    logger.info(f"[Orchestrator] {agent_name} has no 'initial_findings' key in data")
-												feat(agent): 增强漏洞发现处理流程和前端兼容性

- 后端添加对旧事件类型'finding'的兼容支持
- 改进漏洞发现标准化和去重逻辑
- 新增PoC生成要求和相关字段
- 优化沙箱配置初始化流程
- 前端添加ADD_FINDING操作和状态管理
- 增强事件流处理和序列号过滤
- 改进历史事件加载和SSE连接逻辑
- 添加漏洞验证状态和PoC信息到报告

											
										
										
											2025-12-13 18:45:05 +08:00
 								                # 🔥 Also check high_risk_areas from Recon for potential findings
 								                if agent_name == "recon" and "high_risk_areas" in data:
 								                    high_risk = data.get("high_risk_areas", [])
 								                    logger.info(f"[Orchestrator] {agent_name} identified {len(high_risk)} high risk areas")
-												feat(agent): 新增多语言代码测试和漏洞验证工具并增强错误处理

新增 PHP、Python、JavaScript 等多语言代码测试工具和命令注入、SQL 注入等专用漏洞验证工具
优化错误处理逻辑，提供更详细的错误信息和堆栈跟踪
增强 JSON 解析器，优先使用 json-repair 库处理复杂格式
改进 Agent 响应解析逻辑，更健壮地提取思考内容和操作指令
完善沙箱管理器的初始化和错误处理机制

											
										
										
											2025-12-14 17:20:54 +08:00
+								                    # 🔥 FIX: 将 high_risk_areas 也转换为发现
 								                    for area in high_risk:
 								                        if isinstance(area, str) and area.strip():
 								                            # 尝试从描述中提取文件路径和漏洞类型
 								                            file_path = ""
 								                            line_start = 0
 								                            vuln_type = "potential_issue"
 								                            # 🔥 FIX: 改进文件路径提取逻辑
 								                            # 格式1: "file.py:36 - 描述" -> 提取 file.py 和 36
 								                            # 格式2: "描述性文本" -> 不提取文件路径
 								                            if ":" in area:
 								                                parts = area.split(":", 1)
 								                                potential_file = parts[0].strip()
 								                                # 只有当 parts[0] 看起来像文件路径时才提取
 								                                # 文件路径通常包含 . 且没有空格（或只在结尾有扩展名）
 								                                if ("." in potential_file and
 								                                    " " not in potential_file and
 								                                    len(potential_file) < 100 and
 								                                    any(potential_file.endswith(ext) for ext in ['.py', '.js', '.ts', '.java', '.go', '.php', '.rb', '.c', '.cpp', '.h'])):
 								                                    file_path = potential_file
 								                                    # 尝试提取行号
 								                                    if len(parts) > 1:
 								                                        remaining = parts[1].strip()
 								                                        line_match = remaining.split()[0] if remaining else ""
 								                                        if line_match.isdigit():
 								                                            line_start = int(line_match)
 								                            # 推断漏洞类型
 								                            area_lower = area.lower()
 								                            if "command" in area_lower or "命令" in area_lower or "subprocess" in area_lower:
 								                                vuln_type = "command_injection"
 								                            elif "sql" in area_lower:
 								                                vuln_type = "sql_injection"
 								                            elif "xss" in area_lower:
 								                                vuln_type = "xss"
 								                            elif "path" in area_lower or "traversal" in area_lower or "路径" in area_lower:
 								                                vuln_type = "path_traversal"
 								                            elif "ssrf" in area_lower:
 								                                vuln_type = "ssrf"
 								                            elif "secret" in area_lower or "密钥" in area_lower or "key" in area_lower:
 								                                vuln_type = "hardcoded_secret"
 								                            high_risk_finding = {
 								                                "title": area[:100] if len(area) > 100 else area,
 								                                "description": area,
 								                                "file_path": file_path,
 								                                "line_start": line_start,
 								                                "severity": "high",  # 高风险区域默认高严重度
 								                                "vulnerability_type": vuln_type,
 								                                "source": "recon_high_risk",
 								                                "needs_verification": True,
 								                                "confidence": 0.6,
 								                            }
 								                            raw_findings.append(high_risk_finding)
 								                            logger.info(f"[Orchestrator] Converted high_risk_area to finding: {area[:60]}... (file={file_path}, type={vuln_type})")
 								                # 🔥 初始化 valid_findings，确保后续代码可以访问
 								                valid_findings = []
-												feat: 新增安全工具集成和漏洞知识库扩展

- 添加 Bandit 和 Safety 安全工具到依赖项
- 新增 CSRF、业务逻辑和开放重定向漏洞知识文档
- 实现安全工具一键安装脚本和文档
- 改进模式匹配工具支持直接文件扫描
- 增强遥测模块和 Agent 审计功能
- 修复验证节点中 findings 合并逻辑
- 优化前端 Agent 审计界面和状态展示

											
										
										
											2025-12-13 12:35:03 +08:00
 								                if raw_findings:
-												feat(agent): implement comprehensive agent architecture with knowledge base and persistence layer

- Add database migrations for agent checkpoints and tree node tracking
- Implement core agent execution framework with executor, state management, and message handling
- Create knowledge base system with framework-specific modules (Django, FastAPI, Flask, Express, React, Supabase)
- Add vulnerability knowledge modules covering authentication, cryptography, injection, XSS, XXE, SSRF, path traversal, deserialization, and race conditions
- Introduce new agent tools: thinking tool, reporting tool, and agent-specific utilities
- Implement LLM memory compression and prompt caching for improved performance
- Add agent registry and persistence layer for checkpoint management
- Refactor agent implementations (analysis, recon, verification, orchestrator) with enhanced capabilities
- Remove legacy agent implementations (analysis_v2, react_agent)
- Update API endpoints for agent task creation and project management
- Add frontend components for agent task creation and enhanced audit UI
- Consolidate agent service architecture with improved separation of concerns
- This refactoring provides a scalable foundation for multi-agent collaboration with knowledge-driven decision making and state persistence

											
										
										
											2025-12-12 15:27:12 +08:00
+								                    # 只添加字典格式的发现
-												feat: 新增安全工具集成和漏洞知识库扩展

- 添加 Bandit 和 Safety 安全工具到依赖项
- 新增 CSRF、业务逻辑和开放重定向漏洞知识文档
- 实现安全工具一键安装脚本和文档
- 改进模式匹配工具支持直接文件扫描
- 增强遥测模块和 Agent 审计功能
- 修复验证节点中 findings 合并逻辑
- 优化前端 Agent 审计界面和状态展示

											
										
										
											2025-12-13 12:35:03 +08:00
+								                    valid_findings = [f for f in raw_findings if isinstance(f, dict)]
 								                    logger.info(f"[Orchestrator] {agent_name} returned {len(valid_findings)} valid findings")
-												feat(agent): 增强漏洞发现处理流程和前端兼容性

- 后端添加对旧事件类型'finding'的兼容支持
- 改进漏洞发现标准化和去重逻辑
- 新增PoC生成要求和相关字段
- 优化沙箱配置初始化流程
- 前端添加ADD_FINDING操作和状态管理
- 增强事件流处理和序列号过滤
- 改进历史事件加载和SSE连接逻辑
- 添加漏洞验证状态和PoC信息到报告

											
										
										
											2025-12-13 18:45:05 +08:00
+								                    # 🔥 ENHANCED: Merge findings with better deduplication
-												feat: 新增安全工具集成和漏洞知识库扩展

- 添加 Bandit 和 Safety 安全工具到依赖项
- 新增 CSRF、业务逻辑和开放重定向漏洞知识文档
- 实现安全工具一键安装脚本和文档
- 改进模式匹配工具支持直接文件扫描
- 增强遥测模块和 Agent 审计功能
- 修复验证节点中 findings 合并逻辑
- 优化前端 Agent 审计界面和状态展示

											
										
										
											2025-12-13 12:35:03 +08:00
+								                    for new_f in valid_findings:
-												feat(agent): 增强漏洞发现处理流程和前端兼容性

- 后端添加对旧事件类型'finding'的兼容支持
- 改进漏洞发现标准化和去重逻辑
- 新增PoC生成要求和相关字段
- 优化沙箱配置初始化流程
- 前端添加ADD_FINDING操作和状态管理
- 增强事件流处理和序列号过滤
- 改进历史事件加载和SSE连接逻辑
- 添加漏洞验证状态和PoC信息到报告

											
										
										
											2025-12-13 18:45:05 +08:00
+								                        # Normalize the finding first
 								                        normalized_new = self._normalize_finding(new_f)
-												Fix capitalization issues and handle cases where the answer is "none".

											
										
										
											2026-01-12 14:04:12 +08:00
 								                        # 🔥 FIX: Skip if normalization returned None (e.g., file path validation failed)
 								                        if normalized_new is None:
 								                            logger.debug(f"[Orchestrator] Skipping invalid finding: {new_f.get('title', 'N/A')[:50]}")
 								                            continue
-												feat(agent): 增强漏洞发现处理流程和前端兼容性

- 后端添加对旧事件类型'finding'的兼容支持
- 改进漏洞发现标准化和去重逻辑
- 新增PoC生成要求和相关字段
- 优化沙箱配置初始化流程
- 前端添加ADD_FINDING操作和状态管理
- 增强事件流处理和序列号过滤
- 改进历史事件加载和SSE连接逻辑
- 添加漏洞验证状态和PoC信息到报告

											
										
										
											2025-12-13 18:45:05 +08:00
 								                        # Create fingerprint for deduplication (file + description similarity)
 								                        new_file = normalized_new.get("file_path", "").lower().strip()
 								                        new_desc = (normalized_new.get("description", "") or "").lower()[:100]
 								                        new_type = (normalized_new.get("vulnerability_type", "") or "").lower()
 								                        new_line = normalized_new.get("line_start") or normalized_new.get("line", 0)
 								                        # Check if exists (more flexible matching)
-												feat: 新增安全工具集成和漏洞知识库扩展

- 添加 Bandit 和 Safety 安全工具到依赖项
- 新增 CSRF、业务逻辑和开放重定向漏洞知识文档
- 实现安全工具一键安装脚本和文档
- 改进模式匹配工具支持直接文件扫描
- 增强遥测模块和 Agent 审计功能
- 修复验证节点中 findings 合并逻辑
- 优化前端 Agent 审计界面和状态展示

											
										
										
											2025-12-13 12:35:03 +08:00
+								                        found = False
 								                        for i, existing_f in enumerate(self._all_findings):
-												feat(agent): 增强漏洞发现处理流程和前端兼容性

- 后端添加对旧事件类型'finding'的兼容支持
- 改进漏洞发现标准化和去重逻辑
- 新增PoC生成要求和相关字段
- 优化沙箱配置初始化流程
- 前端添加ADD_FINDING操作和状态管理
- 增强事件流处理和序列号过滤
- 改进历史事件加载和SSE连接逻辑
- 添加漏洞验证状态和PoC信息到报告

											
										
										
											2025-12-13 18:45:05 +08:00
+								                            existing_file = (existing_f.get("file_path", "") or existing_f.get("file", "")).lower().strip()
 								                            existing_desc = (existing_f.get("description", "") or "").lower()[:100]
 								                            existing_type = (existing_f.get("vulnerability_type", "") or existing_f.get("type", "")).lower()
 								                            existing_line = existing_f.get("line_start") or existing_f.get("line", 0)
 								                            # Match if same file AND (same line OR similar description OR same vulnerability type)
 								                            same_file = new_file and existing_file and (
 								                                new_file == existing_file or
 								                                new_file.endswith(existing_file) or
 								                                existing_file.endswith(new_file)
-												feat: 新增安全工具集成和漏洞知识库扩展

- 添加 Bandit 和 Safety 安全工具到依赖项
- 新增 CSRF、业务逻辑和开放重定向漏洞知识文档
- 实现安全工具一键安装脚本和文档
- 改进模式匹配工具支持直接文件扫描
- 增强遥测模块和 Agent 审计功能
- 修复验证节点中 findings 合并逻辑
- 优化前端 Agent 审计界面和状态展示

											
										
										
											2025-12-13 12:35:03 +08:00
+								                            )
-												feat(agent): 增强漏洞发现处理流程和前端兼容性

- 后端添加对旧事件类型'finding'的兼容支持
- 改进漏洞发现标准化和去重逻辑
- 新增PoC生成要求和相关字段
- 优化沙箱配置初始化流程
- 前端添加ADD_FINDING操作和状态管理
- 增强事件流处理和序列号过滤
- 改进历史事件加载和SSE连接逻辑
- 添加漏洞验证状态和PoC信息到报告

											
										
										
											2025-12-13 18:45:05 +08:00
+								                            same_line = new_line and existing_line and new_line == existing_line
 								                            similar_desc = new_desc and existing_desc and (
 								                                new_desc in existing_desc or existing_desc in new_desc
 								                            )
 								                            same_type = new_type and existing_type and (
 								                                new_type == existing_type or
 								                                (new_type in existing_type) or (existing_type in new_type)
 								                            )
 								                            if same_file and (same_line or similar_desc or same_type):
-												feat: 新增安全工具集成和漏洞知识库扩展

- 添加 Bandit 和 Safety 安全工具到依赖项
- 新增 CSRF、业务逻辑和开放重定向漏洞知识文档
- 实现安全工具一键安装脚本和文档
- 改进模式匹配工具支持直接文件扫描
- 增强遥测模块和 Agent 审计功能
- 修复验证节点中 findings 合并逻辑
- 优化前端 Agent 审计界面和状态展示

											
										
										
											2025-12-13 12:35:03 +08:00
+								                                # Update existing with new info (e.g. verification results)
-												feat: enhance Gitea support and merge upstream v3.0.0

- Merge upstream v3.0.0 changes
- Fix security vulnerabilities (SSRF, Path Traversal) by introducing `parse_repository_url` utility
- Fix token leakage and handling in `scanner.py` and `projects.py`
- Fix `NameError` in `scanner.py`
- Fix `frontend/docker-entrypoint.sh` API URL escaping
- Standardize Gitea token naming to `gitea_token`

											
										
										
											2025-12-17 11:02:42 +08:00
+								                                # 🔥 FIX: Smart merge - don't overwrite good data with empty values
 								                                merged = dict(existing_f)  # Start with existing data
 								                                for key, value in normalized_new.items():
 								                                    # Only overwrite if new value is meaningful
 								                                    if value is not None and value != "" and value != 0:
 								                                        merged[key] = value
 								                                    elif key not in merged or merged[key] is None:
 								                                        # Fill in missing fields even with empty values
 								                                        merged[key] = value
-												feat(agent): 增强漏洞发现处理流程和前端兼容性

- 后端添加对旧事件类型'finding'的兼容支持
- 改进漏洞发现标准化和去重逻辑
- 新增PoC生成要求和相关字段
- 优化沙箱配置初始化流程
- 前端添加ADD_FINDING操作和状态管理
- 增强事件流处理和序列号过滤
- 改进历史事件加载和SSE连接逻辑
- 添加漏洞验证状态和PoC信息到报告

											
										
										
											2025-12-13 18:45:05 +08:00
+								                                # Keep the better title
 								                                if normalized_new.get("title") and len(normalized_new.get("title", "")) > len(existing_f.get("title", "")):
 								                                    merged["title"] = normalized_new["title"]
 								                                # Keep verified status if either is verified
 								                                if existing_f.get("is_verified") or normalized_new.get("is_verified"):
 								                                    merged["is_verified"] = True
-												feat: enhance Gitea support and merge upstream v3.0.0

- Merge upstream v3.0.0 changes
- Fix security vulnerabilities (SSRF, Path Traversal) by introducing `parse_repository_url` utility
- Fix token leakage and handling in `scanner.py` and `projects.py`
- Fix `NameError` in `scanner.py`
- Fix `frontend/docker-entrypoint.sh` API URL escaping
- Standardize Gitea token naming to `gitea_token`

											
										
										
											2025-12-17 11:02:42 +08:00
+								                                # 🔥 FIX: Preserve non-zero line numbers
 								                                if existing_f.get("line_start") and not normalized_new.get("line_start"):
 								                                    merged["line_start"] = existing_f["line_start"]
 								                                # 🔥 FIX: Preserve vulnerability_type
 								                                if existing_f.get("vulnerability_type") and not normalized_new.get("vulnerability_type"):
 								                                    merged["vulnerability_type"] = existing_f["vulnerability_type"]
-												feat(agent): 增强漏洞发现处理流程和前端兼容性

- 后端添加对旧事件类型'finding'的兼容支持
- 改进漏洞发现标准化和去重逻辑
- 新增PoC生成要求和相关字段
- 优化沙箱配置初始化流程
- 前端添加ADD_FINDING操作和状态管理
- 增强事件流处理和序列号过滤
- 改进历史事件加载和SSE连接逻辑
- 添加漏洞验证状态和PoC信息到报告

											
										
										
											2025-12-13 18:45:05 +08:00
+								                                self._all_findings[i] = merged
-												feat: 新增安全工具集成和漏洞知识库扩展

- 添加 Bandit 和 Safety 安全工具到依赖项
- 新增 CSRF、业务逻辑和开放重定向漏洞知识文档
- 实现安全工具一键安装脚本和文档
- 改进模式匹配工具支持直接文件扫描
- 增强遥测模块和 Agent 审计功能
- 修复验证节点中 findings 合并逻辑
- 优化前端 Agent 审计界面和状态展示

											
										
										
											2025-12-13 12:35:03 +08:00
+								                                found = True
-												feat: enhance Gitea support and merge upstream v3.0.0

- Merge upstream v3.0.0 changes
- Fix security vulnerabilities (SSRF, Path Traversal) by introducing `parse_repository_url` utility
- Fix token leakage and handling in `scanner.py` and `projects.py`
- Fix `NameError` in `scanner.py`
- Fix `frontend/docker-entrypoint.sh` API URL escaping
- Standardize Gitea token naming to `gitea_token`

											
										
										
											2025-12-17 11:02:42 +08:00
+								                                logger.info(f"[Orchestrator] Merged finding: {new_file}:{merged.get('line_start', 0)} ({merged.get('vulnerability_type', '')})")
-												feat: 新增安全工具集成和漏洞知识库扩展

- 添加 Bandit 和 Safety 安全工具到依赖项
- 新增 CSRF、业务逻辑和开放重定向漏洞知识文档
- 实现安全工具一键安装脚本和文档
- 改进模式匹配工具支持直接文件扫描
- 增强遥测模块和 Agent 审计功能
- 修复验证节点中 findings 合并逻辑
- 优化前端 Agent 审计界面和状态展示

											
										
										
											2025-12-13 12:35:03 +08:00
+								                                break
 								                        if not found:
-												feat(agent): 增强漏洞发现处理流程和前端兼容性

- 后端添加对旧事件类型'finding'的兼容支持
- 改进漏洞发现标准化和去重逻辑
- 新增PoC生成要求和相关字段
- 优化沙箱配置初始化流程
- 前端添加ADD_FINDING操作和状态管理
- 增强事件流处理和序列号过滤
- 改进历史事件加载和SSE连接逻辑
- 添加漏洞验证状态和PoC信息到报告

											
										
										
											2025-12-13 18:45:05 +08:00
+								                            self._all_findings.append(normalized_new)
 								                            logger.info(f"[Orchestrator] Added new finding: {new_file}:{new_line} ({new_type})")
-												feat: 新增安全工具集成和漏洞知识库扩展

- 添加 Bandit 和 Safety 安全工具到依赖项
- 新增 CSRF、业务逻辑和开放重定向漏洞知识文档
- 实现安全工具一键安装脚本和文档
- 改进模式匹配工具支持直接文件扫描
- 增强遥测模块和 Agent 审计功能
- 修复验证节点中 findings 合并逻辑
- 优化前端 Agent 审计界面和状态展示

											
										
										
											2025-12-13 12:35:03 +08:00
 								                    logger.info(f"[Orchestrator] Total findings now: {len(self._all_findings)}")
 								                else:
 								                    logger.info(f"[Orchestrator] {agent_name} returned no findings")
-												feat(agent): implement Agent audit module with LangGraph integration

- Introduce new Agent audit functionality for autonomous code security analysis and vulnerability verification.
- Add API endpoints for managing Agent tasks and configurations.
- Implement UI components for Agent mode selection and embedding model configuration.
- Enhance the overall architecture with a focus on RAG (Retrieval-Augmented Generation) for improved code semantic search.
- Create a sandbox environment for secure execution of vulnerability tests.
- Update documentation to include details on the new Agent audit features and usage instructions.

											
										
										
											2025-12-11 19:09:10 +08:00
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								                await self.emit_event(
 								                    "dispatch_complete",
-												feat(agent): implement comprehensive agent architecture with knowledge base and persistence layer

- Add database migrations for agent checkpoints and tree node tracking
- Implement core agent execution framework with executor, state management, and message handling
- Create knowledge base system with framework-specific modules (Django, FastAPI, Flask, Express, React, Supabase)
- Add vulnerability knowledge modules covering authentication, cryptography, injection, XSS, XXE, SSRF, path traversal, deserialization, and race conditions
- Introduce new agent tools: thinking tool, reporting tool, and agent-specific utilities
- Implement LLM memory compression and prompt caching for improved performance
- Add agent registry and persistence layer for checkpoint management
- Refactor agent implementations (analysis, recon, verification, orchestrator) with enhanced capabilities
- Remove legacy agent implementations (analysis_v2, react_agent)
- Update API endpoints for agent task creation and project management
- Add frontend components for agent task creation and enhanced audit UI
- Consolidate agent service architecture with improved separation of concerns
- This refactoring provides a scalable foundation for multi-agent collaboration with knowledge-driven decision making and state persistence

											
										
										
											2025-12-12 15:27:12 +08:00
+								                    f"✅ {agent_name} Agent 完成",
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								                    agent=agent_name,
-												feat: 新增安全工具集成和漏洞知识库扩展

- 添加 Bandit 和 Safety 安全工具到依赖项
- 新增 CSRF、业务逻辑和开放重定向漏洞知识文档
- 实现安全工具一键安装脚本和文档
- 改进模式匹配工具支持直接文件扫描
- 增强遥测模块和 Agent 审计功能
- 修复验证节点中 findings 合并逻辑
- 优化前端 Agent 审计界面和状态展示

											
										
										
											2025-12-13 12:35:03 +08:00
+								                    findings_count=len(self._all_findings),  # 🔥 Use total findings count
-												feat(agent): implement Agent audit module with LangGraph integration

- Introduce new Agent audit functionality for autonomous code security analysis and vulnerability verification.
- Add API endpoints for managing Agent tasks and configurations.
- Implement UI components for Agent mode selection and embedding model configuration.
- Enhance the overall architecture with a focus on RAG (Retrieval-Augmented Generation) for improved code semantic search.
- Create a sandbox environment for secure execution of vulnerability tests.
- Update documentation to include details on the new Agent audit features and usage instructions.

											
										
										
											2025-12-11 19:09:10 +08:00
+								                )
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
-												feat(agent): implement comprehensive agent architecture with knowledge base and persistence layer

- Add database migrations for agent checkpoints and tree node tracking
- Implement core agent execution framework with executor, state management, and message handling
- Create knowledge base system with framework-specific modules (Django, FastAPI, Flask, Express, React, Supabase)
- Add vulnerability knowledge modules covering authentication, cryptography, injection, XSS, XXE, SSRF, path traversal, deserialization, and race conditions
- Introduce new agent tools: thinking tool, reporting tool, and agent-specific utilities
- Implement LLM memory compression and prompt caching for improved performance
- Add agent registry and persistence layer for checkpoint management
- Refactor agent implementations (analysis, recon, verification, orchestrator) with enhanced capabilities
- Remove legacy agent implementations (analysis_v2, react_agent)
- Update API endpoints for agent task creation and project management
- Add frontend components for agent task creation and enhanced audit UI
- Consolidate agent service architecture with improved separation of concerns
- This refactoring provides a scalable foundation for multi-agent collaboration with knowledge-driven decision making and state persistence

											
										
										
											2025-12-12 15:27:12 +08:00
+								                # 🔥 根据 Agent 类型构建不同的观察结果
 								                if agent_name == "recon":
 								                    # Recon Agent 返回项目信息
 								                    observation = f"""## Recon Agent 执行结果
 								**状态**: 成功
 								**迭代次数**: {result.iterations}
 								**耗时**: {result.duration_ms}ms
 								### 项目结构
 								{json.dumps(data.get('project_structure', {}), ensure_ascii=False, indent=2)}
 								### 技术栈
 								- 语言: {data.get('tech_stack', {}).get('languages', [])}
 								- 框架: {data.get('tech_stack', {}).get('frameworks', [])}
 								- 数据库: {data.get('tech_stack', {}).get('databases', [])}
 								### 入口点 ({len(data.get('entry_points', []))} 个)
 								"""
 								                    for i, ep in enumerate(data.get('entry_points', [])[:10]):
 								                        if isinstance(ep, dict):
 								                            observation += f"{i+1}. [{ep.get('type', 'unknown')}] {ep.get('file', '')}:{ep.get('line', '')}\n"
 								                    observation += f"""
 								### 高风险区域
 								{data.get('high_risk_areas', [])}
 								### 初步发现 ({len(data.get('initial_findings', []))} 个)
 								"""
 								                    for finding in data.get('initial_findings', [])[:5]:
 								                        if isinstance(finding, str):
 								                            observation += f"- {finding}\n"
 								                        elif isinstance(finding, dict):
 								                            observation += f"- {finding.get('title', finding)}\n"
 								                else:
 								                    # Analysis/Verification Agent 返回漏洞发现
 								                    observation = f"""## {agent_name} Agent 执行结果
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
 								**状态**: 成功
-												feat(agent): 增强漏洞发现处理流程和前端兼容性

- 后端添加对旧事件类型'finding'的兼容支持
- 改进漏洞发现标准化和去重逻辑
- 新增PoC生成要求和相关字段
- 优化沙箱配置初始化流程
- 前端添加ADD_FINDING操作和状态管理
- 增强事件流处理和序列号过滤
- 改进历史事件加载和SSE连接逻辑
- 添加漏洞验证状态和PoC信息到报告

											
										
										
											2025-12-13 18:45:05 +08:00
+								**发现数量**: {len(valid_findings)}
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								**迭代次数**: {result.iterations}
 								**耗时**: {result.duration_ms}ms
 								### 发现摘要
 								"""
-												feat(agent): 增强漏洞发现处理流程和前端兼容性

- 后端添加对旧事件类型'finding'的兼容支持
- 改进漏洞发现标准化和去重逻辑
- 新增PoC生成要求和相关字段
- 优化沙箱配置初始化流程
- 前端添加ADD_FINDING操作和状态管理
- 增强事件流处理和序列号过滤
- 改进历史事件加载和SSE连接逻辑
- 添加漏洞验证状态和PoC信息到报告

											
										
										
											2025-12-13 18:45:05 +08:00
+								                    for i, f in enumerate(valid_findings[:10]):
-												feat(agent): implement comprehensive agent architecture with knowledge base and persistence layer

- Add database migrations for agent checkpoints and tree node tracking
- Implement core agent execution framework with executor, state management, and message handling
- Create knowledge base system with framework-specific modules (Django, FastAPI, Flask, Express, React, Supabase)
- Add vulnerability knowledge modules covering authentication, cryptography, injection, XSS, XXE, SSRF, path traversal, deserialization, and race conditions
- Introduce new agent tools: thinking tool, reporting tool, and agent-specific utilities
- Implement LLM memory compression and prompt caching for improved performance
- Add agent registry and persistence layer for checkpoint management
- Refactor agent implementations (analysis, recon, verification, orchestrator) with enhanced capabilities
- Remove legacy agent implementations (analysis_v2, react_agent)
- Update API endpoints for agent task creation and project management
- Add frontend components for agent task creation and enhanced audit UI
- Consolidate agent service architecture with improved separation of concerns
- This refactoring provides a scalable foundation for multi-agent collaboration with knowledge-driven decision making and state persistence

											
										
										
											2025-12-12 15:27:12 +08:00
+								                        if not isinstance(f, dict):
 								                            continue
 								                        observation += f"""
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								{i+1}. [{f.get('severity', 'unknown')}] {f.get('title', 'Unknown')}
 								   - 类型: {f.get('vulnerability_type', 'unknown')}
 								   - 文件: {f.get('file_path', 'unknown')}
 								   - 描述: {f.get('description', '')[:200]}...
 								"""
-												feat(agent): 增强漏洞发现处理流程和前端兼容性

- 后端添加对旧事件类型'finding'的兼容支持
- 改进漏洞发现标准化和去重逻辑
- 新增PoC生成要求和相关字段
- 优化沙箱配置初始化流程
- 前端添加ADD_FINDING操作和状态管理
- 增强事件流处理和序列号过滤
- 改进历史事件加载和SSE连接逻辑
- 添加漏洞验证状态和PoC信息到报告

											
										
										
											2025-12-13 18:45:05 +08:00
 								                    if len(valid_findings) > 10:
 								                        observation += f"\n... 还有 {len(valid_findings) - 10} 个发现"
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
-												feat(agent): implement comprehensive agent architecture with knowledge base and persistence layer

- Add database migrations for agent checkpoints and tree node tracking
- Implement core agent execution framework with executor, state management, and message handling
- Create knowledge base system with framework-specific modules (Django, FastAPI, Flask, Express, React, Supabase)
- Add vulnerability knowledge modules covering authentication, cryptography, injection, XSS, XXE, SSRF, path traversal, deserialization, and race conditions
- Introduce new agent tools: thinking tool, reporting tool, and agent-specific utilities
- Implement LLM memory compression and prompt caching for improved performance
- Add agent registry and persistence layer for checkpoint management
- Refactor agent implementations (analysis, recon, verification, orchestrator) with enhanced capabilities
- Remove legacy agent implementations (analysis_v2, react_agent)
- Update API endpoints for agent task creation and project management
- Add frontend components for agent task creation and enhanced audit UI
- Consolidate agent service architecture with improved separation of concerns
- This refactoring provides a scalable foundation for multi-agent collaboration with knowledge-driven decision making and state persistence

											
										
										
											2025-12-12 15:27:12 +08:00
+								                if data.get("summary"):
 								                    observation += f"\n\n### Agent 总结\n{data['summary']}"
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
 								                return observation
-												feat(agent): implement Agent audit module with LangGraph integration

- Introduce new Agent audit functionality for autonomous code security analysis and vulnerability verification.
- Add API endpoints for managing Agent tasks and configurations.
- Implement UI components for Agent mode selection and embedding model configuration.
- Enhance the overall architecture with a focus on RAG (Retrieval-Augmented Generation) for improved code semantic search.
- Create a sandbox environment for secure execution of vulnerability tests.
- Update documentation to include details on the new Agent audit features and usage instructions.

											
										
										
											2025-12-11 19:09:10 +08:00
+								            else:
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								                return f"## {agent_name} Agent 执行失败\n\n错误: {result.error}"
-												feat(agent): implement Agent audit module with LangGraph integration

- Introduce new Agent audit functionality for autonomous code security analysis and vulnerability verification.
- Add API endpoints for managing Agent tasks and configurations.
- Implement UI components for Agent mode selection and embedding model configuration.
- Enhance the overall architecture with a focus on RAG (Retrieval-Augmented Generation) for improved code semantic search.
- Create a sandbox environment for secure execution of vulnerability tests.
- Update documentation to include details on the new Agent audit features and usage instructions.

											
										
										
											2025-12-11 19:09:10 +08:00
 								        except Exception as e:
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								            logger.error(f"Sub-agent dispatch failed: {e}", exc_info=True)
 								            return f"## 调度失败\n\n错误: {str(e)}"
-												feat(agent): 增强文件路径验证防止幻觉报告

添加文件路径验证规则和检查逻辑，确保漏洞报告中的文件真实存在
移除LLM响应中的Markdown格式标记，统一解析处理
更新报告工具和端点以支持项目根目录验证

											
										
										
											2025-12-19 19:08:36 +08:00
 								    def _validate_file_path(self, file_path: str) -> bool:
 								        """
 								        Check whether a reported file path refers to an existing file.

 								        Args:
 								            file_path: Relative or absolute path; may carry a trailing
 								                line number such as "app.py:36".

 								        Returns:
 								            bool: False for a blank path. True when no ``project_root`` is
 								            present in the runtime context (nothing to check against, so
 								            the path is given the benefit of the doubt). Otherwise True
 								            only if the path exists as a file, either under the project
 								            root or as an absolute path.
 								        """
 								        # A missing or whitespace-only path can never name a file.
 								        if not (file_path and file_path.strip()):
 								            return False

 								        root = self._runtime_context.get("project_root", "")
 								        if not root:
 								            # Without a root we cannot verify; accept to avoid false rejections.
 								            return True

 								        # Keep only the text before the first colon (drops a ":<line>" suffix).
 								        candidate = file_path.partition(":")[0].strip()

 								        # First interpret the path relative to the project root ...
 								        if os.path.isfile(os.path.join(root, candidate)):
 								            return True

 								        # ... then fall back to treating it as an absolute path.
 								        return os.path.isabs(candidate) and os.path.isfile(candidate)
 								    def _normalize_finding(self, finding: Dict[str, Any]) -> Optional[Dict[str, Any]]:
 								        """
 								        Normalize a finding dict into the unified finding format.

 								        Different agents may return findings in different shapes; this
 								        method maps the alternative keys onto the canonical ones
 								        (``file_path``, ``line_start``, ``vulnerability_type``,
 								        ``severity``, ``title``, ``code_snippet``, ``suggestion``).
 								        The input dict is not mutated; a shallow copy is returned.

 								        Args:
 								            finding: Raw finding as produced by a sub-agent.

 								        Returns:
 								            The normalized finding, or None when its ``file_path`` fails
 								            ``_validate_file_path`` (the finding is treated as a
 								            hallucination and must be dropped by the caller).
 								        """
 								        normalized = dict(finding)  # work on a copy of the raw data

 								        # location ("path" or "path:line") -> file_path (+ line_start)
 								        if "location" in normalized and "file_path" not in normalized:
 								            location = normalized["location"]
 								            if isinstance(location, str) and ":" in location:
 								                parts = location.split(":")
 								                normalized["file_path"] = parts[0]
 								                try:
 								                    normalized["line_start"] = int(parts[1])
 								                except (ValueError, IndexError):
 								                    # Best effort: a non-numeric suffix just means no line number.
 								                    pass
 								            elif isinstance(location, str):
 								                normalized["file_path"] = location

 								        # file -> file_path
 								        if "file" in normalized and "file_path" not in normalized:
 								            normalized["file_path"] = normalized["file"]

 								        # line -> line_start
 								        if "line" in normalized and "line_start" not in normalized:
 								            normalized["line_start"] = normalized["line"]

 								        # type -> vulnerability_type
 								        if "type" in normalized and "vulnerability_type" not in normalized:
 								            # Not every "type" is a vulnerability class; values such as
 								            # "Vulnerability" are only generic markers.
 								            type_val = normalized["type"]
 								            if type_val and type_val.lower() not in ["vulnerability", "finding", "issue"]:
 								                normalized["vulnerability_type"] = type_val
 								            elif "description" in normalized:
 								                # Try to infer the class from the description. A None
 								                # description is treated as empty instead of raising.
 								                desc = str(normalized["description"] or "").lower()
 								                # Ordered: the first rule with a matching keyword wins.
 								                inference_rules = (
 								                    (("command injection", "rce", "system("), "command_injection"),
 								                    (("sql injection", "sqli"), "sql_injection"),
 								                    (("xss", "cross-site scripting"), "xss"),
 								                    (("path traversal", "directory traversal"), "path_traversal"),
 								                    (("ssrf",), "ssrf"),
 								                    (("xxe",), "xxe"),
 								                )
 								                inferred = "other"
 								                for keywords, vuln_name in inference_rules:
 								                    if any(keyword in desc for keyword in keywords):
 								                        inferred = vuln_name
 								                        break
 								                normalized["vulnerability_type"] = inferred

 								        # severity: prefer an explicit severity, then fall back to "risk",
 								        # then to "medium". The fallback to "risk" must be evaluated BEFORE
 								        # the default is applied, otherwise it can never take effect.
 								        # A None/empty severity is treated the same as a missing one.
 								        raw_severity = normalized.get("severity") or normalized.get("risk") or "medium"
 								        normalized["severity"] = str(raw_severity).lower()

 								        # Generate a title when none was supplied.
 								        if "title" not in normalized:
 								            vuln_type = normalized.get("vulnerability_type", "Unknown")
 								            pretty_type = vuln_type.replace('_', ' ').title()
 								            file_path = normalized.get("file_path", "")
 								            if file_path:
 								                normalized["title"] = f"{pretty_type} in {os.path.basename(file_path)}"
 								            else:
 								                normalized["title"] = f"{pretty_type} Vulnerability"

 								        # code -> code_snippet
 								        if "code" in normalized and "code_snippet" not in normalized:
 								            normalized["code_snippet"] = normalized["code"]

 								        # recommendation -> suggestion
 								        if "recommendation" in normalized and "suggestion" not in normalized:
 								            normalized["suggestion"] = normalized["recommendation"]

 								        # impact -> appended to the description unless it already mentions it
 								        if "impact" in normalized and normalized.get("description"):
 								            if "impact" not in normalized["description"].lower():
 								                normalized["description"] += f"\n\nImpact: {normalized['impact']}"

 								        # Reject findings whose file does not exist (likely hallucinated).
 								        file_path = normalized.get("file_path", "")
 								        if file_path and not self._validate_file_path(file_path):
 								            logger.warning(
 								                f"[Orchestrator] 🚫 过滤幻觉发现: 文件不存在 '{file_path}' "
 								                f"(title: {normalized.get('title', 'N/A')[:50]})"
 								            )
 								            return None  # None signals an invalid finding

 								        return normalized
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								    def _summarize_findings(self) -> str:
 								        """汇总当前发现"""
 								        if not self._all_findings:
 								            return "目前还没有发现任何漏洞。"
-												feat(agent): implement Agent audit module with LangGraph integration

- Introduce new Agent audit functionality for autonomous code security analysis and vulnerability verification.
- Add API endpoints for managing Agent tasks and configurations.
- Implement UI components for Agent mode selection and embedding model configuration.
- Enhance the overall architecture with a focus on RAG (Retrieval-Augmented Generation) for improved code semantic search.
- Create a sandbox environment for secure execution of vulnerability tests.
- Update documentation to include details on the new Agent audit features and usage instructions.

											
										
										
											2025-12-11 19:09:10 +08:00
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								        # 统计
-												feat(agent): implement Agent audit module with LangGraph integration

- Introduce new Agent audit functionality for autonomous code security analysis and vulnerability verification.
- Add API endpoints for managing Agent tasks and configurations.
- Implement UI components for Agent mode selection and embedding model configuration.
- Enhance the overall architecture with a focus on RAG (Retrieval-Augmented Generation) for improved code semantic search.
- Create a sandbox environment for secure execution of vulnerability tests.
- Update documentation to include details on the new Agent audit features and usage instructions.

											
										
										
											2025-12-11 19:09:10 +08:00
+								        severity_counts = {"critical": 0, "high": 0, "medium": 0, "low": 0}
 								        type_counts = {}
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								        for f in self._all_findings:
-												feat(agent): enhance streaming with in-memory event manager and fallback polling

- Implement dual-mode streaming: prioritize in-memory EventManager for running tasks with thinking_token support
- Add fallback to database polling for completed tasks without thinking_token replay capability
- Introduce SSE event formatter utility for consistent event serialization across streaming modes
- Add 10ms micro-delay for thinking_token events to ensure proper TCP packet separation and frontend incremental rendering
- Refactor stream_agent_with_thinking endpoint to support both runtime and historical event streaming
- Update event filtering logic to handle both in-memory and database event sources
- Improve logging with debug markers for thinking_token tracking and stream mode selection
- Optimize polling intervals: 0.3s for running tasks, 2.0s for completed tasks
- Reduce idle timeout from 10 minutes to 1 minute for completed task streams
- Update frontend useAgentStream hook to handle unified event format from dual-mode streaming
- Enhance AgentAudit UI to properly display streamed events from both sources

											
										
										
											2025-12-12 10:39:32 +08:00
+								            if not isinstance(f, dict):
 								                continue
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								            sev = f.get("severity", "low")
-												feat(agent): implement Agent audit module with LangGraph integration

- Introduce new Agent audit functionality for autonomous code security analysis and vulnerability verification.
- Add API endpoints for managing Agent tasks and configurations.
- Implement UI components for Agent mode selection and embedding model configuration.
- Enhance the overall architecture with a focus on RAG (Retrieval-Augmented Generation) for improved code semantic search.
- Create a sandbox environment for secure execution of vulnerability tests.
- Update documentation to include details on the new Agent audit features and usage instructions.

											
										
										
											2025-12-11 19:09:10 +08:00
+								            severity_counts[sev] = severity_counts.get(sev, 0) + 1
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								            vtype = f.get("vulnerability_type", "other")
-												feat(agent): implement Agent audit module with LangGraph integration

- Introduce new Agent audit functionality for autonomous code security analysis and vulnerability verification.
- Add API endpoints for managing Agent tasks and configurations.
- Implement UI components for Agent mode selection and embedding model configuration.
- Enhance the overall architecture with a focus on RAG (Retrieval-Augmented Generation) for improved code semantic search.
- Create a sandbox environment for secure execution of vulnerability tests.
- Update documentation to include details on the new Agent audit features and usage instructions.

											
										
										
											2025-12-11 19:09:10 +08:00
+								            type_counts[vtype] = type_counts.get(vtype, 0) + 1
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
+								        summary = f"""## 当前发现汇总
 								**总计**: {len(self._all_findings)} 个漏洞
 								### 严重程度分布
 								- Critical: {severity_counts['critical']}
 								- High: {severity_counts['high']}
 								- Medium: {severity_counts['medium']}
 								- Low: {severity_counts['low']}
 								### 漏洞类型分布
 								"""
 								        for vtype, count in type_counts.items():
 								            summary += f"- {vtype}: {count}\n"
 								        summary += "\n### 详细列表\n"
 								        for i, f in enumerate(self._all_findings):
-												feat(agent): enhance streaming with in-memory event manager and fallback polling

- Implement dual-mode streaming: prioritize in-memory EventManager for running tasks with thinking_token support
- Add fallback to database polling for completed tasks without thinking_token replay capability
- Introduce SSE event formatter utility for consistent event serialization across streaming modes
- Add 10ms micro-delay for thinking_token events to ensure proper TCP packet separation and frontend incremental rendering
- Refactor stream_agent_with_thinking endpoint to support both runtime and historical event streaming
- Update event filtering logic to handle both in-memory and database event sources
- Improve logging with debug markers for thinking_token tracking and stream mode selection
- Optimize polling intervals: 0.3s for running tasks, 2.0s for completed tasks
- Reduce idle timeout from 10 minutes to 1 minute for completed task streams
- Update frontend useAgentStream hook to handle unified event format from dual-mode streaming
- Enhance AgentAudit UI to properly display streamed events from both sources

											
										
										
											2025-12-12 10:39:32 +08:00
+								            if isinstance(f, dict):
 								                summary += f"{i+1}. [{f.get('severity')}] {f.get('title')} ({f.get('file_path')})\n"
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
 								        return summary
 								    def _generate_default_summary(self) -> Dict[str, Any]:
 								        """Build the fallback summary used when no LLM conclusion is available.

 								        Severities are normalized with ``str(...).strip().lower()`` before
 								        counting, and a missing or empty severity is counted as ``low``.
 								        Non-dict entries of ``self._all_findings`` are not counted in the
 								        distribution but still contribute to ``total_findings``.

 								        Returns:
 								            A dict with ``total_findings`` (length of ``self._all_findings``),
 								            ``severity_distribution`` (count per severity; the four standard
 								            levels are always present) and a fixed ``conclusion`` string.
 								        """
 								        all_findings = self._all_findings or []
 								        severity_counts: Dict[str, int] = {"critical": 0, "high": 0, "medium": 0, "low": 0}
 								        for finding in all_findings:
 								            if not isinstance(finding, dict):
 								                continue
 								            # Coerce to str so None, mixed-case or unhashable values can
 								            # neither raise nor create stray keys such as "High" or None.
 								            sev = str(finding.get("severity") or "").strip().lower() or "low"
 								            severity_counts[sev] = severity_counts.get(sev, 0) + 1

 								        return {
 								            "total_findings": len(all_findings),
 								            "severity_distribution": severity_counts,
 								            "conclusion": "审计完成（未通过 LLM 生成结论）",
 								        }
-												feat(agent): enhance agent functionality with LLM-driven decision-making and event handling

- Introduce LLM-driven decision-making across various agents, allowing for dynamic adjustments based on real-time analysis.
- Implement new event types for LLM thinking, decisions, actions, and observations to enrich the event streaming experience.
- Update agent task responses to include additional metrics for better tracking of task progress and outcomes.
- Refactor UI components to highlight LLM-related events and improve user interaction during audits.
- Enhance API endpoints to support new event structures and improve overall error handling.

											
										
										
											2025-12-11 21:14:32 +08:00
 								    def get_conversation_history(self) -> List[Dict[str, str]]:
 								        """Return the conversation history stored on this agent.

 								        The list held in ``self._conversation_history`` is returned as-is;
 								        no copy is made.
 								        """
 								        history = self._conversation_history
 								        return history
 								    def get_steps(self) -> List[AgentStep]:
 								        """Return the execution steps stored on this agent.

 								        The list held in ``self._steps`` is returned as-is; no copy is made.
 								        """
 								        steps = self._steps
 								        return steps