# 29.5 调试与优化模块

## 29.5.1 调试模块概述

调试模块是编程 Agent 的重要能力，它能够自动识别、定位和修复代码中的错误。调试涉及错误检测、根因分析、修复建议等多个环节。

### 调试流程

错误报告 → 错误检测 → 错误定位 → 根因分析 → 修复建议 → 修复验证 → 问题解决

## 29.5.2 错误检测

### 错误检测器

    class ErrorDetector:
        """Aggregate the findings of several specialised error detectors.

        Every registered detector is awaited in turn. A detector that raises is
        logged and skipped so the remaining detectors still run. The merged
        findings are de-duplicated and returned most-severe first.
        """

        # Severity labels are strings, so they need an explicit rank: comparing
        # the raw labels would sort 'medium' ahead of 'high'.
        _SEVERITY_RANK = {
            'critical': 4,
            'high': 3,
            'medium': 2,
            'low': 1,
            'info': 0,
        }

        def __init__(self, llm_client: LLMClient = None):
            """Register the detectors.

            Args:
                llm_client: Client handed to ``LogicErrorDetector``, whose
                    constructor requires one. When omitted, the logic detector
                    is not registered (constructing it without a client would
                    raise ``TypeError``).
            """
            self.detectors = {
                'syntax': SyntaxErrorDetector(),
                'runtime': RuntimeErrorDetector(),
            }
            if llm_client is not None:
                self.detectors['logic'] = LogicErrorDetector(llm_client)
            # NOTE(review): these two detectors are not defined in this section;
            # presumably they take no constructor arguments - confirm.
            self.detectors['performance'] = PerformanceErrorDetector()
            self.detectors['security'] = SecurityErrorDetector()

        async def detect(self, code: str,
                         execution_result: ExecutionResult = None) -> List[DetectedError]:
            """Run all detectors and return the unique findings, most severe first.

            Args:
                code: Source code to inspect.
                execution_result: Optional result of running the code; passed
                    through unchanged to every detector.

            Returns:
                De-duplicated list of detected errors ordered by severity.
            """
            errors = []

            for detector_name, detector in self.detectors.items():
                try:
                    detected = await detector.detect(code, execution_result)
                    errors.extend(detected)
                except Exception as e:
                    # Best effort: one failing detector must not hide the
                    # findings of the others.
                    logger.error(f"Error in {detector_name} detector: {e}")

            errors = self._deduplicate_errors(errors)

            # list.sort is stable, so findings of equal severity keep the
            # order in which the detectors produced them.
            errors.sort(key=self._severity_rank, reverse=True)

            return errors

        @classmethod
        def _severity_rank(cls, error) -> float:
            """Map an error's severity to a sortable number (unknown labels rank last)."""
            severity = getattr(error, 'severity', None)
            if isinstance(severity, (int, float)):
                # Numeric severities are already comparable; keep them as-is.
                return severity
            return cls._SEVERITY_RANK.get(str(severity).lower(), -1)

        def _deduplicate_errors(self,
                                errors: List[DetectedError]) -> List[DetectedError]:
            """Drop repeated findings, keeping the first of each (type, location, message)."""
            seen = set()
            unique_errors = []

            for error in errors:
                key = (error.type, error.location, error.message)
                if key not in seen:
                    seen.add(key)
                    unique_errors.append(error)

            return unique_errors

    class SyntaxErrorDetector:
        """Detect syntax errors by compiling the code without executing it."""

        # (message fragment, suggestion) pairs. Matching is by substring because
        # interpreter messages usually carry extra detail, e.g.
        # "unterminated string literal (detected at line 3)".
        _SUGGESTIONS = (
            ('invalid syntax', "检查语法是否正确，确保括号、引号等匹配"),
            ('unexpected EOF', "检查代码是否完整，确保所有括号都已闭合"),
            ('unterminated string literal', "检查字符串是否正确闭合"),
            ('expected an indented block', "检查缩进是否正确"),
            ('unindent does not match any outer indentation level', "检查缩进层级是否一致"),
        )

        async def detect(self, code: str,
                         execution_result: ExecutionResult = None) -> List[DetectedError]:
            """Compile ``code`` and report the syntax error raised, if any.

            Args:
                code: Source code to check.
                execution_result: Unused; accepted so all detectors share one
                    call signature.

            Returns:
                A list holding one ``DetectedError`` when compilation fails
                with ``SyntaxError``, otherwise an empty list.
            """
            errors = []

            try:
                # compile() only parses; the code is never run here.
                compile(code, '<string>', 'exec')
            except SyntaxError as e:
                error = DetectedError(
                    type='syntax',
                    severity='high',
                    location=f"Line {e.lineno}, Column {e.offset}",
                    message=e.msg,
                    code_snippet=self._get_code_snippet(code, e.lineno),
                    suggestion=self._get_syntax_suggestion(e)
                )
                errors.append(error)

            return errors

        def _get_code_snippet(self, code: str, line_no: int) -> str:
            """Return the 1-based line ``line_no`` of ``code``, or "" if unavailable."""
            # SyntaxError.lineno may be None; comparing None with an int raises.
            if line_no is None:
                return ""
            lines = code.split('\n')
            if 1 <= line_no <= len(lines):
                return lines[line_no - 1]
            return ""

        def _get_syntax_suggestion(self, error: SyntaxError) -> str:
            """Return the hint for the first known fragment found in the error message."""
            message = error.msg or ''
            for fragment, suggestion in self._SUGGESTIONS:
                if fragment in message:
                    return suggestion
            return "请检查语法错误"

    class RuntimeErrorDetector:
        """Turn the error text of a failed execution into a ``DetectedError``."""

        async def detect(self, code: str,
                         execution_result: ExecutionResult = None) -> List[DetectedError]:
            """Report the runtime error carried by ``execution_result``.

            Args:
                code: Source code that was executed (not inspected here).
                execution_result: Result object whose ``error`` attribute holds
                    the error text.

            Returns:
                A single-element list when an error is present, else an empty list.
            """
            errors = []

            if not execution_result or not execution_result.error:
                return errors

            error_info = self._parse_error(execution_result.error)

            error = DetectedError(
                type='runtime',
                severity='high',
                location=error_info.get('location', 'Unknown'),
                message=error_info.get('message', 'Unknown error'),
                code_snippet=error_info.get('code_snippet', ''),
                traceback=error_info.get('traceback', ''),
                suggestion=self._get_runtime_suggestion(error_info)
            )
            errors.append(error)

            return errors

        def _parse_error(self, error: str) -> Dict[str, str]:
            """Extract message, location, traceback and source line from error text.

            Text without a "Traceback" marker is returned as the message with
            the other fields at their defaults. For traceback text, the last
            frame wins for ``location`` ("line N") and ``code_snippet``, and the
            last exception line wins for ``message``.
            """
            error_info = {
                'message': error,
                'location': 'Unknown',
                'traceback': '',
                'code_snippet': ''
            }

            if 'Traceback' not in error:
                return error_info

            # Keep the traceback text itself, dropping any output before it.
            error_info['traceback'] = error[error.index('Traceback'):].strip()

            lines = error.split('\n')
            for index, line in enumerate(lines):
                stripped = line.strip()
                frame_line_no = self._frame_line_number(stripped)
                if frame_line_no is not None:
                    error_info['location'] = f"line {frame_line_no}"
                    # Reset with every frame so snippet and location always
                    # describe the same frame.
                    error_info['code_snippet'] = self._source_line_after(lines, index)
                elif self._is_exception_line(line):
                    error_info['message'] = stripped

            return error_info

        @staticmethod
        def _frame_line_number(stripped_line: str):
            """Return the line number of a ``File "...", line N`` frame header, else None."""
            marker = '", line '
            if not stripped_line.startswith('File "') or marker not in stripped_line:
                return None
            # Search from the right so commas or quotes in the file name
            # cannot shift the result.
            tail = stripped_line[stripped_line.rfind(marker) + len(marker):]
            number = tail.split(',')[0].strip()
            return number if number.isdigit() else None

        @staticmethod
        def _source_line_after(lines: List[str], index: int) -> str:
            """Return the indented source line printed under a frame header, or ""."""
            if index + 1 >= len(lines):
                return ''
            candidate = lines[index + 1]
            text = candidate.strip()
            if candidate[:1].isspace() and text and not text.startswith('File "'):
                return text
            return ''

        @staticmethod
        def _is_exception_line(line: str) -> bool:
            """Tell whether ``line`` looks like ``ExcName`` or ``pkg.ExcName: detail``."""
            if not line or line[0].isspace():
                return False
            head = line.split(':', 1)[0].strip()
            # Headers such as "Traceback (most recent call last)" contain spaces
            # and therefore are not dotted identifiers.
            return bool(head) and all(part.isidentifier() for part in head.split('.'))

        def _get_runtime_suggestion(self, error_info: Dict) -> str:
            """Return a hint for the first known exception name found in the message."""
            message = error_info.get('message', '').lower()

            suggestions = {
                'nameerror': "检查变量名是否正确，确保在使用前已定义",
                'typeerror': "检查数据类型是否匹配，确保操作适用于该类型",
                'valueerror': "检查值是否在有效范围内",
                'indexerror': "检查索引是否在有效范围内",
                'keyerror': "检查字典键是否存在",
                'attributeerror': "检查对象是否具有该属性或方法",
                'zerodivisionerror': "检查除数是否为零"
            }

            for error_type, suggestion in suggestions.items():
                if error_type in message:
                    return suggestion

            return "请检查错误信息和代码逻辑"

    class LogicErrorDetector:
        """Ask an LLM to point out potential logic errors in a piece of code."""

        def __init__(self, llm_client: LLMClient):
            """Store the client whose ``complete(prompt)`` coroutine is awaited."""
            self.llm_client = llm_client

        async def detect(self, code: str,
                         execution_result: ExecutionResult = None) -> List[DetectedError]:
            """Query the LLM and convert its JSON answer into ``DetectedError`` objects.

            Args:
                code: Source code to analyse; embedded verbatim in the prompt.
                execution_result: Unused; accepted so all detectors share one
                    call signature.

            Returns:
                One medium-severity ``DetectedError`` per entry reported by the
                LLM; empty when the answer cannot be parsed.
            """
            errors = []

            prompt = f"""
            分析以下代码中的潜在逻辑错误：

            {code}

            请识别：
            1. 无限循环
            2. 空指针引用
            3. 边界条件错误
            4. 逻辑矛盾
            5. 死代码

            以 JSON 格式返回检测到的错误列表。
            """

            response = await self.llm_client.complete(prompt)
            detected_errors = self._parse_logic_errors(response)

            for error in detected_errors:
                detected_error = DetectedError(
                    type='logic',
                    severity='medium',
                    location=error.get('location', 'Unknown'),
                    message=error.get('message', 'Logic error'),
                    code_snippet=error.get('code_snippet', ''),
                    suggestion=error.get('suggestion', 'Review the logic')
                )
                errors.append(detected_error)

            return errors

        def _parse_logic_errors(self, response: str) -> List[Dict]:
            """Parse the LLM answer into a list of dicts; return [] for anything else.

            A surrounding Markdown code fence is tolerated. Answers that are not
            a JSON array, and array items that are not objects, are discarded
            because the caller reads every entry with ``.get``.
            """
            if not isinstance(response, str):
                return []

            text = response.strip()
            if text.startswith('```'):
                # Drop the opening fence line (it may carry a language tag)
                # and the closing fence.
                text = text.split('\n', 1)[1] if '\n' in text else ''
                text = text.rstrip()
                if text.endswith('```'):
                    text = text[:-3]

            try:
                parsed = json.loads(text)
            except json.JSONDecodeError:
                return []

            if not isinstance(parsed, list):
                return []
            return [item for item in parsed if isinstance(item, dict)]

## 29.5.3 根因分析

### 根因分析器

    class RootCauseAnalyzer:
        """LLM-backed analysis of why a detected error happened.

        For one error it gathers the code around the failing line, then asks
        the LLM for the root cause, the impact and the estimated fix difficulty.
        """

        # Number of lines kept on each side of the failing line.
        _CONTEXT_RADIUS = 5

        def __init__(self, llm_client: LLMClient):
            """Store the client whose ``complete(prompt)`` coroutine is awaited."""
            self.llm_client = llm_client

        async def analyze(self, error: DetectedError,
                          code: str,
                          context: Dict = None) -> RootCauseAnalysis:
            """Build a ``RootCauseAnalysis`` for ``error``.

            Args:
                error: The detected error to explain.
                code: Full source code the error was found in.
                context: Optional extra information; interpolated verbatim into
                    the root-cause prompt.

            Returns:
                The analysis with ``root_cause``, ``impact`` and ``difficulty`` set.
            """
            analysis = RootCauseAnalysis(error=error)

            relevant_code = self._collect_relevant_code(error, code)

            analysis.root_cause = await self._identify_root_cause(
                error,
                relevant_code,
                context
            )

            analysis.impact = await self._analyze_impact(
                error,
                relevant_code
            )

            # Difficulty is estimated last because its prompt needs the root cause.
            analysis.difficulty = await self._estimate_difficulty(
                error,
                analysis.root_cause
            )

            return analysis

        def _collect_relevant_code(self, error: DetectedError,
                                   code: str) -> str:
            """Return the lines surrounding the error location, or all of ``code``.

            The line number is the last token before the first comma of
            ``error.location`` (e.g. "Line 12, Column 3" or "line 12"). When it
            cannot be parsed or lies outside the code, the whole code is returned.
            """
            lines = code.split('\n')

            if error.location:
                try:
                    line_no = int(error.location.split(',')[0].split()[-1])
                except (ValueError, IndexError):
                    return code

                if 1 <= line_no <= len(lines):
                    # line_no is 1-based; the window is symmetric around it.
                    start = max(0, line_no - 1 - self._CONTEXT_RADIUS)
                    end = min(len(lines), line_no + self._CONTEXT_RADIUS)
                    return '\n'.join(lines[start:end])

            return code

        async def _identify_root_cause(self, error: DetectedError,
                                       relevant_code: str,
                                       context: Dict) -> str:
            """Ask the LLM for the root cause and return its raw answer."""
            prompt = f"""
            分析错误的根本原因：
            错误类型：{error.type}
            错误信息：{error.message}
            错误位置：{error.location}
            相关代码：
            {relevant_code}
            上下文：{context}
            请分析并说明：
            1. 错误的根本原因
            2. 为什么会发生这个错误
            3. 代码中的具体问题
            """
            return await self.llm_client.complete(prompt)

        async def _analyze_impact(self, error: DetectedError,
                                  relevant_code: str) -> ImpactAnalysis:
            """Ask the LLM how far the error reaches and parse the answer."""
            prompt = f"""
            分析错误的影响范围：
            错误：{error.message}
            相关代码：
            {relevant_code}
            请分析：
            1. 错误影响哪些功能
            2. 影响的严重程度
            3. 是否会影响其他代码
            4. 是否会影响数据完整性
            """
            response = await self.llm_client.complete(prompt)
            # NOTE(review): _parse_impact is not defined in this section;
            # presumably it is provided elsewhere - confirm.
            return self._parse_impact(response)

        async def _estimate_difficulty(self, error: DetectedError,
                                       root_cause: str) -> str:
            """Ask the LLM to rate the fix difficulty and return its raw answer."""
            prompt = f"""
            估计修复错误的难度：
            错误：{error.message}
            根本原因：{root_cause}
            请评估修复难度（简单/中等/困难）并说明理由。
            """
            return await self.llm_client.complete(prompt)

## 29.5.4 修复建议

### 修复建议生成器

    class FixSuggestionGenerator:
        """Ask an LLM for alternative fixes to an analysed error."""

        # Confidence assumed when the LLM gives none or an unusable one.
        _DEFAULT_CONFIDENCE = 0.5

        def __init__(self, llm_client: LLMClient):
            """Store the client whose ``complete(prompt)`` coroutine is awaited."""
            self.llm_client = llm_client

        async def generate_suggestions(self,
                                       analysis: RootCauseAnalysis,
                                       code: str) -> List[FixSuggestion]:
            """Return the LLM's fix proposals, most confident first.

            Args:
                analysis: Root-cause analysis; its ``error.message`` and
                    ``root_cause`` are embedded in the prompt.
                code: Original source code, embedded verbatim in the prompt.

            Returns:
                ``FixSuggestion`` objects sorted by descending confidence.
            """
            suggestions = []

            prompt = f"""
            为以下错误生成修复建议：

            错误：{analysis.error.message}
            根本原因：{analysis.root_cause}
            原始代码：
            {code}

            请生成 2-3 个不同的修复方案，每个方案包括：
            1. 修复方法
            2. 修改后的代码
            3. 优缺点分析
            4. 适用场景

            以 JSON 格式返回修复方案列表。
            """

            response = await self.llm_client.complete(prompt)
            # NOTE(review): _parse_fix_suggestions is not defined in this
            # section; presumably it returns a list of dicts - confirm.
            fix_suggestions = self._parse_fix_suggestions(response)

            for suggestion in fix_suggestions or []:
                if not isinstance(suggestion, dict):
                    # Entries are read with .get below; skip anything else.
                    continue
                fix_suggestion = FixSuggestion(
                    method=suggestion.get('method', ''),
                    fixed_code=suggestion.get('fixed_code', ''),
                    advantages=suggestion.get('advantages', []),
                    disadvantages=suggestion.get('disadvantages', []),
                    applicable_scenarios=suggestion.get('applicable_scenarios', ''),
                    confidence=self._coerce_confidence(
                        suggestion.get('confidence', self._DEFAULT_CONFIDENCE)
                    )
                )
                suggestions.append(fix_suggestion)

            suggestions.sort(key=lambda s: s.confidence, reverse=True)

            return suggestions

        @staticmethod
        def _coerce_confidence(value) -> float:
            """Convert an LLM-supplied confidence to float, defaulting to 0.5.

            The value comes from free-form JSON and may be a string or null;
            mixing such values with numbers would make the sort raise TypeError.
            """
            try:
                number = float(value)
            except (TypeError, ValueError):
                return FixSuggestionGenerator._DEFAULT_CONFIDENCE
            if number != number:
                # NaN compares false with everything and would scramble the sort.
                return FixSuggestionGenerator._DEFAULT_CONFIDENCE
            return number

## 29.5.5 性能优化

### 性能分析器

    class PerformanceAnalyzer:
        """LLM-backed review of a code fragment's performance characteristics."""

        def __init__(self, llm_client: LLMClient):
            """Store the client whose ``complete(prompt)`` coroutine is awaited."""
            self.llm_client = llm_client

        async def analyze(self, code: str,
                          execution_result: ExecutionResult = None) -> PerformanceAnalysis:
            """Produce a ``PerformanceAnalysis`` for ``code``.

            Args:
                code: Source code to analyse.
                execution_result: Accepted but not used by this method.

            Returns:
                The analysis with time/space complexity, bottlenecks and
                optimisation suggestions filled in.
            """
            analysis = PerformanceAnalysis()

            analysis.time_complexity = await self._analyze_time_complexity(code)

            analysis.space_complexity = await self._analyze_space_complexity(code)

            analysis.bottlenecks = await self._identify_bottlenecks(code)

            # Runs last: suggestions are generated per bottleneck found above.
            analysis.optimization_suggestions = await self._generate_optimization_suggestions(
                code,
                analysis
            )

            return analysis

        async def _analyze_time_complexity(self, code: str) -> str:
            """Ask the LLM for the time complexity and return its raw answer."""
            prompt = f"""
            分析以下代码的时间复杂度：
            {code}
            请分析并说明：
            1. 整体时间复杂度
            2. 关键部分的复杂度
            3. 影响复杂度的主要因素
            """
            return await self.llm_client.complete(prompt)

        async def _analyze_space_complexity(self, code: str) -> str:
            """Ask the LLM for the space complexity and return its raw answer."""
            prompt = f"""
            分析以下代码的空间复杂度：
            {code}
            请分析并说明：
            1. 整体空间复杂度
            2. 内存使用情况
            3. 可能的内存泄漏
            """
            return await self.llm_client.complete(prompt)

        async def _identify_bottlenecks(self, code: str) -> List[PerformanceBottleneck]:
            """Ask the LLM for bottlenecks and parse its answer."""
            prompt = f"""
            识别以下代码中的性能瓶颈：
            {code}
            请识别：
            1. 循环嵌套
            2. 重复计算
            3. 不必要的内存分配
            4. 低效的数据结构使用
            5. I/O 操作
            以 JSON 格式返回瓶颈列表。
            """
            response = await self.llm_client.complete(prompt)
            # NOTE(review): _parse_bottlenecks is not defined in this section;
            # presumably it is provided elsewhere - confirm.
            return self._parse_bottlenecks(response)

        async def _generate_optimization_suggestions(self,
                                                     code: str,
                                                     analysis: PerformanceAnalysis) -> List[OptimizationSuggestion]:
            """Request one optimisation suggestion per bottleneck in ``analysis``.

            ``code`` is accepted but not included in the prompt; only the
            bottleneck's type, location and description are sent.
            """
            suggestions = []

            for bottleneck in analysis.bottlenecks:
                prompt = f"""
                为以下性能瓶颈生成优化建议：
                瓶颈类型：{bottleneck.type}
                瓶颈位置：{bottleneck.location}
                瓶颈描述：{bottleneck.description}
                请生成具体的优化建议，包括：
                1. 优化方法
                2. 优化后的代码
                3. 预期性能提升
                """
                response = await self.llm_client.complete(prompt)

                # NOTE(review): the _extract_* helpers are not defined in this
                # section; presumably they are provided elsewhere - confirm.
                suggestion = OptimizationSuggestion(
                    bottleneck_type=bottleneck.type,
                    method=self._extract_method(response),
                    optimized_code=self._extract_code(response),
                    expected_improvement=self._extract_improvement(response)
                )
                suggestions.append(suggestion)

            return suggestions

### 代码优化器

    class CodeOptimizer:
        """Rewrite code by letting an LLM apply optimisation suggestions one by one."""

        def __init__(self, llm_client: LLMClient):
            """Keep the client whose ``complete(prompt)`` coroutine does the rewriting."""
            self.llm_client = llm_client

        async def optimize(self, code: str,
                          suggestions: List[OptimizationSuggestion]) -> OptimizedCode:
            """Apply every suggestion in order and bundle the outcome.

            Each suggestion is applied to the output of the previous one, so
            the order of ``suggestions`` matters.

            Args:
                code: Source code to optimise.
                suggestions: Optimisation suggestions to apply sequentially.

            Returns:
                ``OptimizedCode`` holding the original code, the final code and
                the suggestions that were applied.
            """
            current = code
            for item in suggestions:
                current = await self._apply_optimization(current, item)

            outcome = OptimizedCode(
                original_code=code,
                optimized_code=current,
                applied_suggestions=suggestions
            )
            return outcome

        async def _apply_optimization(self, code: str,
                                     suggestion: OptimizationSuggestion) -> str:
            """Ask the LLM to apply one suggestion and return its raw answer."""
            prompt = f"""
            应用以下优化到代码：

            原始代码：
            {code}

            优化方法：{suggestion.method}
            优化后的代码示例：
            {suggestion.optimized_code}

            请返回应用优化后的完整代码。
            """

            rewritten = await self.llm_client.complete(prompt)
            return rewritten

## 29.5.6 调试工作流

### 调试工作流管理器

    class DebuggingWorkflow:
        """Orchestrate detection, root-cause analysis, fix generation and validation."""

        def __init__(self, llm_client: LLMClient,
                     tool_manager: ToolManager):
            """Wire up the workflow components.

            Args:
                llm_client: Client shared by all LLM-backed components.
                tool_manager: Stored on the instance; not used by the methods
                    of this class.
            """
            self.llm_client = llm_client
            self.tool_manager = tool_manager

            self.error_detector = ErrorDetector()
            self.root_cause_analyzer = RootCauseAnalyzer(llm_client)
            self.fix_suggestion_generator = FixSuggestionGenerator(llm_client)
            self.performance_analyzer = PerformanceAnalyzer(llm_client)
            self.code_optimizer = CodeOptimizer(llm_client)

        async def debug(self, code: str,
                        execution_result: ExecutionResult = None) -> DebuggingResult:
            """Run the full debugging workflow over ``code``.

            Args:
                code: Source code to debug.
                execution_result: Optional result of running the code; passed
                    to the error detector.

            Returns:
                A ``DebuggingResult`` with status "no_errors" when nothing was
                detected, otherwise "completed" with analyses, fix suggestions
                and performance findings. Performance analysis is skipped in
                the "no_errors" case because of the early return.
            """
            result = DebuggingResult(original_code=code)

            # 1. Detect errors.
            result.errors = await self.error_detector.detect(code, execution_result)
            if not result.errors:
                result.status = "no_errors"
                return result

            # 2. Analyse every error and collect fix proposals for it.
            for error in result.errors:
                analysis = await self.root_cause_analyzer.analyze(error, code)
                result.root_cause_analyses.append(analysis)

                suggestions = await self.fix_suggestion_generator.generate_suggestions(
                    analysis,
                    code
                )
                result.fix_suggestions.extend(suggestions)

            # 3. Performance analysis.
            result.performance_analysis = await self.performance_analyzer.analyze(code)

            # 4. Surface the optimisation suggestions on the result itself.
            if result.performance_analysis.optimization_suggestions:
                result.optimization_suggestions = result.performance_analysis.optimization_suggestions

            result.status = "completed"
            return result

        async def apply_fix(self, code: str,
                            suggestion: FixSuggestion) -> FixedCode:
            """Wrap the suggested code in a ``FixedCode`` and attach its validation result."""
            fixed_code = FixedCode(
                original_code=code,
                fixed_code=suggestion.fixed_code,
                applied_suggestion=suggestion
            )

            validation_result = await self._validate_fix(fixed_code)
            fixed_code.validation_result = validation_result

            return fixed_code

        async def _validate_fix(self, fixed_code: FixedCode) -> ValidationResult:
            """Check that the fixed code compiles and, if so, that it runs cleanly."""
            try:
                compile(fixed_code.fixed_code, '<string>', 'exec')
            except SyntaxError as exc:
                # Code that does not compile cannot pass; do not execute it.
                return ValidationResult(
                    syntax_valid=False,
                    tests_passed=False,
                    test_output=str(exc)
                )

            test_result = await self._run_tests(fixed_code.fixed_code)

            return ValidationResult(
                syntax_valid=True,
                tests_passed=test_result.passed,
                test_output=test_result.output
            )

        async def _run_tests(self, code: str) -> TestResult:
            """Execute ``code`` and report whether it raised.

            Simplified stand-in for a real test run: success only means the
            code ran to completion without raising ``Exception``.
            """
            # SECURITY: exec() runs generated code with the full privileges of
            # this process and blocks the event loop while it runs. It should
            # be replaced by a sandboxed runner before handling untrusted code.
            # A fresh namespace keeps the executed code away from this
            # method's local variables.
            namespace = {'__name__': '__fix_validation__'}
            try:
                exec(code, namespace)
                return TestResult(passed=True, output="Execution successful")
            except Exception as e:
                return TestResult(passed=False, output=str(e))

29.5 调试与优化模块 ​

29.5.1 调试模块概述 ​

调试流程 ​

29.5 调试与优化模块

29.5.1 调试模块概述

调试流程