尝试使用五阶段debug流程

Kiran · Kiran · commit d268c476ed4d · 2025-11-23T11:53:17.000+08:00
diff --git a/apps/codexgraph_agent/pages/components/page.py b/apps/codexgraph_agent/pages/components/page.py
@@ -21,7 +21,7 @@ def get_llm_config(llm_name):
 
         llm_config = {
             'model': 'deepseek-coder',
-            'api_base': 'https://api.deepseek.com',
+            'api_base': 'https://jeniya.cn/v1',
             'model_server': 'openai'
         }
 
diff --git a/apps/codexgraph_agent/setting.json b/apps/codexgraph_agent/setting.json
@@ -1,7 +1,7 @@
 {
     "setting": {
         "prompt_path": "apps/codexgraph_agent/prompt",
-        "repo_path": "C:\\Users\\LENOVO\\Desktop\\testcode\\tinyhttpd-master",
+        "repo_path": "C:\\Users\\34862\\Desktop\\test\\lrzip",
         "llm_model_name": "deepseek-coder",
         "llm_temperature": 1.0,
         "max_iterations": 5,
@@ -10,19 +10,21 @@
             "code_comment",
             "code_debug",
             "code_generate",
-            "code_unittest"
+            "code_unittest",
+            "111",
+            "test"
         ],
-        "project_id": "code_chat",
+        "project_id": "test",
         "env_path_dict": {
-            "env_path": "F:\\python\\Anaconda\\envs\\mybuild\\python.exe",
-            "working_directory": "C:\\Users\\LENOVO\\Desktop\\CodeXGraph\\ms-agent\\modelscope_agent\\environment\\graph_database\\indexer"
+            "env_path": "D:\\Anaconda\\envs\\mybuild\\python.exe",
+            "working_directory": "D:\\GitHub\\CodeXGraph\\ms-agent\\modelscope_agent\\environment\\graph_database\\indexer"
         },
         "neo4j": {
             "url": "bolt://localhost:7687",
             "user": "neo4j",
-            "password": "GuoGuo0532",
+            "password": "neo4j1231",
             "database_name": "neo4j"
         },
-        "language": "Python"
+        "language": "C"
     }
 }
diff --git a/modelscope_agent/agents/codexgraph_agent/task/code_debugger.py b/modelscope_agent/agents/codexgraph_agent/task/code_debugger.py
diff --git a/modelscope_agent/environment/graph_database/indexer/method_description_generator.py b/modelscope_agent/environment/graph_database/indexer/method_description_generator.py
@@ -60,7 +60,7 @@ def _get_default_config(self) -> Dict[str, Any]:
                         return {
                             'model_name': setting_data.get('llm_model_name', 'deepseek-coder'),
                             'api_key': os.getenv('OPENAI_API_KEY', 'sk-aabc879cff054d9fac7025eb491ef163'),
-                            'base_url': os.getenv('OPENAI_BASE_URL', 'https://api.deepseek.com'),
+                            'base_url': os.getenv('OPENAI_BASE_URL', 'https://jeniya.cn/v1'),
                             'max_tokens': 200,
                             'temperature': setting_data.get('llm_temperature', 0.3)
                         }
@@ -71,7 +71,7 @@ def _get_default_config(self) -> Dict[str, Any]:
         return {
             'model_name': 'deepseek-coder',  # 默认使用deepseek-coder
             'api_key': os.getenv('OPENAI_API_KEY', 'sk-aabc879cff054d9fac7025eb491ef163'),
-            'base_url': os.getenv('OPENAI_BASE_URL', 'https://api.deepseek.com'),
+            'base_url': os.getenv('OPENAI_BASE_URL', 'https://jeniya.cn/v1'),
             'max_tokens': 200,
             'temperature': 0.3
         }
@@ -154,11 +154,17 @@ def _build_prompt(self, method_code: str, method_name: str,
     
     def _call_llm(self, prompt: str) -> str:
         """调用大模型API"""
+        # 检查是否有有效的API key
+        api_key = self.llm_config.get('api_key', '').strip()
+        if not api_key or api_key == 'sk-aabc879cff054d9fac7025eb491ef163':
+            print(f"警告: 未配置有效的API Key，自动使用模拟描述生成")
+            return self._generate_mock_description(prompt)
+        
         try:
             print(f"尝试调用LLM API...")
             print(f"模型: {self.llm_config['model_name']}")
             print(f"API Base: {self.llm_config['base_url']}")
-            print(f"API Key: {self.llm_config['api_key'][:10]}..." if self.llm_config['api_key'] else "无API Key")
+            print(f"API Key: {api_key[:10]}...")
             
             # 使用统一的LLM调用方式，兼容不同的API
             from modelscope_agent.llm import get_chat_model
@@ -167,7 +173,7 @@ def _call_llm(self, prompt: str) -> str:
             llm_config = {
                 'model': self.llm_config['model_name'],
                 'api_base': self.llm_config['base_url'],
-                'api_key': self.llm_config['api_key'],
+                'api_key': api_key,
                 'model_server': 'openai'
             }
             
@@ -177,7 +183,7 @@ def _call_llm(self, prompt: str) -> str:
             llm = get_chat_model(
                 model=self.llm_config['model_name'],
                 model_server='openai',
-                api_key=self.llm_config['api_key'],
+                api_key=api_key,
                 api_base=self.llm_config['base_url']
             )
             print(f"LLM实例创建成功: {type(llm)}")
@@ -201,11 +207,18 @@ def _call_llm(self, prompt: str) -> str:
             print(f"警告: 未安装相关库，使用模拟描述: {e}")
             return self._generate_mock_description(prompt)
         except Exception as e:
-            print(f"调用大模型API失败: {e}")
-            import traceback
-            traceback.print_exc()
-            # 返回包含错误信息的描述
-            return f"LLM调用失败: {str(e)}"
+            error_str = str(e)
+            # 检查是否是认证错误
+            if 'Authentication' in error_str or '401' in error_str or 'Unauthorized' in error_str:
+                print(f"警告: API认证失败，自动降级到模拟描述生成。错误: {error_str}")
+                return self._generate_mock_description(prompt)
+            else:
+                print(f"调用大模型API失败: {e}")
+                import traceback
+                traceback.print_exc()
+                # 对于其他错误，也使用模拟描述而不是返回错误信息
+                print(f"自动使用模拟描述作为备选方案")
+                return self._generate_mock_description(prompt)
     
     def _generate_mock_description(self, prompt: str) -> str:
         """生成模拟描述（用于测试）"""
diff --git a/modelscope_agent/llm/openai.py b/modelscope_agent/llm/openai.py
@@ -44,7 +44,7 @@ def __init__(
             )
         else:
             default_api_base = os.getenv('OPENAI_API_BASE',
-                                         'https://api.openai.com/v1')
+                                         'https://jeniya.cn/v1')
             api_base = kwargs.get('api_base', default_api_base).strip()
             api_key = kwargs.get('api_key',
                                  os.getenv('OPENAI_API_KEY',
diff --git a/replace/ast_visitor_client.py b/replace/ast_visitor_client.py
@@ -315,6 +315,11 @@ def get_kind_priority(kind_str):
                 node_parms['signature'] = self.symbol_data[full_name]['signature']
             if 'code' in self.symbol_data[full_name]:
                 node_parms['code'] = self.symbol_data[full_name]['code']
+            # Include return_type and parameters if they exist in data
+            if 'return_type' in data:
+                node_parms['return_type'] = data['return_type']
+            if 'parameters' in data:
+                node_parms['parameters'] = data['parameters']
 
             self.graphDB.add_node(label=kind, full_name=full_name, parms=node_parms)
 
diff --git a/replace/c_ast_traverser.py b/replace/c_ast_traverser.py
@@ -170,6 +170,109 @@ def extract_function_name_from_call(function_node: Node):
     return None
 
 
+def extract_function_return_type(function_node: Node):
+    """
+    Return the text of the 'type' field of a function_definition or declaration node.
+    Yields None when the node is missing or has any other node type, and falls back
+    to 'void' when the 'type' field is absent or its text is empty after stripping.
+    """
+    if not function_node:
+        return None
+    
+    # Only function_definition and declaration nodes are supported
+    if function_node.type not in ['function_definition', 'declaration']:
+        return None
+    
+    type_node = function_node.child_by_field_name('type')
+    if not type_node:
+        return 'void'  # default return type
+    
+    # Decode the type node's text, ignoring undecodable bytes, and trim whitespace
+    return_type_text = type_node.text.decode('utf8', errors='ignore').strip()
+    return return_type_text if return_type_text else 'void'
+
+
+def extract_function_parameters(function_node: Node):
+    """
+    Collect the parameters of a function_definition or declaration node as a list of strings.
+    Each entry is "<type> <name>", only the type (or 'void') when unnamed, or '...' if variadic; [] if none are found.
+    """
+    if not function_node:
+        return []
+    
+    # Fetch the declarator (both supported node types use the same field name)
+    declarator = None
+    if function_node.type == 'function_definition':
+        declarator = function_node.child_by_field_name('declarator')
+    elif function_node.type == 'declaration':
+        declarator = function_node.child_by_field_name('declarator')
+    
+    if not declarator:
+        return []
+    
+    # Locate the function_declarator, starting the search at the declarator itself
+    def find_function_declarator(n, depth=0, max_depth=10):
+        """Depth-first search for a function_declarator node, giving up beyond max_depth."""
+        if depth > max_depth:
+            return None
+        if n.type == 'function_declarator':
+            return n
+        for child in n.children:
+            result = find_function_declarator(child, depth + 1, max_depth)
+            if result:
+                return result
+        return None
+    
+    func_declarator = find_function_declarator(declarator)
+    if not func_declarator:
+        return []
+    
+    # Fetch the parameter list from the 'parameters' field
+    param_list = func_declarator.child_by_field_name('parameters')
+    if not param_list:
+        return []
+    
+    # Build one string per parameter; children of other node types are skipped
+    parameters = []
+    for child in param_list.children:
+        if child.type == 'parameter_declaration':
+            # Read the parameter's 'type' and 'declarator' fields
+            param_type_node = child.child_by_field_name('type')
+            param_declarator = child.child_by_field_name('declarator')
+            
+            param_type = param_type_node.text.decode('utf8', errors='ignore').strip() if param_type_node else ''
+            
+            # Resolve the parameter name (stays None when there is no declarator)
+            param_name = None
+            if param_declarator:
+                # Find the first identifier inside the declarator (search depth capped at max_depth)
+                def find_identifier_in_declarator(n, depth=0, max_depth=5):
+                    if depth > max_depth:
+                        return None
+                    if n.type == 'identifier':
+                        return n.text.decode('utf8', errors='ignore')
+                    for c in n.children:
+                        result = find_identifier_in_declarator(c, depth + 1, max_depth)
+                        if result:
+                            return result
+                    return None
+                
+                param_name = find_identifier_in_declarator(param_declarator)
+            
+            # Assemble the parameter string; only the type text and the bare identifier are used
+            if param_name:
+                param_str = f"{param_type} {param_name}".strip()
+            else:
+                param_str = param_type if param_type else 'void'
+            
+            if param_str:
+                parameters.append(param_str)
+        elif child.type == 'variadic_parameter':
+            parameters.append('...')
+    
+    return parameters
+
+
 def traverse_c_ast_and_record(client: AstVisitorClient, file_path: str):
     """
     解析 C 代码文件并使用 Tree-sitter 的 cursor 进行深度优先遍历，
@@ -264,6 +367,10 @@ def find_identifier_in_node(n, depth=0, max_depth=10):
                     # 直接记录整个函数定义（包含签名和函数体）到 code 属性
                     func_text = node.text.decode('utf8', errors='ignore')
                     
+                    # 提取返回类型和参数列表
+                    return_type = extract_function_return_type(node)
+                    parameters = extract_function_parameters(node)
+                    
                     name_hierarchy = NameHierarchy(func_name_short, client.current_context_name())
                     symbol_id = client.recordSymbol(
                         name_hierarchy,
@@ -275,11 +382,16 @@ def find_identifier_in_node(n, depth=0, max_depth=10):
                     full_name = client.symbolId_to_Name[symbol_id]
                     client.symbol_data[full_name]['code'] = func_text
                     
-                    # 标记为用户自定义函数并创建图节点
+                    # 标记为用户自定义函数并创建图节点，包含返回类型和参数列表
+                    attributes = {
+                        'category': FunctionCategory.USER_DEFINED.value,
+                        'return_type': return_type,
+                        'parameters': parameters
+                    }
                     client.recordSymbolKind(
                         symbol_id,
                         srctrl.SymbolKind.FUNCTION,
-                        {'category': FunctionCategory.USER_DEFINED.value}
+                        attributes
                     )
                     
                     # 将作用域范围记录为整个函数（含签名），确保 code 包含签名
@@ -353,6 +465,10 @@ def has_function_body(n, depth=0, max_depth=10):
                             # 提取完整的函数定义文本（包括返回类型、函数名、参数列表和函数体）
                             func_text = node.text.decode('utf8', errors='ignore')
                             
+                            # 提取返回类型和参数列表
+                            return_type = extract_function_return_type(node)
+                            parameters = extract_function_parameters(node)
+                            
                             name_hierarchy = NameHierarchy(func_name_short, client.current_context_name())
                             symbol_id = client.recordSymbol(name_hierarchy, node_path=file_path, tree_node=node, kind_hint=symbolKindToString(srctrl.SymbolKind.FUNCTION)) # <--- 修改
                             
@@ -377,7 +493,14 @@ def has_function_body(n, depth=0, max_depth=10):
                                 signature_text = func_text
                             
                             client.symbol_data[full_name]['signature'] = signature_text
-                            client.recordSymbolKind(symbol_id, srctrl.SymbolKind.FUNCTION) # <--- 修改
+                            
+                            # 创建属性字典，包含返回类型和参数列表
+                            attributes = {
+                                'signature': signature_text,
+                                'return_type': return_type,
+                                'parameters': parameters
+                            }
+                            client.recordSymbolKind(symbol_id, srctrl.SymbolKind.FUNCTION, attributes) # <--- 修改
                             
                             # 记录函数的作用域位置
                             client.recordSymbolScopeLocation(symbol_id, source_range)
@@ -393,14 +516,23 @@ def has_function_body(n, depth=0, max_depth=10):
                             # 提取完整的函数声明文本（包括返回类型、函数名、参数列表）
                             declaration_text = node.text.decode('utf8', errors='ignore')
                             
+                            # 提取返回类型和参数列表
+                            return_type = extract_function_return_type(node)
+                            parameters = extract_function_parameters(node)
+                            
                             name_hierarchy = NameHierarchy(func_name_short, client.current_context_name())
                             symbol_id = client.recordSymbol(name_hierarchy, node_path=file_path, tree_node=node, kind_hint=symbolKindToString(srctrl.SymbolKind.FUNCTION_DECLARATION)) # <--- 修改
                             
                             # 将完整的函数声明文本存储到 code 属性
                             full_name = client.symbolId_to_Name[symbol_id]
                             client.symbol_data[full_name]['code'] = declaration_text
                             
-                            client.recordSymbolKind(symbol_id, srctrl.SymbolKind.FUNCTION_DECLARATION) # <--- 修改
+                            # 创建属性字典，包含返回类型和参数列表
+                            attributes = {
+                                'return_type': return_type,
+                                'parameters': parameters
+                            }
+                            client.recordSymbolKind(symbol_id, srctrl.SymbolKind.FUNCTION_DECLARATION, attributes) # <--- 修改
                             # print(f"  [CLIENT] Recorded FUNCTION_DECLARATION: {client.symbolId_to_Name[symbol_id]} in {file_name}")
                 
                 elif declarator.type == 'init_declarator' or declarator.type == 'declarator': # 变量声明 (可能带初始化)
diff --git a/scripts/request.json b/scripts/request.json
@@ -7,7 +7,7 @@
   "llm_config":                                                                                                                                                     {
     "model": "deepseek-coder",
     "model_server": "openai",
-    "api_base": "https://api.deepseek.com",
+    "api_base": "https://jeniya.cn/v1",
     "api_key": "sk-d6462958a57b4922ac0974c6521809d9",
     "generate_config": {
       "temperature": 0.2

Original file line number	Diff line number	Diff line change
`@@ -21,7 +21,7 @@ def get_llm_config(llm_name):`
`21`	`21`
`22`	`22`	`llm_config = {`
`23`	`23`	`'model': 'deepseek-coder',`
`24`		`- 'api_base': 'https://api.deepseek.com',`
	`24`	`+ 'api_base': 'https://jeniya.cn/v1',`
`25`	`25`	`'model_server': 'openai'`
`26`	`26`	`}`
`27`	`27`
Original file line number	Diff line number	Diff line change
`@@ -44,7 +44,7 @@ def __init__(`
`44`	`44`	`)`
`45`	`45`	`else:`
`46`	`46`	`default_api_base = os.getenv('OPENAI_API_BASE',`
`47`		`- 'https://api.openai.com/v1')`
	`47`	`+ 'https://jeniya.cn/v1')`
`48`	`48`	`api_base = kwargs.get('api_base', default_api_base).strip()`
`49`	`49`	`api_key = kwargs.get('api_key',`
`50`	`50`	`os.getenv('OPENAI_API_KEY',`