PyPI - auto-coder - Versions diffs - 0.1.361__py3-none-any.whl → 0.1.362__py3-none-any.whl - Mend

auto-coder 0.1.361__py3-none-any.whl → 0.1.362__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of auto-coder might be problematic. Click here for more details.

Files changed (21) hide show

{auto_coder-0.1.361.dist-info → auto_coder-0.1.362.dist-info}/METADATA +2 -1
{auto_coder-0.1.361.dist-info → auto_coder-0.1.362.dist-info}/RECORD +21 -21
autocoder/agent/auto_learn.py +249 -262
autocoder/auto_coder.py +1 -1
autocoder/auto_coder_runner.py +34 -12
autocoder/commands/auto_command.py +227 -159
autocoder/common/__init__.py +2 -2
autocoder/common/ignorefiles/ignore_file_utils.py +12 -8
autocoder/common/result_manager.py +10 -2
autocoder/common/rulefiles/autocoderrules_utils.py +145 -0
autocoder/common/v2/agent/agentic_edit.py +32 -22
autocoder/common/v2/agent/agentic_edit_tools/read_file_tool_resolver.py +15 -12
autocoder/common/v2/code_auto_generate_editblock.py +3 -1
autocoder/index/index.py +14 -8
autocoder/privacy/model_filter.py +297 -35
autocoder/utils/_markitdown.py +22 -3
autocoder/version.py +1 -1
{auto_coder-0.1.361.dist-info → auto_coder-0.1.362.dist-info}/LICENSE +0 -0
{auto_coder-0.1.361.dist-info → auto_coder-0.1.362.dist-info}/WHEEL +0 -0
{auto_coder-0.1.361.dist-info → auto_coder-0.1.362.dist-info}/entry_points.txt +0 -0
{auto_coder-0.1.361.dist-info → auto_coder-0.1.362.dist-info}/top_level.txt +0 -0

autocoder/common/ignorefiles/ignore_file_utils.py CHANGED Viewed

@@ -1,9 +1,9 @@
 import os
 from pathlib import Path
 from threading import Lock
 import pathspec
 import threading
+from typing import Optional  # 添加Optional导入
 # 尝试导入 FileMonitor
 try:
@@ -24,7 +24,7 @@ class IgnoreFileManager:
     _instance = None
     _lock = Lock()
-    def __new__(cls):
+    def __new__(cls, project_root: Optional[str] = None):
         if not cls._instance:
             with cls._lock:
                 if not cls._instance:
@@ -32,20 +32,21 @@ class IgnoreFileManager:
                     cls._instance._initialized = False
         return cls._instance
-    def __init__(self):
+    def __init__(self, project_root: Optional[str] = None):
         if self._initialized:
             return
         self._initialized = True
         self._spec = None
         self._ignore_file_path = None
         self._file_monitor = None
+        self._project_root = project_root if project_root is not None else os.getcwd()
         self._load_ignore_spec()
         self._setup_file_monitor()
     def _load_ignore_spec(self):
         """加载忽略规则文件并解析规则"""
         ignore_patterns = []
-        project_root = Path(os.getcwd())
+        project_root = Path(self._project_root)
         ignore_file_paths = [
             project_root / '.autocoderignore',
@@ -89,15 +90,18 @@ class IgnoreFileManager:
     def should_ignore(self, path: str) -> bool:
         """判断指定路径是否应该被忽略"""
-        rel_path = os.path.relpath(path, os.getcwd())
+        rel_path = os.path.relpath(path, self._project_root)
         # 标准化分隔符
         rel_path = rel_path.replace(os.sep, '/')
         return self._spec.match_file(rel_path)
-# 对外提供单例
-_ignore_manager = IgnoreFileManager()
+# 对外提供的单例管理器
+_ignore_manager = None
-def should_ignore(path: str) -> bool:
+def should_ignore(path: str, project_root: Optional[str] = None) -> bool:
     """判断指定路径是否应该被忽略"""
+    global _ignore_manager
+    if _ignore_manager is None:
+        _ignore_manager = IgnoreFileManager(project_root=project_root)
     return _ignore_manager.should_ignore(path)

autocoder/common/result_manager.py CHANGED Viewed

@@ -16,16 +16,24 @@ class ResultItem(BaseModel):
 class ResultManager:
     """结果管理器，用于维护一个追加写入的jsonl文件"""
-    def __init__(self, source_dir: Optional[str] = None):
+    def __init__(self, source_dir: Optional[str] = None, event_file: Optional[str] = None):
         """
         初始化结果管理器
         Args:
             source_dir: 可选的源目录，如果不提供则使用当前目录
+            event_file: 可选的事件文件路径，用于生成结果文件名
         """
         self.source_dir = source_dir or os.getcwd()
         self.result_dir = os.path.join(self.source_dir, ".auto-coder", "results")
-        self.result_file = os.path.join(self.result_dir, "results.jsonl")
+        if event_file:
+            # 获取文件名并去掉后缀
+            event_file_name = os.path.splitext(os.path.basename(event_file))[0]
+            self.result_file = os.path.join(self.result_dir, f"{event_file_name}.jsonl")
+        else:
+            self.result_file = os.path.join(self.result_dir, "results.jsonl")
         os.makedirs(self.result_dir, exist_ok=True)
     def append(self, content: str, meta: Optional[Dict[str, Any]] = None) -> ResultItem:

autocoder/common/rulefiles/autocoderrules_utils.py CHANGED Viewed

@@ -6,7 +6,10 @@ from typing import Dict, List, Optional
 from loguru import logger
 import re
 import yaml
+import byzerllm # Added import
 from pydantic import BaseModel, Field
+from typing import List, Dict, Optional, Any # Added Any
+from autocoder.common import AutoCoderArgs
 # 尝试导入 FileMonitor
 try:
@@ -254,3 +257,145 @@ def parse_rule_file(file_path: str, project_root: Optional[str] = None) -> RuleF
     if _rules_manager is None:
         _rules_manager = AutocoderRulesManager(project_root=project_root)
     return _rules_manager.parse_rule_file(file_path)
+# 添加用于返回类型的Pydantic模型
+class RuleRelevance(BaseModel):
+    """用于规则相关性判断的返回模型"""
+    is_relevant: bool = Field(description="规则是否与当前任务相关")
+    reason: str = Field(default="", description="判断理由")
+class RuleSelector:
+    """
+    根据LLM的判断和规则元数据选择适用的规则。
+    """
+    def __init__(self, llm: Optional[byzerllm.ByzerLLM], args: Optional[AutoCoderArgs] = None):
+        """
+        初始化RuleSelector。
+        Args:
+            llm: ByzerLLM 实例，用于判断规则是否适用。如果为 None，则只选择 always_apply=True 的规则。
+            args: 传递给 Agent 的参数，可能包含用于规则选择的上下文信息。
+        """
+        self.llm = llm
+        self.args = args
+    @byzerllm.prompt()
+    def _build_selection_prompt(self, rule: RuleFile, context: str = "") -> str:
+        """
+        判断规则是否适用于当前任务。
+        规则描述:
+        {{ rule.description }}
+        规则内容摘要 (前200字符):
+        {{ rule.content[:200] }}
+        {% if context %}
+        任务上下文:
+        {{ context }}
+        {% endif %}
+        基于以上信息，判断这条规则 (路径: {{ rule.file_path }}) 是否与当前任务相关并应该被应用？
+        请以JSON格式返回结果:
+        ```json
+        {
+            "is_relevant": true或false,
+            "reason": "判断理由"
+        }
+        ```
+        """
+        # 注意：确保 rule 对象和 context 字典能够被 Jinja2 正确访问。
+        # Pydantic模型可以直接在Jinja2中使用其属性。
+        return {
+            "rule": rule,
+            "context": context
+        }
+    def select_rules(self, context: str, rules: List[RuleFile]) -> List[RuleFile]:
+        """
+        选择适用于当前上下文的规则。
+        Args:
+            context: 可选的字典，包含用于规则选择的上下文信息 (例如，用户指令、目标文件等)。
+        Returns:
+            List[RuleFile]: 选定的规则列表。
+        """
+        selected_rules: List[RuleFile] = []
+        logger.info(f"开始选择规则，总规则数: {len(rules)}")
+        for rule in rules:
+            if rule.always_apply:
+                selected_rules.append(rule)
+                logger.debug(f"规则 '{os.path.basename(rule.file_path)}' (AlwaysApply=True) 已自动选择。")
+                continue
+            if self.llm is None:
+                 logger.debug(f"规则 '{os.path.basename(rule.file_path)}' (AlwaysApply=False) 已跳过，因为未提供 LLM。")
+                 continue
+            # 对于 alwaysApply=False 的规则，使用 LLM 判断
+            try:
+                prompt = self._build_selection_prompt.prompt(rule=rule, context=context)
+                logger.debug(f"为规则 '{os.path.basename(rule.file_path)}' 生成的判断 Prompt (片段): {prompt[:200]}...")
+                # **** 实际LLM调用 ****
+                # 确保 self.llm 实例已正确初始化并可用
+                if self.llm: # Check if llm is not None
+                    result = None
+                    try:
+                        # 使用with_return_type方法获取结构化结果
+                        result = self._build_selection_prompt.with_llm(self.llm).with_return_type(RuleRelevance).run(rule=rule, context=context)
+                        if result and result.is_relevant:
+                            selected_rules.append(rule)
+                            logger.info(f"规则 '{os.path.basename(rule.file_path)}' (AlwaysApply=False) 已被 LLM 选择，原因: {result.reason}")
+                        else:
+                            logger.debug(f"规则 '{os.path.basename(rule.file_path)}' (AlwaysApply=False) 未被 LLM 选择，原因: {result.reason if result else '未提供'}")
+                    except Exception as e:
+                        logger.warning(f"LLM 未能为规则 '{os.path.basename(rule.file_path)}' 提供有效响应。")
+                        # 根据需要决定是否跳过或默认不选
+                        continue # 跳过此规则
+                else: # Handle case where self.llm is None after the initial check
+                    logger.warning(f"LLM instance became None unexpectedly for rule '{os.path.basename(rule.file_path)}'.")
+                    continue
+                # **** 模拟LLM调用 (用于测试/开发) ****
+                # 注释掉模拟部分，使用上面的实际调用
+                # simulated_response = "yes" if "always" in rule.description.lower() or "index" in rule.description.lower() else "no"
+                # logger.warning(f"模拟LLM判断规则 '{os.path.basename(rule.file_path)}': {simulated_response}")
+                # response_text = simulated_response
+                # **** 结束模拟 ****
+            except Exception as e:
+                logger.error(f"使用 LLM 判断规则 '{os.path.basename(rule.file_path)}' 时出错: {e}", exc_info=True)
+                # 根据策略决定是否包含出错的规则，这里选择跳过
+                continue
+        logger.info(f"规则选择完成，选中规则数: {len(selected_rules)}")
+        return selected_rules
+    def get_selected_rules_content(self, context: Optional[Dict] = None) -> Dict[str, str]:
+        """
+        获取选定规则的文件路径和内容字典。
+        Args:
+            context: 传递给 select_rules 的上下文。
+        Returns:
+            Dict[str, str]: 选定规则的 {file_path: content} 字典。
+        """
+        selected_rules = self.select_rules(context=context)
+        # 使用 os.path.basename 获取文件名作为 key，如果需要的话
+        # return {os.path.basename(rule.file_path): rule.content for rule in selected_rules}
+        # 保持 file_path 作为 key
+        return {rule.file_path: rule.content for rule in selected_rules}
+def auto_select_rules(context: str, rules: List[RuleFile], llm: Optional[byzerllm.ByzerLLM] = None,args:Optional[AutoCoderArgs] = None) -> List[RuleFile]:
+    """
+    根据LLM的判断和规则元数据选择适用的规则。
+    """
+    selector = RuleSelector(llm=llm, args=args)
+    return selector.select_rules(context=context, rules=rules)

autocoder/common/v2/agent/agentic_edit.py CHANGED Viewed

@@ -10,7 +10,6 @@ from rich.panel import Panel
 from pydantic import SkipValidation
 from byzerllm.utils.types import SingleOutputMeta
-# Removed ResultManager, stream_out, git_utils, AutoCommandTools, count_tokens, global_cancel, ActionYmlFileManager, get_event_manager, EventContentCreator, get_run_context, AgenticFilterStreamOutType
 from autocoder.common import AutoCoderArgs, git_utils, SourceCodeList, SourceCode
 from autocoder.common.global_cancel import global_cancel
 from autocoder.common import detect_env
@@ -692,6 +691,15 @@ class AgenticEdit:
         3. Remember, you have extensive capabilities with access to a wide range of tools that can be used in powerful and clever ways as necessary to accomplish each goal. Before calling a tool, do some analysis within <thinking></thinking> tags. First, analyze the file structure provided in environment_details to gain context and insights for proceeding effectively. Then, think about which of the provided tools is the most relevant tool to accomplish the user's task. Next, go through each of the required parameters of the relevant tool and determine if the user has directly provided or given enough information to infer a value. When deciding if the parameter can be inferred, carefully consider all the context to see if it supports a specific value. If all of the required parameters are present or can be reasonably inferred, close the thinking tag and proceed with the tool use. BUT, if one of the values for a required parameter is missing, DO NOT invoke the tool (not even with fillers for the missing params) and instead, ask the user to provide the missing parameters using the ask_followup_question tool. DO NOT ask for more information on optional parameters if it is not provided.
         4. Once you've completed the user's task, you must use the attempt_completion tool to present the result of the task to the user. You may also provide a CLI command to showcase the result of your task; this can be particularly useful for web development tasks, where you can run e.g. \`open index.html\` to show the website you've built.
         5. The user may provide feedback, which you can use to make improvements and try again. But DO NOT continue in pointless back and forth conversations, i.e. don't end your responses with questions or offers for further assistance.
+        {% if file_paths_str %}
+        ====
+        The following are files that the user is currently focusing on.
+        Make sure you always start your analysis by using the read_file tool to get the content of the files.
+        <files>
+        {{file_paths_str}}
+        </files>
+        {% endif %}
         """
         import os
         extra_docs = get_rules()
@@ -702,6 +710,8 @@ class AgenticEdit:
             shell_type = "cmd"
         elif shells.is_running_in_powershell():
             shell_type = "powershell"
+        file_paths_str = "\n".join([file_source.module_name for file_source in self.files.sources])
         return {
             "conversation_history": self.conversation_history,
             "env_info": env_info,
@@ -716,6 +726,7 @@ class AgenticEdit:
             "mcp_server_info": self.mcp_server_info,
             "enable_active_context_in_generate": self.args.enable_active_context_in_generate,
             "extra_docs": extra_docs,
+            "file_paths_str": file_paths_str,
         }
     # Removed _execute_command_result and execute_auto_command methods
@@ -773,27 +784,15 @@ class AgenticEdit:
         conversations = [
             {"role": "system", "content": system_prompt},
         ]
-        logger.info("Adding initial files context to conversation")
-        conversations.append({
-            "role":"user","content":f'''
-The following are context files that the user is currently focusing on. These files are presented with their complete paths and up-to-date content, providing essential context to help you better understand the user's needs. If you need more detailed information about specific files or directories not shown here, you can use tools like read_file, search_files, or list_files to explore the codebase further.
-<files>
-{self.files.to_str()}
-</files>'''
-        })
-        conversations.append({
-            "role":"assistant","content":"Ok"
-        })
-        logger.info("Adding conversation history")
         conversations.append({
             "role": "user", "content": request.user_input
         })
         logger.info(
             f"Initial conversation history size: {len(conversations)}")
+        logger.info(f"Conversation history: {json.dumps(conversations, indent=2,ensure_ascii=False)}")
         iteration_count = 0
         tool_executed = False
@@ -960,12 +959,17 @@ The following are context files that the user is currently focusing on. These fi
                     elif last_message["role"] == "assistant":
                         logger.info("Appending to existing assistant message")
                         last_message["content"] += assistant_buffer
-                # If the loop ends without AttemptCompletion, it means the LLM finished talking
-                # without signaling completion. We might just stop or yield a final message.
-                # Let's assume it stops here.
-                logger.info("No tool executed and LLM finished. Breaking out of main loop.")
-                break
+                # 添加系统提示，要求LLM必须使用工具或明确结束，而不是直接退出
+                logger.info("Adding system reminder to use tools or attempt completion")
+                conversations.append({
+                    "role": "user",
+                    "content": "NOTE: You must use an appropriate tool (such as read_file, write_to_file, execute_command, etc.) or explicitly complete the task (using attempt_completion). Do not provide text responses without taking concrete actions. Please select a suitable tool to continue based on the user's task."
+                })
+                # 继续循环，让 LLM 再思考，而不是 break
+                logger.info("Continuing the LLM interaction loop without breaking")
+                continue
         logger.info(f"AgenticEdit analyze loop finished after {iteration_count} iterations.")
     def stream_and_parse_llm_response(
@@ -1264,6 +1268,9 @@ The following are context files that the user is currently focusing on. These fi
                     output_cost = (
                         last_meta.generated_tokens_count * output_price) / 1000000
+                    # 添加日志记录
+                    logger.info(f"Token Usage Details: Model={model_name}, Input Tokens={last_meta.input_tokens_count}, Output Tokens={last_meta.generated_tokens_count}, Input Cost=${input_cost:.6f}, Output Cost=${output_cost:.6f}")
                     get_event_manager(self.args.event_file).write_result(
                         EventContentCreator.create_result(content=EventContentCreator.ResultTokenStatContent(
                             model_name=model_name,
@@ -1447,6 +1454,9 @@ The following are context files that the user is currently focusing on. These fi
                     output_cost = (
                         last_meta.generated_tokens_count * output_price) / 1000000
+                    # 添加日志记录
+                    logger.info(f"Token Usage: Model={model_name}, Input Tokens={last_meta.input_tokens_count}, Output Tokens={last_meta.generated_tokens_count}, Input Cost=${input_cost:.6f}, Output Cost=${output_cost:.6f}")
                     self.printer.print_in_terminal(
                             "code_generation_complete",
                             duration=0.0,

autocoder/common/v2/agent/agentic_edit_tools/read_file_tool_resolver.py CHANGED Viewed

@@ -22,20 +22,23 @@ class ReadFileToolResolver(BaseToolResolver):
         abs_project_dir = os.path.abspath(source_dir)
         abs_file_path = os.path.abspath(os.path.join(source_dir, file_path))
-        # Security check: ensure the path is within the source directory
-        if not abs_file_path.startswith(abs_project_dir):
-            return ToolResult(success=False, message=f"Error: Access denied. Attempted to read file outside the project directory: {file_path}")
+        # # Security check: ensure the path is within the source directory
+        # if not abs_file_path.startswith(abs_project_dir):
+        #     return ToolResult(success=False, message=f"Error: Access denied. Attempted to read file outside the project directory: {file_path}")
         try:
-            if self.shadow_manager:
-                shadow_path = self.shadow_manager.to_shadow_path(abs_file_path)
-                # If shadow file exists, read from it
-                if os.path.exists(shadow_path) and os.path.isfile(shadow_path):
-                    with open(shadow_path, 'r', encoding='utf-8', errors='replace') as f:
-                        content = f.read()
-                    logger.info(f"[Shadow] Successfully read shadow file: {shadow_path}")
-                    return ToolResult(success=True, message=f"Successfully read file (shadow): {file_path}", content=content)
-                # else fallback to original file
+            try:
+                if self.shadow_manager:
+                    shadow_path = self.shadow_manager.to_shadow_path(abs_file_path)
+                    # If shadow file exists, read from it
+                    if os.path.exists(shadow_path) and os.path.isfile(shadow_path):
+                        with open(shadow_path, 'r', encoding='utf-8', errors='replace') as f:
+                            content = f.read()
+                        logger.info(f"[Shadow] Successfully read shadow file: {shadow_path}")
+                        return ToolResult(success=True, message=f"Successfully read file (shadow): {file_path}", content=content)
+            except Exception as e:
+                pass
+            # else fallback to original file
             # Fallback to original file
             if not os.path.exists(abs_file_path):
                 return ToolResult(success=False, message=f"Error: File not found at path: {file_path}")

autocoder/common/v2/code_auto_generate_editblock.py CHANGED Viewed

@@ -215,8 +215,10 @@ class CodeAutoGenerateEditBlock:
         ====
         下面是用户的需求：
+        <user_instruction>
         {{ instruction }}
+        </user_instruction>
         """
         if not self.args.include_project_structure:

autocoder/index/index.py CHANGED Viewed

@@ -31,6 +31,7 @@ from autocoder.rag.token_counter import count_tokens
 from autocoder.common.stream_out_type import IndexStreamOutType
 from autocoder.events.event_manager_singleton import get_event_manager
 from autocoder.events import event_content as EventContentCreator
+from loguru import logger
 class IndexManager:
     def __init__(
@@ -220,7 +221,7 @@ class IndexManager:
         5. 导入语句中需要包含 jsp:include 整个标签，类似 <jsp:include page="/jspf/prelude.jspf" />
         6. 导入语句中需要包含 form 标签，类似 <form name="ActionPlanLinkedForm" action="/ri/ActionPlanController.do" method="post">
         7. 导入语句中需要包含 有 src 属性的 script 标签。比如 <script language="script" src="xxx">
-        8. 导入语句中需要包含 有 src 属性的 link 标签。 比如 <link rel="stylesheet" type="text/css" href="/ri/ui/styles/xptheme.css">
+        8. 导入语句中需要包含 有 src 属性的 link 标签。 比如 <link rel="stylesheet" type="text/css" href="/ri/ui/styles/xptheme.css">
         9. 导入语句中需要包含 ajax 请求里的url,比如 $.ajax({
         type : "post",
         url : "admWorkingDay!updateAdmWorkingDayList.action",  中，那么对应的为 <ajax method="post" url="admWorkingDay!updateAdmWorkingDayList.action">
@@ -656,13 +657,18 @@ class IndexManager:
         index_items = []
         for module_name, data in index_data.items():
-            index_item = IndexItem(
-                module_name=module_name,
-                symbols=data["symbols"],
-                last_modified=data["last_modified"],
-                md5=data["md5"],
-            )
-            index_items.append(index_item)
+            try:
+                index_item = IndexItem(
+                    module_name=module_name,
+                    symbols=data["symbols"],
+                    last_modified=data["last_modified"],
+                    md5=data["md5"],
+                )
+                index_items.append(index_item)
+            except (KeyError, TypeError) as e:
+                logger.warning(f"处理索引条目 {module_name} 时出错: {str(e)}")
+                logger.exception(e)
+                continue
         return index_items

auto-coder 0.1.361__py3-none-any.whl → 0.1.362__py3-none-any.whl

Potentially problematic release.

auto-coder 0.1.361__py3-none-any.whl → 0.1.362__py3-none-any.whl