PyPI - autocoder-nano - Versions diffs - 0.1.26__py3-none-any.whl → 0.1.28__py3-none-any.whl - Mend

autocoder-nano 0.1.26-py3-none-any.whl → 0.1.28-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (22)

autocoder_nano/agent/agent_base.py +376 -63
autocoder_nano/auto_coder_nano.py +89 -1106
autocoder_nano/edit/__init__.py +20 -0
autocoder_nano/edit/actions.py +136 -0
autocoder_nano/edit/code/__init__.py +0 -0
autocoder_nano/edit/code/generate_editblock.py +403 -0
autocoder_nano/edit/code/merge_editblock.py +418 -0
autocoder_nano/edit/code/modification_ranker.py +90 -0
autocoder_nano/edit/text.py +38 -0
autocoder_nano/index/index_manager.py +1 -0
autocoder_nano/index/symbols_utils.py +43 -0
autocoder_nano/llm_types.py +1 -0
autocoder_nano/project/pyproject.py +1 -1
autocoder_nano/project/suffixproject.py +1 -1
autocoder_nano/version.py +1 -1
autocoder_nano-0.1.28.dist-info/METADATA +445 -0
{autocoder_nano-0.1.26.dist-info → autocoder_nano-0.1.28.dist-info}/RECORD +21 -13
autocoder_nano-0.1.26.dist-info/METADATA +0 -432
{autocoder_nano-0.1.26.dist-info → autocoder_nano-0.1.28.dist-info}/LICENSE +0 -0
{autocoder_nano-0.1.26.dist-info → autocoder_nano-0.1.28.dist-info}/WHEEL +0 -0
{autocoder_nano-0.1.26.dist-info → autocoder_nano-0.1.28.dist-info}/entry_points.txt +0 -0
{autocoder_nano-0.1.26.dist-info → autocoder_nano-0.1.28.dist-info}/top_level.txt +0 -0

autocoder_nano/auto_coder_nano.py (changed)

@@ -2,21 +2,18 @@ import argparse
 import glob
 import hashlib
 import os
-import re
 import json
 import shutil
 import subprocess
-import tempfile
 import textwrap
 import time
-import traceback
 import uuid
-from difflib import SequenceMatcher
-from autocoder_nano.agent.new.auto_new_project import BuildNewProject
+from autocoder_nano.edit import Dispacher
 from autocoder_nano.helper import show_help
 from autocoder_nano.index.entry import build_index_and_filter_files
 from autocoder_nano.index.index_manager import IndexManager
+from autocoder_nano.index.symbols_utils import extract_symbols
 from autocoder_nano.llm_client import AutoLLM
 from autocoder_nano.version import __version__
 from autocoder_nano.llm_types import *
@@ -55,7 +52,7 @@ base_persist_dir = os.path.join(project_root, ".auto-coder", "plugins", "chat-au
 #                        ".vscode", ".idea", ".hg"]
 commands = [
     "/add_files", "/remove_files", "/list_files", "/conf", "/coding", "/chat", "/revert", "/index/query",
-    "/index/build", "/exclude_dirs", "/help", "/shell", "/exit", "/mode", "/models", "/commit", "/new"
+    "/index/build", "/exclude_dirs", "/exclude_files", "/help", "/shell", "/exit", "/mode", "/models", "/commit", "/new"
 ]
 memory = {
@@ -77,29 +74,6 @@ memory = {
 args: AutoCoderArgs = AutoCoderArgs()
-def extract_symbols(text: str) -> SymbolsInfo:
-    patterns = {
-        "usage": r"用途：(.+)",
-        "functions": r"函数：(.+)",
-        "variables": r"变量：(.+)",
-        "classes": r"类：(.+)",
-        "import_statements": r"导入语句：(.+)",
-    }
-    info = SymbolsInfo()
-    for field, pattern in patterns.items():
-        match = re.search(pattern, text)
-        if match:
-            value = match.group(1).strip()
-            if field == "import_statements":
-                value = [v.strip() for v in value.split("^^")]
-            elif field == "functions" or field == "variables" or field == "classes":
-                value = [v.strip() for v in value.split(",")]
-            setattr(info, field, value)
-    return info
 def get_all_file_names_in_project() -> List[str]:
     file_names = []
     final_exclude_dirs = default_exclude_dirs + memory.get("exclude_dirs", [])
@@ -223,7 +197,9 @@ COMMANDS = {
         "/conf": "",
         "/mode": "",
         "/models": ""
-    }
+    },
+    "/exclude_files": {"/list": "", "/drop": ""},
+    "/exclude_dirs": {}
 }
@@ -701,6 +677,15 @@ class CommandCompleter(Completer):
                     if current_word and current_word in file_name:
                         yield Completion(file_name, start_position=-len(current_word))
+            elif words[0] == "/exclude_files":
+                new_text = text[len("/exclude_files"):]
+                parser = CommandTextParser(new_text, words[0])
+                parser.add_files()
+                current_word = parser.current_word()
+                for command in parser.get_sub_commands():
+                    if command.startswith(current_word):
+                        yield Completion(command, start_position=-len(current_word))
             elif words[0] == "/models":
                 new_text = text[len("/models"):]
                 parser = CommandTextParser(new_text, words[0])
@@ -798,20 +783,69 @@ def load_memory():
     completer.update_current_files(memory["current_files"]["files"])
-def symbols_info_to_str(info: SymbolsInfo, symbol_types: List[SymbolType]) -> str:
-    result = []
-    for symbol_type in symbol_types:
-        value = getattr(info, symbol_type.value)
-        if value:
-            if symbol_type == SymbolType.IMPORT_STATEMENTS:
-                value_str = "^^".join(value)
-            elif symbol_type in [SymbolType.FUNCTIONS, SymbolType.VARIABLES, SymbolType.CLASSES,]:
-                value_str = ",".join(value)
-            else:
-                value_str = value
-            result.append(f"{symbol_type.value}：{value_str}")
+def exclude_dirs(dir_names: List[str]):
+    new_dirs = dir_names
+    existing_dirs = memory.get("exclude_dirs", [])
+    dirs_to_add = [d for d in new_dirs if d not in existing_dirs]
+    if dirs_to_add:
+        existing_dirs.extend(dirs_to_add)
+        if "exclude_dirs" not in memory:
+            memory["exclude_dirs"] = existing_dirs
+        print(f"Added exclude dirs: {dirs_to_add}")
+        for d in dirs_to_add:
+            exclude_files(f"regex://.*/{d}/*.")
+        # exclude_files([f"regex://.*/{d}/*." for d in dirs_to_add])
+    else:
+        print("All specified dirs are already in the exclude list.")
+    save_memory()
+    completer.refresh_files()
-    return "\n".join(result)
+def exclude_files(query: str):
+    if "/list" in query:
+        query = query.replace("/list", "", 1).strip()
+        existing_file_patterns = memory.get("exclude_files", [])
+        # 打印表格
+        table = Table(title="Exclude Files")
+        table.add_column("File Pattern")
+        for file_pattern in existing_file_patterns:
+            table.add_row(file_pattern)
+        console.print(table)
+        return
+    if "/drop" in query:
+        query = query.replace("/drop", "", 1).strip()
+        existing_file_patterns = memory.get("exclude_files", [])
+        existing_file_patterns.remove(query.strip())
+        memory["exclude_files"] = existing_file_patterns
+        if query.startswith("regex://.*/") and query.endswith("/*."):
+            existing_dirs_patterns = memory.get("exclude_dirs", [])
+            dir_query = query.replace("regex://.*/", "", 1).replace("/*.", "", 1)
+            if dir_query in existing_dirs_patterns:
+                existing_dirs_patterns.remove(dir_query.strip())
+        save_memory()
+        completer.refresh_files()
+        return
+    new_file_patterns = query.strip().split(",")
+    existing_file_patterns = memory.get("exclude_files", [])
+    file_patterns_to_add = [f for f in new_file_patterns if f not in existing_file_patterns]
+    for file_pattern in file_patterns_to_add:
+        if not file_pattern.startswith("regex://"):
+            raise
+    if file_patterns_to_add:
+        existing_file_patterns.extend(file_patterns_to_add)
+        if "exclude_files" not in memory:
+            memory["exclude_files"] = existing_file_patterns
+        save_memory()
+        print(f"Added exclude files: {file_patterns_to_add}")
+    else:
+        print("All specified files are already in the exclude list.")
 def index_command(llm):
@@ -1007,7 +1041,8 @@ def update_config_to_args(query, delete_execute_file: bool = False):
         "skip_confirm": conf.get("skip_confirm", "true") == "true",
         "chat_model": conf.get("chat_model", ""),
         "code_model": conf.get("code_model", ""),
-        "auto_merge": conf.get("auto_merge", "editblock")
+        "auto_merge": conf.get("auto_merge", "editblock"),
+        "exclude_files": memory.get("exclude_files", [])
     }
     current_files = memory["current_files"]["files"]
     yaml_config["urls"] = current_files
@@ -1220,30 +1255,6 @@ def chat(query: str, llm: AutoLLM):
     return
-def git_print_commit_info(commit_result: CommitResult):
-    table = Table(
-        title="Commit Information (Use /revert to revert this commit)", show_header=True, header_style="bold magenta"
-    )
-    table.add_column("Attribute", style="cyan", no_wrap=True)
-    table.add_column("Value", style="green")
-    table.add_row("Commit Hash", commit_result.commit_hash)
-    table.add_row("Commit Message", commit_result.commit_message)
-    table.add_row("Changed Files", "\n".join(commit_result.changed_files))
-    console.print(
-        Panel(table, expand=False, border_style="green", title="Git Commit Summary")
-    )
-    if commit_result.diffs:
-        for file, diff in commit_result.diffs.items():
-            console.print(f"\n[bold blue]File: {file}[/bold blue]")
-            syntax = Syntax(diff, "diff", theme="monokai", line_numbers=True)
-            console.print(
-                Panel(syntax, expand=False, border_style="yellow", title="File Diff")
-            )
 def init_project():
     if not args.project_type:
         logger.error(
@@ -1316,1040 +1327,6 @@ def load_include_files(config, base_path, max_depth=10, current_depth=0):
     return config
-class CodeAutoGenerateEditBlock:
-    def __init__(self, llm: AutoLLM, action=None, fence_0: str = "```", fence_1: str = "```"):
-        self.llm = llm
-        # self.llm.setup_default_model_name(memory["conf"]["current_code_model"])
-        self.args = args
-        self.action = action
-        self.fence_0 = fence_0
-        self.fence_1 = fence_1
-        if not self.llm:
-            raise ValueError("Please provide a valid model instance to use for code generation.")
-        self.llms = [self.llm]
-    @prompt()
-    def single_round_instruction(self, instruction: str, content: str, context: str = ""):
-        """
-        如果你需要生成代码，对于每个需要更改的文件,你需要按 *SEARCH/REPLACE block* 的格式进行生成。
-        # *SEARCH/REPLACE block* Rules:
-        Every *SEARCH/REPLACE block* must use this format:
-        1. The opening fence and code language, eg: {{ fence_0 }}python
-        2. The file path alone on a line, starting with "##File:" and verbatim. No bold asterisks, no quotes around it,
-        no escaping of characters, etc.
-        3. The start of search block: <<<<<<< SEARCH
-        4. A contiguous chunk of lines to search for in the existing source code
-        5. The dividing line: =======
-        6. The lines to replace into the source code
-        7. The end of the replacement block: >>>>>>> REPLACE
-        8. The closing fence: {{ fence_1 }}
-        Every *SEARCH* section must *EXACTLY MATCH* the existing source code, character for character,
-        including all comments, docstrings, etc.
-        *SEARCH/REPLACE* blocks will replace *all* matching occurrences.
-        Include enough lines to make the SEARCH blocks unique.
-        Include *ALL* the code being searched and replaced!
-        To move code within a file, use 2 *SEARCH/REPLACE* blocks: 1 to delete it from its current location,
-        1 to insert it in the new location.
-        If you want to put code in a new file, use a *SEARCH/REPLACE block* with:
-        - A new file path, including dir name if needed
-        - An empty `SEARCH` section
-        - The new file's contents in the `REPLACE` section
-        ONLY EVER RETURN CODE IN A *SEARCH/REPLACE BLOCK*!
-        下面我们来看一个例子：
-        当前项目目录结构：
-        1. 项目根目录： /tmp/projects/mathweb
-        2. 项目子目录/文件列表(类似tree 命令输出)
-        flask/
-            app.py
-            templates/
-                index.html
-            static/
-                style.css
-        用户需求： Change get_factorial() to use math.factorial
-        回答： To make this change we need to modify `/tmp/projects/mathweb/flask/app.py` to:
-        1. Import the math package.
-        2. Remove the existing factorial() function.
-        3. Update get_factorial() to call math.factorial instead.
-        Here are the *SEARCH/REPLACE* blocks:
-        ```python
-        ##File: /tmp/projects/mathweb/flask/app.py
-        <<<<<<< SEARCH
-        from flask import Flask
-        =======
-        import math
-        from flask import Flask
-        >>>>>>> REPLACE
-        ```
-        ```python
-        ##File: /tmp/projects/mathweb/flask/app.py
-        <<<<<<< SEARCH
-        def factorial(n):
-            "compute factorial"
-            if n == 0:
-                return 1
-            else:
-                return n * factorial(n-1)
-        =======
-        >>>>>>> REPLACE
-        ```
-        ```python
-        ##File: /tmp/projects/mathweb/flask/app.py
-        <<<<<<< SEARCH
-            return str(factorial(n))
-        =======
-            return str(math.factorial(n))
-        >>>>>>> REPLACE
-        ```
-        用户需求： Refactor hello() into its own file.
-        回答：To make this change we need to modify `main.py` and make a new file `hello.py`:
-        1. Make a new hello.py file with hello() in it.
-        2. Remove hello() from main.py and replace it with an import.
-        Here are the *SEARCH/REPLACE* blocks:
-        ```python
-        ##File: /tmp/projects/mathweb/hello.py
-        <<<<<<< SEARCH
-        =======
-        def hello():
-            "print a greeting"
-            print("hello")
-        >>>>>>> REPLACE
-        ```
-        ```python
-        ##File: /tmp/projects/mathweb/main.py
-        <<<<<<< SEARCH
-        def hello():
-            "print a greeting"
-            print("hello")
-        =======
-        from hello import hello
-        >>>>>>> REPLACE
-        ```
-        现在让我们开始一个新的任务:
-        {%- if structure %}
-        {{ structure }}
-        {%- endif %}
-        {%- if content %}
-        下面是一些文件路径以及每个文件对应的源码：
-        <files>
-        {{ content }}
-        </files>
-        {%- endif %}
-        {%- if context %}
-        <extra_context>
-        {{ context }}
-        </extra_context>
-        {%- endif %}
-        下面是用户的需求：
-        {{ instruction }}
-        """
-    @prompt()
-    def auto_implement_function(self, instruction: str, content: str) -> str:
-        """
-        下面是一些文件路径以及每个文件对应的源码：
-        {{ content }}
-        请参考上面的内容，重新实现所有文件下方法体标记了如下内容的方法：
-        ```python
-        raise NotImplementedError("This function should be implemented by the model.")
-        ```
-        {{ instruction }}
-        """
-    def single_round_run(self, query: str, source_content: str) -> CodeGenerateResult:
-        init_prompt = ''
-        if self.args.template == "common":
-            init_prompt = self.single_round_instruction.prompt(
-                instruction=query, content=source_content, context=self.args.context
-            )
-        elif self.args.template == "auto_implement":
-            init_prompt = self.auto_implement_function.prompt(
-                instruction=query, content=source_content
-            )
-        with open(self.args.target_file, "w") as file:
-            file.write(init_prompt)
-        conversations = [{"role": "user", "content": init_prompt}]
-        conversations_list = []
-        results = []
-        for llm in self.llms:
-            v = llm.chat_ai(conversations=conversations, model=args.code_model)
-            results.append(v.output)
-        for result in results:
-            conversations_list.append(conversations + [{"role": "assistant", "content": result}])
-        return CodeGenerateResult(contents=results, conversations=conversations_list)
-    @prompt()
-    def multi_round_instruction(self, instruction: str, content: str, context: str = "") -> str:
-        """
-        如果你需要生成代码，对于每个需要更改的文件,你需要按 *SEARCH/REPLACE block* 的格式进行生成。
-        # *SEARCH/REPLACE block* Rules:
-        Every *SEARCH/REPLACE block* must use this format:
-        1. The opening fence and code language, eg: {{ fence_0 }}python
-        2. The file path alone on a line, starting with "##File:" and verbatim. No bold asterisks, no quotes around it,
-        no escaping of characters, etc.
-        3. The start of search block: <<<<<<< SEARCH
-        4. A contiguous chunk of lines to search for in the existing source code
-        5. The dividing line: =======
-        6. The lines to replace into the source code
-        7. The end of the replacement block: >>>>>>> REPLACE
-        8. The closing fence: {{ fence_1 }}
-        Every *SEARCH* section must *EXACTLY MATCH* the existing source code, character for character,
-        including all comments, docstrings, etc.
-        *SEARCH/REPLACE* blocks will replace *all* matching occurrences.
-        Include enough lines to make the SEARCH blocks unique.
-        Include *ALL* the code being searched and replaced!
-        To move code within a file, use 2 *SEARCH/REPLACE* blocks: 1 to delete it from its current location,
-        1 to insert it in the new location.
-        If you want to put code in a new file, use a *SEARCH/REPLACE block* with:
-        - A new file path, including dir name if needed
-        - An empty `SEARCH` section
-        - The new file's contents in the `REPLACE` section
-        ONLY EVER RETURN CODE IN A *SEARCH/REPLACE BLOCK*!
-        下面我们来看一个例子：
-        当前项目目录结构：
-        1. 项目根目录： /tmp/projects/mathweb
-        2. 项目子目录/文件列表(类似tree 命令输出)
-        flask/
-            app.py
-            templates/
-                index.html
-            static/
-                style.css
-        用户需求： Change get_factorial() to use math.factorial
-        回答： To make this change we need to modify `/tmp/projects/mathweb/flask/app.py` to:
-        1. Import the math package.
-        2. Remove the existing factorial() function.
-        3. Update get_factorial() to call math.factorial instead.
-        Here are the *SEARCH/REPLACE* blocks:
-        {{ fence_0 }}python
-        ##File: /tmp/projects/mathweb/flask/app.py
-        <<<<<<< SEARCH
-        from flask import Flask
-        =======
-        import math
-        from flask import Flask
-        >>>>>>> REPLACE
-        {{ fence_1 }}
-        {{ fence_0 }}python
-        ##File: /tmp/projects/mathweb/flask/app.py
-        <<<<<<< SEARCH
-        def factorial(n):
-            "compute factorial"
-            if n == 0:
-                return 1
-            else:
-                return n * factorial(n-1)
-        =======
-        >>>>>>> REPLACE
-        {{ fence_1 }}
-        {{ fence_0 }}python
-        ##File: /tmp/projects/mathweb/flask/app.py
-        <<<<<<< SEARCH
-            return str(factorial(n))
-        =======
-            return str(math.factorial(n))
-        >>>>>>> REPLACE
-        {{ fence_1 }}
-        用户需求： Refactor hello() into its own file.
-        回答：To make this change we need to modify `main.py` and make a new file `hello.py`:
-        1. Make a new hello.py file with hello() in it.
-        2. Remove hello() from main.py and replace it with an import.
-        Here are the *SEARCH/REPLACE* blocks:
-        {{ fence_0 }}python
-        ##File: /tmp/projects/mathweb/hello.py
-        <<<<<<< SEARCH
-        =======
-        def hello():
-            "print a greeting"
-            print("hello")
-        >>>>>>> REPLACE
-        {{ fence_1 }}
-        {{ fence_0 }}python
-        ##File: /tmp/projects/mathweb/main.py
-        <<<<<<< SEARCH
-        def hello():
-            "print a greeting"
-            print("hello")
-        =======
-        from hello import hello
-        >>>>>>> REPLACE
-        {{ fence_1 }}
-        现在让我们开始一个新的任务:
-        {%- if structure %}
-        {{ structure }}
-        {%- endif %}
-        {%- if content %}
-        下面是一些文件路径以及每个文件对应的源码：
-        <files>
-        {{ content }}
-        </files>
-        {%- endif %}
-        {%- if context %}
-        <extra_context>
-        {{ context }}
-        </extra_context>
-        {%- endif %}
-        下面是用户的需求：
-        {{ instruction }}
-        每次生成一个文件的*SEARCH/REPLACE* blocks，然后询问我是否继续，当我回复继续，
-        继续生成下一个文件的*SEARCH/REPLACE* blocks。当没有后续任务时，请回复 "__完成__" 或者 "__EOF__"。
-        """
-    def multi_round_run(self, query: str, source_content: str, max_steps: int = 3) -> CodeGenerateResult:
-        init_prompt = ''
-        if self.args.template == "common":
-            init_prompt = self.multi_round_instruction.prompt(
-                instruction=query, content=source_content, context=self.args.context
-            )
-        elif self.args.template == "auto_implement":
-            init_prompt = self.auto_implement_function.prompt(
-                instruction=query, content=source_content
-            )
-        with open(self.args.target_file, "w") as file:
-            file.write(init_prompt)
-        results = []
-        conversations = [{"role": "user", "content": init_prompt}]
-        code_llm = self.llms[0]
-        v = code_llm.chat_ai(conversations=conversations, model=args.code_model)
-        results.append(v.output)
-        conversations.append({"role": "assistant", "content": v.output})
-        if "__完成__" in v.output or "/done" in v.output or "__EOF__" in v.output:
-            return CodeGenerateResult(contents=["\n\n".join(results)], conversations=[conversations])
-        current_step = 0
-        while current_step < max_steps:
-            conversations.append({"role": "user", "content": "继续"})
-            with open(self.args.target_file, "w") as file:
-                file.write("继续")
-            t = code_llm.chat_ai(conversations=conversations, model=args.code_model)
-            results.append(t.output)
-            conversations.append({"role": "assistant", "content": t.output})
-            current_step += 1
-            if "__完成__" in t.output or "/done" in t.output or "__EOF__" in t.output:
-                return CodeGenerateResult(contents=["\n\n".join(results)], conversations=[conversations])
-        return CodeGenerateResult(contents=["\n\n".join(results)], conversations=[conversations])
-class CodeModificationRanker:
-    def __init__(self, llm: AutoLLM):
-        self.llm = llm
-        self.llm.setup_default_model_name(args.code_model)
-        self.args = args
-        self.llms = [self.llm]
-    @prompt()
-    def _rank_modifications(self, s: CodeGenerateResult) -> str:
-        """
-        对一组代码修改进行质量评估并排序。
-        下面是修改需求：
-        <edit_requirement>
-        {{ s.conversations[0][-2]["content"] }}
-        </edit_requirement>
-        下面是相应的代码修改：
-        {% for content in s.contents %}
-        <edit_block id="{{ loop.index0 }}">
-        {{content}}
-        </edit_block>
-        {% endfor %}
-        请输出如下格式的评估结果,只包含 JSON 数据:
-        ```json
-        {
-            "rank_result": [id1, id2, id3]  // id 为 edit_block 的 id,按质量从高到低排序
-        }
-        ```
-        注意：
-        1. 只输出前面要求的 Json 格式就好，不要输出其他内容，Json 需要使用 ```json ```包裹
-        """
-    def rank_modifications(self, generate_result: CodeGenerateResult) -> CodeGenerateResult:
-        import time
-        from collections import defaultdict
-        start_time = time.time()
-        logger.info(f"开始对 {len(generate_result.contents)} 个候选结果进行排序")
-        try:
-            results = []
-            for llm in self.llms:
-                v = self._rank_modifications.with_llm(llm).with_return_type(RankResult).run(generate_result)
-                results.append(v.rank_result)
-            if not results:
-                raise Exception("All ranking requests failed")
-            # 计算每个候选人的分数
-            candidate_scores = defaultdict(float)
-            for rank_result in results:
-                for idx, candidate_id in enumerate(rank_result):
-                    # Score is 1/(position + 1) since position starts from 0
-                    candidate_scores[candidate_id] += 1.0 / (idx + 1)
-            # 按分数降序对候选人进行排序
-            sorted_candidates = sorted(candidate_scores.keys(),
-                                       key=lambda x: candidate_scores[x],
-                                       reverse=True)
-            elapsed = time.time() - start_time
-            score_details = ", ".join([f"candidate {i}: {candidate_scores[i]:.2f}" for i in sorted_candidates])
-            logger.info(
-                f"排序完成，耗时 {elapsed:.2f} 秒，最佳候选索引: {sorted_candidates[0]}，评分详情: {score_details}"
-            )
-            rerank_contents = [generate_result.contents[i] for i in sorted_candidates]
-            rerank_conversations = [generate_result.conversations[i] for i in sorted_candidates]
-            return CodeGenerateResult(contents=rerank_contents, conversations=rerank_conversations)
-        except Exception as e:
-            logger.error(f"排序过程失败: {str(e)}")
-            logger.debug(traceback.format_exc())
-            elapsed = time.time() - start_time
-            logger.warning(f"排序失败，耗时 {elapsed:.2f} 秒，将使用原始顺序")
-            return generate_result
-class TextSimilarity:
-    """
-    找到 text_b 中与 text_a 最相似的部分(滑动窗口)
-    返回相似度分数和最相似的文本片段
-    """
-    def __init__(self, text_a, text_b):
-        self.text_a = text_a
-        self.text_b = text_b
-        self.lines_a = self._split_into_lines(text_a)
-        self.lines_b = self._split_into_lines(text_b)
-        self.m = len(self.lines_a)
-        self.n = len(self.lines_b)
-    @staticmethod
-    def _split_into_lines(text):
-        return text.splitlines()
-    @staticmethod
-    def _levenshtein_ratio(s1, s2):
-        return SequenceMatcher(None, s1, s2).ratio()
-    def get_best_matching_window(self):
-        best_similarity = 0
-        best_window = []
-        for i in range(self.n - self.m + 1):  # 滑动窗口
-            window_b = self.lines_b[i:i + self.m]
-            similarity = self._levenshtein_ratio("\n".join(self.lines_a), "\n".join(window_b))
-            if similarity > best_similarity:
-                best_similarity = similarity
-                best_window = window_b
-        return best_similarity, "\n".join(best_window)
-class CodeAutoMergeEditBlock:
-    def __init__(self, llm: AutoLLM, fence_0: str = "```", fence_1: str = "```"):
-        self.llm = llm
-        self.llm.setup_default_model_name(args.code_model)
-        self.args = args
-        self.fence_0 = fence_0
-        self.fence_1 = fence_1
-    @staticmethod
-    def run_pylint(code: str) -> tuple[bool, str]:
-        """
-        --disable=all 禁用所有 Pylint 的检查规则
-        --enable=E0001,W0311,W0312 启用指定的 Pylint 检查规则,
-        E0001：语法错误(Syntax Error),
-        W0311：代码缩进使用了 Tab 而不是空格(Bad indentation)
-        W0312：代码缩进不一致(Mixed indentation)
-        :param code:
-        :return:
-        """
-        with tempfile.NamedTemporaryFile(mode="w", suffix=".py", delete=False) as temp_file:
-            temp_file.write(code)
-            temp_file_path = temp_file.name
-        try:
-            result = subprocess.run(
-                ["pylint", "--disable=all", "--enable=E0001,W0311,W0312", temp_file_path,],
-                capture_output=True,
-                text=True,
-                check=False,
-            )
-            os.unlink(temp_file_path)
-            if result.returncode != 0:
-                error_message = result.stdout.strip() or result.stderr.strip()
-                logger.warning(f"Pylint 检查代码失败: {error_message}")
-                return False, error_message
-            return True, ""
-        except subprocess.CalledProcessError as e:
-            error_message = f"运行 Pylint 时发生错误: {str(e)}"
-            logger.error(error_message)
-            os.unlink(temp_file_path)
-            return False, error_message
-    def parse_whole_text(self, text: str) -> List[PathAndCode]:
-        """
-        从文本中抽取如下格式代码(two_line_mode)：
-        ```python
-        ##File: /project/path/src/autocoder/index/index.py
-        <<<<<<< SEARCH
-        =======
-        >>>>>>> REPLACE
-        ```
-        或者 (one_line_mode)
-        ```python:/project/path/src/autocoder/index/index.py
-        <<<<<<< SEARCH
-        =======
-        >>>>>>> REPLACE
-        ```
-        """
-        HEAD = "<<<<<<< SEARCH"
-        DIVIDER = "======="
-        UPDATED = ">>>>>>> REPLACE"
-        lines = text.split("\n")
-        lines_len = len(lines)
-        start_marker_count = 0
-        block = []
-        path_and_code_list = []
-        # two_line_mode or one_line_mode
-        current_editblock_mode = "two_line_mode"
-        current_editblock_path = None
-        def guard(_index):
-            return _index + 1 < lines_len
-        def start_marker(_line, _index):
-            nonlocal current_editblock_mode
-            nonlocal current_editblock_path
-            if _line.startswith(self.fence_0) and guard(_index) and ":" in _line and lines[_index + 1].startswith(HEAD):
-                current_editblock_mode = "one_line_mode"
-                current_editblock_path = _line.split(":", 1)[1].strip()
-                return True
-            if _line.startswith(self.fence_0) and guard(_index) and lines[_index + 1].startswith("##File:"):
-                current_editblock_mode = "two_line_mode"
-                current_editblock_path = None
-                return True
-            return False
-        def end_marker(_line, _index):
-            return _line.startswith(self.fence_1) and UPDATED in lines[_index - 1]
-        for index, line in enumerate(lines):
-            if start_marker(line, index) and start_marker_count == 0:
-                start_marker_count += 1
-            elif end_marker(line, index) and start_marker_count == 1:
-                start_marker_count -= 1
-                if block:
-                    if current_editblock_mode == "two_line_mode":
-                        path = block[0].split(":", 1)[1].strip()
-                        content = "\n".join(block[1:])
-                    else:
-                        path = current_editblock_path
-                        content = "\n".join(block)
-                    block = []
-                    path_and_code_list.append(PathAndCode(path=path, content=content))
-            elif start_marker_count > 0:
-                block.append(line)
-        return path_and_code_list
-    def get_edits(self, content: str):
-        edits = self.parse_whole_text(content)
-        HEAD = "<<<<<<< SEARCH"
-        DIVIDER = "======="
-        UPDATED = ">>>>>>> REPLACE"
-        result = []
-        for edit in edits:
-            heads = []
-            updates = []
-            c = edit.content
-            in_head = False
-            in_updated = False
-            for line in c.splitlines():
-                if line.strip() == HEAD:
-                    in_head = True
-                    continue
-                if line.strip() == DIVIDER:
-                    in_head = False
-                    in_updated = True
-                    continue
-                if line.strip() == UPDATED:
-                    in_head = False
-                    in_updated = False
-                    continue
-                if in_head:
-                    heads.append(line)
-                if in_updated:
-                    updates.append(line)
-            result.append((edit.path, "\n".join(heads), "\n".join(updates)))
-        return result
-    @prompt()
-    def git_require_msg(self, source_dir: str, error: str) -> str:
-        """
-        auto_merge only works for git repositories.
-        Try to use git init in the source directory.
-        ```shell
-        cd {{ source_dir }}
-        git init .
-        ```
-        Then try to run auto-coder again.
-        Error: {{ error }}
-        """
-    def _merge_code_without_effect(self, content: str) -> MergeCodeWithoutEffect:
-        """
-        合并代码时不会产生任何副作用，例如 Git 操作、代码检查或文件写入。
-        返回一个元组，包含：
-        - 成功合并的代码块的列表，每个元素是一个 (file_path, new_content) 元组，
-          其中 file_path 是文件路径，new_content 是合并后的新内容。
-        - 合并失败的代码块的列表，每个元素是一个 (file_path, head, update) 元组，
-          其中：file_path 是文件路径，head 是原始内容，update 是尝试合并的内容。
-        """
-        codes = self.get_edits(content)
-        file_content_mapping = {}
-        failed_blocks = []
-        for block in codes:
-            file_path, head, update = block
-            if not os.path.exists(file_path):
-                file_content_mapping[file_path] = update
-            else:
-                if file_path not in file_content_mapping:
-                    with open(file_path, "r") as f:
-                        temp = f.read()
-                        file_content_mapping[file_path] = temp
-                existing_content = file_content_mapping[file_path]
-                # First try exact match
-                new_content = (
-                    existing_content.replace(head, update, 1)
-                    if head
-                    else existing_content + "\n" + update
-                )
-                # If exact match fails, try similarity match
-                if new_content == existing_content and head:
-                    similarity, best_window = TextSimilarity(
-                        head, existing_content
-                    ).get_best_matching_window()
-                    if similarity > self.args.editblock_similarity:
-                        new_content = existing_content.replace(
-                            best_window, update, 1
-                        )
-                if new_content != existing_content:
-                    file_content_mapping[file_path] = new_content
-                else:
-                    failed_blocks.append((file_path, head, update))
-        return MergeCodeWithoutEffect(
-            success_blocks=[(path, content) for path, content in file_content_mapping.items()],
-            failed_blocks=failed_blocks
-        )
-    def choose_best_choice(self, generate_result: CodeGenerateResult) -> CodeGenerateResult:
-        """ 选择最佳代码 """
-        if len(generate_result.contents) == 1:  # 仅一份代码立即返回
-            logger.info("仅有一个候选结果，跳过排序")
-            return generate_result
-        ranker = CodeModificationRanker(self.llm)
-        ranked_result = ranker.rank_modifications(generate_result)
-        # 过滤掉包含失败块的内容
-        for content, conversations in zip(ranked_result.contents, ranked_result.conversations):
-            merge_result = self._merge_code_without_effect(content)
-            if not merge_result.failed_blocks:
-                return CodeGenerateResult(contents=[content], conversations=[conversations])
-        # 如果所有内容都包含失败块，则返回第一个
-        return CodeGenerateResult(contents=[ranked_result.contents[0]], conversations=[ranked_result.conversations[0]])
-    def _merge_code(self, content: str, force_skip_git: bool = False):
-        file_content = open(self.args.file).read()
-        md5 = hashlib.md5(file_content.encode("utf-8")).hexdigest()
-        file_name = os.path.basename(self.args.file)
-        codes = self.get_edits(content)
-        changes_to_make = []
-        changes_made = False
-        unmerged_blocks = []
-        merged_blocks = []
-        # First, check if there are any changes to be made
-        file_content_mapping = {}
-        for block in codes:
-            file_path, head, update = block
-            if not os.path.exists(file_path):
-                changes_to_make.append((file_path, None, update))
-                file_content_mapping[file_path] = update
-                merged_blocks.append((file_path, "", update, 1))
-                changes_made = True
-            else:
-                if file_path not in file_content_mapping:
-                    with open(file_path, "r") as f:
-                        temp = f.read()
-                        file_content_mapping[file_path] = temp
-                existing_content = file_content_mapping[file_path]
-                new_content = (
-                    existing_content.replace(head, update, 1)
-                    if head
-                    else existing_content + "\n" + update
-                )
-                if new_content != existing_content:
-                    changes_to_make.append(
-                        (file_path, existing_content, new_content))
-                    file_content_mapping[file_path] = new_content
-                    merged_blocks.append((file_path, head, update, 1))
-                    changes_made = True
-                else:
-                    # If the SEARCH BLOCK is not found exactly, then try to use
-                    # the similarity ratio to find the best matching block
-                    similarity, best_window = TextSimilarity(head, existing_content).get_best_matching_window()
-                    if similarity > self.args.editblock_similarity:  # 相似性比较
-                        new_content = existing_content.replace(
-                            best_window, update, 1)
-                        if new_content != existing_content:
-                            changes_to_make.append(
-                                (file_path, existing_content, new_content)
-                            )
-                            file_content_mapping[file_path] = new_content
-                            merged_blocks.append(
-                                (file_path, head, update, similarity))
-                            changes_made = True
-                    else:
-                        unmerged_blocks.append((file_path, head, update, similarity))
-        if unmerged_blocks:
-            if self.args.request_id and not self.args.skip_events:
-                # collect unmerged blocks
-                event_data = []
-                for file_path, head, update, similarity in unmerged_blocks:
-                    event_data.append(
-                        {
-                            "file_path": file_path,
-                            "head": head,
-                            "update": update,
-                            "similarity": similarity,
-                        }
-                    )
-                return
-            logger.warning(f"发现 {len(unmerged_blocks)} 个未合并的代码块，更改将不会应用，请手动检查这些代码块后重试。")
-            self._print_unmerged_blocks(unmerged_blocks)
-            return
-        # lint check
-        for file_path, new_content in file_content_mapping.items():
-            if file_path.endswith(".py"):
-                pylint_passed, error_message = self.run_pylint(new_content)
-                if not pylint_passed:
-                    logger.warning(f"代码文件 {file_path} 的 Pylint 检查未通过，本次更改未应用。错误信息: {error_message}")
-        if changes_made and not force_skip_git and not self.args.skip_commit:
-            try:
-                commit_changes(self.args.source_dir, f"auto_coder_pre_{file_name}_{md5}")
-            except Exception as e:
-                logger.error(
-                    self.git_require_msg(
-                        source_dir=self.args.source_dir, error=str(e))
-                )
-                return
-        # Now, apply the changes
-        for file_path, new_content in file_content_mapping.items():
-            os.makedirs(os.path.dirname(file_path), exist_ok=True)
-            with open(file_path, "w") as f:
-                f.write(new_content)
-        if self.args.request_id and not self.args.skip_events:
-            # collect modified files
-            event_data = []
-            for code in merged_blocks:
-                file_path, head, update, similarity = code
-                event_data.append(
-                    {
-                        "file_path": file_path,
-                        "head": head,
-                        "update": update,
-                        "similarity": similarity,
-                    }
-                )
-        if changes_made:
-            if not force_skip_git and not self.args.skip_commit:
-                try:
-                    commit_result = commit_changes(self.args.source_dir, f"auto_coder_{file_name}_{md5}")
-                    git_print_commit_info(commit_result=commit_result)
-                except Exception as e:
-                    logger.error(
-                        self.git_require_msg(
-                            source_dir=self.args.source_dir, error=str(e)
-                        )
-                    )
-            logger.info(
-                f"已在 {len(file_content_mapping.keys())} 个文件中合并更改，"
-                f"完成 {len(changes_to_make)}/{len(codes)} 个代码块。"
-            )
-        else:
-            logger.warning("未对任何文件进行更改。")
-    def merge_code(self, generate_result: CodeGenerateResult, force_skip_git: bool = False):
-        result = self.choose_best_choice(generate_result)
-        self._merge_code(result.contents[0], force_skip_git)
-        return result
-    @staticmethod
-    def _print_unmerged_blocks(unmerged_blocks: List[tuple]):
-        console.print(f"\n[bold red]未合并的代码块:[/bold red]")
-        for file_path, head, update, similarity in unmerged_blocks:
-            console.print(f"\n[bold blue]文件:[/bold blue] {file_path}")
-            console.print(
-                f"\n[bold green]搜索代码块（相似度：{similarity}）:[/bold green]")
-            syntax = Syntax(head, "python", theme="monokai", line_numbers=True)
-            console.print(Panel(syntax, expand=False))
-            console.print("\n[bold yellow]替换代码块:[/bold yellow]")
-            syntax = Syntax(update, "python", theme="monokai",
-                            line_numbers=True)
-            console.print(Panel(syntax, expand=False))
-        console.print(f"\n[bold red]未合并的代码块总数: {len(unmerged_blocks)}[/bold red]")
-class BaseAction:
-    @staticmethod
-    def _get_content_length(content: str) -> int:
-        return len(content)
-class ActionPyProject(BaseAction):
-    def __init__(self, llm: Optional[AutoLLM] = None) -> None:
-        self.args = args
-        self.llm = llm
-        self.pp = None
-    def run(self):
-        if self.args.project_type != "py":
-            return False
-        pp = PyProject(llm=self.llm, args=args)
-        self.pp = pp
-        pp.run()
-        source_code = pp.output()
-        if self.llm:
-            source_code = build_index_and_filter_files(args=args, llm=self.llm, sources=pp.sources)
-        self.process_content(source_code)
-        return True
-    def process_content(self, content: str):
-        # args = self.args
-        if self.args.execute and self.llm:
-            content_length = self._get_content_length(content)
-            if content_length > self.args.model_max_input_length:
-                logger.warning(
-                    f"发送给模型的内容长度为 {content_length} 个 token（可能收集了过多文件），"
-                    f"已超过最大输入长度限制 {self.args.model_max_input_length}。"
-                )
-        if args.execute:
-            logger.info("正在自动生成代码...")
-            start_time = time.time()
-            # diff, strict_diff, editblock 是代码自动生成或合并的不同策略, 通常用于处理代码的变更或生成
-            # diff 模式,基于差异生成代码,生成最小的变更集,适用于局部优化,代码重构
-            # strict_diff 模式,严格验证差异,确保生成的代码符合规则,适用于代码审查,自动化测试
-            # editblock 模式,基于编辑块生成代码，支持较大范围的修改,适用于代码重构,功能扩展
-            if args.auto_merge == "editblock":
-                generate = CodeAutoGenerateEditBlock(llm=self.llm, action=self)
-            else:
-                generate = None
-            if self.args.enable_multi_round_generate:
-                generate_result = generate.multi_round_run(query=args.query, source_content=content)
-            else:
-                generate_result = generate.single_round_run(query=args.query, source_content=content)
-            logger.info(f"代码生成完成，耗时 {time.time() - start_time:.2f} 秒")
-            if args.auto_merge:
-                logger.info("正在自动合并代码...")
-                if args.auto_merge == "editblock":
-                    code_merge = CodeAutoMergeEditBlock(llm=self.llm)
-                    merge_result = code_merge.merge_code(generate_result=generate_result)
-                else:
-                    merge_result = None
-                content = merge_result.contents[0]
-            else:
-                content = generate_result.contents[0]
-            with open(args.target_file, "w") as file:
-                file.write(content)
-class ActionSuffixProject(BaseAction):
-    def __init__(self, llm: Optional[AutoLLM] = None) -> None:
-        self.args = args
-        self.llm = llm
-        self.pp = None
-    def run(self):
-        pp = SuffixProject(llm=self.llm, args=args)
-        self.pp = pp
-        pp.run()
-        source_code = pp.output()
-        if self.llm:
-            source_code = build_index_and_filter_files(args=args, llm=self.llm, sources=pp.sources)
-        self.process_content(source_code)
-    def process_content(self, content: str):
-        if self.args.execute and self.llm:
-            content_length = self._get_content_length(content)
-            if content_length > self.args.model_max_input_length:
-                logger.warning(
-                    f"发送给模型的内容长度为 {content_length} 个 token（可能收集了过多文件），"
-                    f"已超过最大输入长度限制 {self.args.model_max_input_length}。"
-                )
-        if args.execute:
-            logger.info("正在自动生成代码...")
-            start_time = time.time()
-            # diff, strict_diff, editblock 是代码自动生成或合并的不同策略, 通常用于处理代码的变更或生成
-            # diff 模式,基于差异生成代码,生成最小的变更集,适用于局部优化,代码重构
-            # strict_diff 模式,严格验证差异,确保生成的代码符合规则,适用于代码审查,自动化测试
-            # editblock 模式,基于编辑块生成代码，支持较大范围的修改,适用于代码重构,功能扩展
-            if args.auto_merge == "editblock":
-                generate = CodeAutoGenerateEditBlock(llm=self.llm, action=self)
-            else:
-                generate = None
-            if self.args.enable_multi_round_generate:
-                generate_result = generate.multi_round_run(query=args.query, source_content=content)
-            else:
-                generate_result = generate.single_round_run(query=args.query, source_content=content)
-            logger.info(f"代码生成完成，耗时 {time.time() - start_time:.2f} 秒")
-            if args.auto_merge:
-                logger.info("正在自动合并代码...")
-                if args.auto_merge == "editblock":
-                    code_merge = CodeAutoMergeEditBlock(llm=self.llm)
-                    merge_result = code_merge.merge_code(generate_result=generate_result)
-                else:
-                    merge_result = None
-                content = merge_result.contents[0]
-            else:
-                content = generate_result.contents[0]
-            with open(args.target_file, "w") as file:
-                file.write(content)
-class Dispacher:
-    def __init__(self, llm: Optional[AutoLLM] = None):
-        self.args = args
-        self.llm = llm
-    def dispach(self):
-        actions = [
-            ActionPyProject(llm=self.llm),
-            ActionSuffixProject(llm=self.llm)
-        ]
-        for action in actions:
-            if action.run():
-                return
 def prepare_chat_yaml():
     # auto_coder_main(["next", "chat_action"]) 准备聊天 yaml 文件
     actions_dir = os.path.join(args.source_dir, "actions")
@@ -2476,7 +1453,7 @@ def coding(query: str, llm: AutoLLM):
             f.write(yaml_content)
         convert_yaml_to_config(execute_file)
-        dispacher = Dispacher(llm)
+        dispacher = Dispacher(args=args, llm=llm)
         dispacher.dispach()
     else:
         logger.warning("创建新的 YAML 文件失败。")
@@ -3609,6 +2586,12 @@ def main():
                     print(f"{memory['mode']} [{MODES[memory['mode']]}]")
                 else:
                     memory["mode"] = conf
+            elif user_input.startswith("/exclude_dirs"):
+                dir_names = user_input[len("/exclude_dirs"):].strip().split(",")
+                exclude_dirs(dir_names)
+            elif user_input.startswith("/exclude_files"):
+                query = user_input[len("/exclude_files"):].strip()
+                exclude_files(query)
             else:
                 command = user_input
                 if user_input.startswith("/shell"):
@@ -3628,9 +2611,9 @@ def main():
             break
         except Exception as e:
             print(f"\033[91m发生异常:\033[0m \033[93m{type(e).__name__}\033[0m - {str(e)}")
-            # if runing_args and runing_args.debug:
-            import traceback
-            traceback.print_exc()
+            if runing_args and runing_args.debug:
+                import traceback
+                traceback.print_exc()
 if __name__ == '__main__':

autocoder-nano 0.1.26__py3-none-any.whl → 0.1.28__py3-none-any.whl

autocoder-nano 0.1.26py3-none-any.whl → 0.1.28py3-none-any.whl