auto-coder 0.1.268__py3-none-any.whl → 0.1.269__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of auto-coder might be problematic. Click here for more details.

autocoder/index/entry.py CHANGED
@@ -58,8 +58,12 @@ def build_index_and_filter_files(
58
58
  return file_path.strip()[2:]
59
59
  return file_path
60
60
 
61
+ # 文件路径 -> TargetFile
61
62
  final_files: Dict[str, TargetFile] = {}
62
63
 
64
+ # 文件路径 -> 文件在文件列表中的位置(越前面表示越相关)
65
+ file_positions:Dict[str,int] = {}
66
+
63
67
  # Phase 1: Process REST/RAG/Search sources
64
68
  printer = Printer()
65
69
  printer.print_in_terminal("phase1_processing_sources")
@@ -102,25 +106,20 @@ def build_index_and_filter_files(
102
106
  })
103
107
  )
104
108
  )
105
-
109
+
110
+
106
111
  if not args.skip_filter_index and args.index_filter_model:
107
112
  model_name = getattr(index_manager.index_filter_llm, 'default_model_name', None)
108
113
  if not model_name:
109
114
  model_name = "unknown(without default model name)"
110
115
  printer.print_in_terminal("quick_filter_start", style="blue", model_name=model_name)
111
116
  quick_filter = QuickFilter(index_manager,stats,sources)
112
- quick_filter_result = quick_filter.filter(index_manager.read_index(),args.query)
113
- # if quick_filter_result.has_error:
114
- # raise KeyboardInterrupt(printer.get_message_from_key_with_format("quick_filter_failed",error=quick_filter_result.error_message))
115
-
116
- # Merge quick filter results into final_files
117
- if args.context_prune:
118
- context_pruner = PruneContext(max_tokens=args.conversation_prune_safe_zone_tokens, args=args, llm=llm)
119
- pruned_files = context_pruner.handle_overflow(quick_filter_result.files, [{"role":"user","content":args.query}], args.context_prune_strategy)
120
- for source_file in pruned_files:
121
- final_files[source_file.module_name] = quick_filter_result.files[source_file.module_name]
122
- else:
123
- final_files.update(quick_filter_result.files)
117
+ quick_filter_result = quick_filter.filter(index_manager.read_index(),args.query)
118
+
119
+ final_files.update(quick_filter_result.files)
120
+
121
+ if quick_filter_result.file_positions:
122
+ file_positions.update(quick_filter_result.file_positions)
124
123
 
125
124
  if not args.skip_filter_index and not args.index_filter_model:
126
125
  model_name = getattr(index_manager.llm, 'default_model_name', None)
@@ -261,32 +260,53 @@ def build_index_and_filter_files(
261
260
  for file in final_filenames:
262
261
  print(f"{file} - {final_files[file].reason}")
263
262
 
264
- source_code = ""
263
+ # source_code = ""
265
264
  source_code_list = SourceCodeList(sources=[])
266
265
  depulicated_sources = set()
267
-
266
+
267
+ ## 先去重
268
+ temp_sources = []
268
269
  for file in sources:
269
270
  if file.module_name in final_filenames:
270
271
  if file.module_name in depulicated_sources:
271
272
  continue
272
273
  depulicated_sources.add(file.module_name)
273
- source_code += f"##File: {file.module_name}\n"
274
- source_code += f"{file.source_code}\n\n"
275
- source_code_list.sources.append(file)
274
+ # source_code += f"##File: {file.module_name}\n"
275
+ # source_code += f"{file.source_code}\n\n"
276
+ temp_sources.append(file)
277
+
278
+ ## 开启了裁剪,则需要做裁剪,不过目前只针对 quick filter 生效
279
+ if args.context_prune:
280
+ context_pruner = PruneContext(max_tokens=args.conversation_prune_safe_zone_tokens, args=args, llm=llm)
281
+ # 如果 file_positions 不为空,则通过 file_positions 来获取文件
282
+ if file_positions:
283
+ ## 拿到位置列表,然后根据位置排序 得到 [(pos,file_path)]
284
+ ## 将 [(pos,file_path)] 转换为 [file_path]
285
+ ## 通过 [file_path] 顺序调整 temp_sources 的顺序
286
+ ## MARK
287
+ # 将 file_positions 转换为 [(pos, file_path)] 的列表
288
+ position_file_pairs = [(pos, file_path) for file_path, pos in file_positions.items()]
289
+ # 按位置排序
290
+ position_file_pairs.sort(key=lambda x: x[0])
291
+ # 提取排序后的文件路径列表
292
+ sorted_file_paths = [file_path for _, file_path in position_file_pairs]
293
+ # 根据 sorted_file_paths 重新排序 temp_sources
294
+ temp_sources.sort(key=lambda x: sorted_file_paths.index(x.module_name) if x.module_name in sorted_file_paths else len(sorted_file_paths))
295
+ pruned_files = context_pruner.handle_overflow([source.module_name for source in temp_sources], [{"role":"user","content":args.query}], args.context_prune_strategy)
296
+ source_code_list.sources = pruned_files
297
+
276
298
  if args.request_id and not args.skip_events:
277
299
  queue_communicate.send_event(
278
300
  request_id=args.request_id,
279
301
  event=CommunicateEvent(
280
302
  event_type=CommunicateEventType.CODE_INDEX_FILTER_FILE_SELECTED.value,
281
303
  data=json.dumps([
282
- (file["file_path"], file.reason)
283
- for file in final_files.values()
284
- if file.file_path in depulicated_sources
304
+ (file.module_name, "") for file in source_code_list.sources
285
305
  ])
286
306
  )
287
307
  )
288
308
 
289
- stats["final_files"] = len(depulicated_sources)
309
+ stats["final_files"] = len(source_code_list.sources)
290
310
  phase_end = time.monotonic()
291
311
  stats["timings"]["prepare_output"] = phase_end - phase_start
292
312
 
@@ -0,0 +1,120 @@
1
import json
import os
from collections import defaultdict
from pathlib import Path
from typing import Any, Dict, List, Set, Tuple, Union

import byzerllm
import pydantic
from loguru import logger

from autocoder.common import AutoCoderArgs
from autocoder.common.printer import Printer
from autocoder.common.result_manager import ResultManager
13
+
14
class ExtensionClassifyResult(pydantic.BaseModel):
    """Classification of file extensions into broad project-role categories.

    Each field holds the list of extension strings (e.g. ``".py"``) that the
    LLM-based classifier assigned to that category.
    """

    code: List[str] = pydantic.Field(default_factory=list)
    config: List[str] = pydantic.Field(default_factory=list)
    data: List[str] = pydantic.Field(default_factory=list)
    document: List[str] = pydantic.Field(default_factory=list)
    other: List[str] = pydantic.Field(default_factory=list)
    framework: List[str] = pydantic.Field(default_factory=list)
21
+
22
class ProjectTypeAnalyzer:
    """Infer a project's type from file-extension statistics.

    Walks ``args.source_dir`` counting file extensions (skipping common
    VCS / build / dependency directories), asks the LLM to classify the
    extensions, and reports the "code" extensions as the project type.
    """

    def __init__(self, args: AutoCoderArgs, llm: Union[byzerllm.ByzerLLM, byzerllm.SimpleByzerLLM]):
        self.args = args
        self.llm = llm
        self.printer = Printer()
        # Directories that are never part of the project's own sources.
        self.default_exclude_dirs = [
            ".git", ".svn", ".hg", "build", "dist", "__pycache__",
            "node_modules", ".auto-coder", ".vscode", ".idea", "venv",
            ".next", ".nuxt", ".svelte-kit", "out", "cache", "logs",
            "temp", "tmp", "coverage", ".DS_Store", "public", "static"
        ]
        # Lower-cased extension (with leading dot) -> occurrence count.
        self.extension_counts: Dict[str, int] = defaultdict(int)
        self.stats_file = Path(args.source_dir) / ".auto-coder" / "project_type_stats.json"
        self.result_manager = ResultManager()

    def traverse_project(self) -> None:
        """Walk the project directory tree and tally file extensions."""
        for root, dirs, files in os.walk(self.args.source_dir):
            # Prune excluded directories in place so os.walk skips them.
            dirs[:] = [d for d in dirs if d not in self.default_exclude_dirs]

            for file in files:
                _, ext = os.path.splitext(file)
                if ext:  # only count files that actually have an extension
                    self.extension_counts[ext.lower()] += 1

    def count_extensions(self) -> Dict[str, int]:
        """Return extension counts sorted by frequency, most common first."""
        return dict(sorted(self.extension_counts.items(), key=lambda x: x[1], reverse=True))

    @byzerllm.prompt()
    def classify_extensions(self, extensions: str) -> str:
        """
        根据文件后缀列表,将后缀分类为代码、配置、数据、文档等类型。

        文件后缀列表:
        {{ extensions }}

        请返回如下JSON格式:
        {
            "code": ["后缀1", "后缀2"],
            "config": ["后缀3", "后缀4"],
            "data": ["后缀5", "后缀6"],
            "document": ["后缀7", "后缀8"],
            "other": ["后缀9", "后缀10"],
            "framework": ["后缀11", "后缀12"]
        }
        """
        # NOTE: the docstring above is the runtime LLM prompt template;
        # this dict supplies its template variables.
        return {
            "extensions": extensions
        }

    def save_stats(self) -> None:
        """Persist the extension counts and detected project type to disk."""
        stats = {
            "extension_counts": self.extension_counts,
            "project_type": self.detect_project_type()
        }

        # Make sure the .auto-coder directory exists before writing.
        self.stats_file.parent.mkdir(parents=True, exist_ok=True)

        # ensure_ascii=False keeps any non-ASCII data readable on disk,
        # matching the serialization used in detect_project_type().
        with open(self.stats_file, "w", encoding="utf-8") as f:
            json.dump(stats, f, indent=2, ensure_ascii=False)

        self.printer.print_in_terminal("stats_saved", path=str(self.stats_file))

    def load_stats(self) -> Dict[str, Any]:
        """Load previously saved stats; return an empty dict when none exist."""
        if not self.stats_file.exists():
            self.printer.print_in_terminal("stats_not_found", path=str(self.stats_file))
            return {}

        with open(self.stats_file, "r", encoding="utf-8") as f:
            return json.load(f)

    def detect_project_type(self) -> str:
        """Classify the counted extensions via the LLM.

        Returns a comma-separated string of code-file extensions
        (e.g. ``".py,.ts"``).
        """
        ext_counts = self.count_extensions()
        classification = self.classify_extensions.with_llm(self.llm).with_return_type(
            ExtensionClassifyResult).run(json.dumps(ext_counts, ensure_ascii=False))
        return ",".join(classification.code)

    def analyze(self) -> str:
        """Run the full analysis: traverse, detect, record, and return the type.

        Returns the comma-separated project-type string produced by
        detect_project_type(); the original ``Dict[str, any]`` annotation
        was wrong (lowercase ``any`` is the builtin function, and the value
        returned is a str).
        """
        self.traverse_project()

        project_type = self.detect_project_type()

        # Record the outcome so other components can retrieve it later.
        self.result_manager.add_result(content=project_type, meta={
            "action": "get_project_type",
            "input": {}
        })
        return project_type
@@ -25,8 +25,8 @@ PROVIDER_INFO_LIST = [
25
25
  ProviderInfo(
26
26
  name="volcano",
27
27
  endpoint="https://ark.cn-beijing.volces.com/api/v3",
28
- r1_model="",
29
- v3_model="",
28
+ r1_model="deepseek-r1-250120",
29
+ v3_model="deepseek-v3-241226",
30
30
  api_key="",
31
31
  r1_input_price=2.0,
32
32
  r1_output_price=8.0,
@@ -162,32 +162,32 @@ class ModelProviderSelector:
162
162
  provider_info = provider
163
163
  break
164
164
 
165
- if result == "volcano":
166
- # Get R1 endpoint
167
- r1_endpoint = input_dialog(
168
- title=self.printer.get_message_from_key("model_provider_api_key_title"),
169
- text=self.printer.get_message_from_key("model_provider_volcano_r1_text"),
170
- validator=VolcanoEndpointValidator(),
171
- style=dialog_style
172
- ).run()
165
+ # if result == "volcano":
166
+ # # Get R1 endpoint
167
+ # r1_endpoint = input_dialog(
168
+ # title=self.printer.get_message_from_key("model_provider_api_key_title"),
169
+ # text=self.printer.get_message_from_key("model_provider_volcano_r1_text"),
170
+ # validator=VolcanoEndpointValidator(),
171
+ # style=dialog_style
172
+ # ).run()
173
173
 
174
- if r1_endpoint is None:
175
- return None
174
+ # if r1_endpoint is None:
175
+ # return None
176
176
 
177
- provider_info.r1_model = r1_endpoint
177
+ # provider_info.r1_model = r1_endpoint
178
178
 
179
- # Get V3 endpoint
180
- v3_endpoint = input_dialog(
181
- title=self.printer.get_message_from_key("model_provider_api_key_title"),
182
- text=self.printer.get_message_from_key("model_provider_volcano_v3_text"),
183
- validator=VolcanoEndpointValidator(),
184
- style=dialog_style
185
- ).run()
179
+ # # Get V3 endpoint
180
+ # v3_endpoint = input_dialog(
181
+ # title=self.printer.get_message_from_key("model_provider_api_key_title"),
182
+ # text=self.printer.get_message_from_key("model_provider_volcano_v3_text"),
183
+ # validator=VolcanoEndpointValidator(),
184
+ # style=dialog_style
185
+ # ).run()
186
186
 
187
- if v3_endpoint is None:
188
- return None
187
+ # if v3_endpoint is None:
188
+ # return None
189
189
 
190
- provider_info.v3_model = v3_endpoint
190
+ # provider_info.v3_model = v3_endpoint
191
191
 
192
192
  # Get API key for all providers
193
193
  api_key = input_dialog(
autocoder/version.py CHANGED
@@ -1 +1 @@
1
- __version__ = "0.1.268"
1
+ __version__ = "0.1.269"