auto-coder 0.1.400__py3-none-any.whl → 2.0.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of auto-coder might be problematic. Click here for more details.

Files changed (579)
  1. auto_coder-2.0.0.dist-info/LICENSE +158 -0
  2. auto_coder-2.0.0.dist-info/METADATA +558 -0
  3. auto_coder-2.0.0.dist-info/RECORD +795 -0
  4. {auto_coder-0.1.400.dist-info → auto_coder-2.0.0.dist-info}/WHEEL +1 -1
  5. {auto_coder-0.1.400.dist-info → auto_coder-2.0.0.dist-info}/entry_points.txt +3 -3
  6. autocoder/__init__.py +31 -0
  7. autocoder/agent/auto_filegroup.py +32 -13
  8. autocoder/agent/auto_learn_from_commit.py +9 -1
  9. autocoder/agent/base_agentic/__init__.py +3 -0
  10. autocoder/agent/base_agentic/agent_hub.py +1 -1
  11. autocoder/agent/base_agentic/base_agent.py +235 -136
  12. autocoder/agent/base_agentic/default_tools.py +119 -118
  13. autocoder/agent/base_agentic/test_base_agent.py +1 -1
  14. autocoder/agent/base_agentic/tool_registry.py +32 -20
  15. autocoder/agent/base_agentic/tools/read_file_tool_resolver.py +25 -4
  16. autocoder/agent/base_agentic/tools/write_to_file_tool_resolver.py +24 -11
  17. autocoder/agent/base_agentic/types.py +42 -0
  18. autocoder/agent/entry_command_agent/chat.py +73 -59
  19. autocoder/auto_coder.py +31 -40
  20. autocoder/auto_coder_rag.py +11 -1084
  21. autocoder/auto_coder_runner.py +1029 -2310
  22. autocoder/auto_coder_terminal.py +26 -0
  23. autocoder/auto_coder_terminal_v3.py +190 -0
  24. autocoder/chat/conf_command.py +224 -124
  25. autocoder/chat/models_command.py +361 -299
  26. autocoder/chat/rules_command.py +79 -31
  27. autocoder/chat_auto_coder.py +1021 -372
  28. autocoder/chat_auto_coder_lang.py +23 -732
  29. autocoder/commands/auto_command.py +26 -9
  30. autocoder/commands/auto_web.py +1 -1
  31. autocoder/commands/tools.py +44 -44
  32. autocoder/common/__init__.py +150 -128
  33. autocoder/common/ac_style_command_parser/__init__.py +39 -2
  34. autocoder/common/ac_style_command_parser/config.py +422 -0
  35. autocoder/common/ac_style_command_parser/parser.py +292 -78
  36. autocoder/common/ac_style_command_parser/test_parser.py +241 -16
  37. autocoder/common/ac_style_command_parser/test_typed_parser.py +342 -0
  38. autocoder/common/ac_style_command_parser/typed_parser.py +653 -0
  39. autocoder/common/action_yml_file_manager.py +25 -13
  40. autocoder/common/agent_events/__init__.py +52 -0
  41. autocoder/common/agent_events/agent_event_emitter.py +193 -0
  42. autocoder/common/agent_events/event_factory.py +177 -0
  43. autocoder/common/agent_events/examples.py +307 -0
  44. autocoder/common/agent_events/types.py +113 -0
  45. autocoder/common/agent_events/utils.py +68 -0
  46. autocoder/common/agent_hooks/__init__.py +44 -0
  47. autocoder/common/agent_hooks/examples.py +582 -0
  48. autocoder/common/agent_hooks/hook_executor.py +217 -0
  49. autocoder/common/agent_hooks/hook_manager.py +288 -0
  50. autocoder/common/agent_hooks/types.py +133 -0
  51. autocoder/common/agent_hooks/utils.py +99 -0
  52. autocoder/common/agent_query_queue/queue_executor.py +324 -0
  53. autocoder/common/agent_query_queue/queue_manager.py +325 -0
  54. autocoder/common/agents/__init__.py +11 -0
  55. autocoder/common/agents/agent_manager.py +323 -0
  56. autocoder/common/agents/agent_parser.py +189 -0
  57. autocoder/common/agents/example_usage.py +344 -0
  58. autocoder/common/agents/integration_example.py +330 -0
  59. autocoder/common/agents/test_agent_parser.py +545 -0
  60. autocoder/common/async_utils.py +101 -0
  61. autocoder/common/auto_coder_lang.py +23 -972
  62. autocoder/common/autocoderargs_parser/__init__.py +14 -0
  63. autocoder/common/autocoderargs_parser/parser.py +184 -0
  64. autocoder/common/autocoderargs_parser/tests/__init__.py +1 -0
  65. autocoder/common/autocoderargs_parser/tests/test_args_parser.py +235 -0
  66. autocoder/common/autocoderargs_parser/tests/test_token_parser.py +195 -0
  67. autocoder/common/autocoderargs_parser/token_parser.py +290 -0
  68. autocoder/common/buildin_tokenizer.py +2 -4
  69. autocoder/common/code_auto_generate.py +149 -74
  70. autocoder/common/code_auto_generate_diff.py +163 -70
  71. autocoder/common/code_auto_generate_editblock.py +179 -89
  72. autocoder/common/code_auto_generate_strict_diff.py +167 -72
  73. autocoder/common/code_auto_merge_editblock.py +13 -6
  74. autocoder/common/code_modification_ranker.py +1 -1
  75. autocoder/common/command_completer.py +3 -3
  76. autocoder/common/command_file_manager/manager.py +183 -47
  77. autocoder/common/command_file_manager/test_command_file_manager.py +507 -0
  78. autocoder/common/command_templates.py +1 -1
  79. autocoder/common/conf_utils.py +2 -4
  80. autocoder/common/conversations/config.py +11 -3
  81. autocoder/common/conversations/get_conversation_manager.py +100 -2
  82. autocoder/common/conversations/llm_stats_models.py +264 -0
  83. autocoder/common/conversations/manager.py +112 -28
  84. autocoder/common/conversations/models.py +16 -2
  85. autocoder/common/conversations/storage/index_manager.py +134 -10
  86. autocoder/common/core_config/__init__.py +63 -0
  87. autocoder/common/core_config/agentic_mode_manager.py +109 -0
  88. autocoder/common/core_config/base_manager.py +123 -0
  89. autocoder/common/core_config/compatibility.py +151 -0
  90. autocoder/common/core_config/config_manager.py +156 -0
  91. autocoder/common/core_config/conversation_manager.py +31 -0
  92. autocoder/common/core_config/exclude_manager.py +72 -0
  93. autocoder/common/core_config/file_manager.py +177 -0
  94. autocoder/common/core_config/human_as_model_manager.py +129 -0
  95. autocoder/common/core_config/lib_manager.py +54 -0
  96. autocoder/common/core_config/main_manager.py +81 -0
  97. autocoder/common/core_config/mode_manager.py +126 -0
  98. autocoder/common/core_config/models.py +70 -0
  99. autocoder/common/core_config/test_memory_manager.py +1056 -0
  100. autocoder/common/env_manager.py +282 -0
  101. autocoder/common/env_manager_usage_example.py +211 -0
  102. autocoder/common/file_checkpoint/conversation_checkpoint.py +19 -19
  103. autocoder/common/file_checkpoint/manager.py +264 -48
  104. autocoder/common/file_checkpoint/test_backup.py +1 -18
  105. autocoder/common/file_checkpoint/test_manager.py +270 -1
  106. autocoder/common/file_checkpoint/test_store.py +1 -17
  107. autocoder/common/file_handler/__init__.py +23 -0
  108. autocoder/common/file_handler/active_context_handler.py +159 -0
  109. autocoder/common/file_handler/add_files_handler.py +409 -0
  110. autocoder/common/file_handler/chat_handler.py +180 -0
  111. autocoder/common/file_handler/coding_handler.py +401 -0
  112. autocoder/common/file_handler/commit_handler.py +200 -0
  113. autocoder/common/file_handler/lib_handler.py +156 -0
  114. autocoder/common/file_handler/list_files_handler.py +111 -0
  115. autocoder/common/file_handler/mcp_handler.py +268 -0
  116. autocoder/common/file_handler/models_handler.py +493 -0
  117. autocoder/common/file_handler/remove_files_handler.py +172 -0
  118. autocoder/common/file_monitor/test_file_monitor.py +307 -0
  119. autocoder/common/git_utils.py +51 -10
  120. autocoder/common/global_cancel.py +15 -6
  121. autocoder/common/ignorefiles/test_ignore_file_utils.py +1 -1
  122. autocoder/common/international/__init__.py +31 -0
  123. autocoder/common/international/demo_international.py +92 -0
  124. autocoder/common/international/message_manager.py +157 -0
  125. autocoder/common/international/messages/__init__.py +56 -0
  126. autocoder/common/international/messages/async_command_messages.py +507 -0
  127. autocoder/common/international/messages/auto_coder_messages.py +2208 -0
  128. autocoder/common/international/messages/chat_auto_coder_messages.py +1547 -0
  129. autocoder/common/international/messages/command_help_messages.py +986 -0
  130. autocoder/common/international/messages/conversation_command_messages.py +191 -0
  131. autocoder/common/international/messages/git_helper_plugin_messages.py +159 -0
  132. autocoder/common/international/messages/queue_command_messages.py +751 -0
  133. autocoder/common/international/messages/rules_command_messages.py +77 -0
  134. autocoder/common/international/messages/sdk_messages.py +1707 -0
  135. autocoder/common/international/messages/token_helper_plugin_messages.py +361 -0
  136. autocoder/common/international/messages/tool_display_messages.py +1212 -0
  137. autocoder/common/international/messages/workflow_exception_messages.py +473 -0
  138. autocoder/common/international/test_international.py +612 -0
  139. autocoder/common/linter_core/__init__.py +28 -0
  140. autocoder/common/linter_core/base_linter.py +61 -0
  141. autocoder/common/linter_core/config_loader.py +271 -0
  142. autocoder/common/linter_core/formatters/__init__.py +0 -0
  143. autocoder/common/linter_core/formatters/base_formatter.py +38 -0
  144. autocoder/common/linter_core/formatters/raw_formatter.py +17 -0
  145. autocoder/common/linter_core/linter.py +166 -0
  146. autocoder/common/linter_core/linter_factory.py +216 -0
  147. autocoder/common/linter_core/linter_manager.py +333 -0
  148. autocoder/common/linter_core/linters/__init__.py +9 -0
  149. autocoder/common/linter_core/linters/java_linter.py +342 -0
  150. autocoder/common/linter_core/linters/python_linter.py +115 -0
  151. autocoder/common/linter_core/linters/typescript_linter.py +119 -0
  152. autocoder/common/linter_core/models/__init__.py +7 -0
  153. autocoder/common/linter_core/models/lint_result.py +91 -0
  154. autocoder/common/linter_core/models.py +33 -0
  155. autocoder/common/linter_core/tests/__init__.py +3 -0
  156. autocoder/common/linter_core/tests/test_config_loader.py +323 -0
  157. autocoder/common/linter_core/tests/test_config_loading.py +308 -0
  158. autocoder/common/linter_core/tests/test_factory_manager.py +234 -0
  159. autocoder/common/linter_core/tests/test_formatters.py +147 -0
  160. autocoder/common/linter_core/tests/test_integration.py +317 -0
  161. autocoder/common/linter_core/tests/test_java_linter.py +496 -0
  162. autocoder/common/linter_core/tests/test_linters.py +265 -0
  163. autocoder/common/linter_core/tests/test_models.py +81 -0
  164. autocoder/common/linter_core/tests/verify_config_loading.py +296 -0
  165. autocoder/common/linter_core/tests/verify_fixes.py +183 -0
  166. autocoder/common/llm_friendly_package/__init__.py +31 -0
  167. autocoder/common/llm_friendly_package/base_manager.py +102 -0
  168. autocoder/common/llm_friendly_package/docs_manager.py +121 -0
  169. autocoder/common/llm_friendly_package/library_manager.py +171 -0
  170. autocoder/common/{llm_friendly_package.py → llm_friendly_package/main_manager.py} +204 -231
  171. autocoder/common/llm_friendly_package/models.py +40 -0
  172. autocoder/common/llm_friendly_package/test_llm_friendly_package.py +536 -0
  173. autocoder/common/llms/__init__.py +15 -0
  174. autocoder/common/llms/demo_error_handling.py +85 -0
  175. autocoder/common/llms/factory.py +142 -0
  176. autocoder/common/llms/manager.py +264 -0
  177. autocoder/common/llms/pricing.py +121 -0
  178. autocoder/common/llms/registry.py +288 -0
  179. autocoder/common/llms/schema.py +77 -0
  180. autocoder/common/llms/simple_demo.py +45 -0
  181. autocoder/common/llms/test_quick_model.py +116 -0
  182. autocoder/common/llms/test_remove_functionality.py +182 -0
  183. autocoder/common/llms/tests/__init__.py +1 -0
  184. autocoder/common/llms/tests/test_manager.py +330 -0
  185. autocoder/common/llms/tests/test_registry.py +364 -0
  186. autocoder/common/mcp_tools/__init__.py +62 -0
  187. autocoder/common/{mcp_tools.py → mcp_tools/executor.py} +49 -40
  188. autocoder/common/{mcp_hub.py → mcp_tools/hub.py} +42 -68
  189. autocoder/common/{mcp_server_install.py → mcp_tools/installer.py} +16 -28
  190. autocoder/common/{mcp_server.py → mcp_tools/server.py} +176 -48
  191. autocoder/common/mcp_tools/test_keyboard_interrupt.py +93 -0
  192. autocoder/common/mcp_tools/test_mcp_tools.py +391 -0
  193. autocoder/common/{mcp_server_types.py → mcp_tools/types.py} +121 -48
  194. autocoder/common/mcp_tools/verify_functionality.py +202 -0
  195. autocoder/common/model_speed_tester.py +32 -26
  196. autocoder/common/priority_directory_finder/__init__.py +142 -0
  197. autocoder/common/priority_directory_finder/examples.py +230 -0
  198. autocoder/common/priority_directory_finder/finder.py +283 -0
  199. autocoder/common/priority_directory_finder/models.py +236 -0
  200. autocoder/common/priority_directory_finder/test_priority_directory_finder.py +431 -0
  201. autocoder/common/project_scanner/__init__.py +18 -0
  202. autocoder/common/project_scanner/compat.py +77 -0
  203. autocoder/common/project_scanner/scanner.py +436 -0
  204. autocoder/common/project_tracker/__init__.py +27 -0
  205. autocoder/common/project_tracker/api.py +228 -0
  206. autocoder/common/project_tracker/demo.py +272 -0
  207. autocoder/common/project_tracker/tracker.py +487 -0
  208. autocoder/common/project_tracker/types.py +53 -0
  209. autocoder/common/pruner/__init__.py +67 -0
  210. autocoder/common/pruner/agentic_conversation_pruner.py +746 -0
  211. autocoder/common/{context_pruner.py → pruner/context_pruner.py} +137 -40
  212. autocoder/common/pruner/conversation_message_ids_api.py +386 -0
  213. autocoder/common/pruner/conversation_message_ids_manager.py +347 -0
  214. autocoder/common/pruner/conversation_message_ids_pruner.py +473 -0
  215. autocoder/common/pruner/conversation_normalizer.py +347 -0
  216. autocoder/common/{conversation_pruner.py → pruner/conversation_pruner.py} +26 -6
  217. autocoder/common/pruner/test_agentic_conversation_pruner.py +784 -0
  218. autocoder/common/pruner/test_context_pruner.py +546 -0
  219. autocoder/common/pruner/test_conversation_normalizer.py +502 -0
  220. autocoder/common/pruner/test_tool_content_detector.py +324 -0
  221. autocoder/common/pruner/tool_content_detector.py +227 -0
  222. autocoder/common/pruner/tools/__init__.py +18 -0
  223. autocoder/common/pruner/tools/query_message_ids.py +264 -0
  224. autocoder/common/pruner/tools/test_agentic_pruning_logic.py +432 -0
  225. autocoder/common/pruner/tools/test_message_ids_pruning_only.py +192 -0
  226. autocoder/common/pull_requests/__init__.py +9 -1
  227. autocoder/common/pull_requests/utils.py +122 -1
  228. autocoder/common/rag_manager/rag_manager.py +36 -40
  229. autocoder/common/rulefiles/__init__.py +53 -1
  230. autocoder/common/rulefiles/api.py +250 -0
  231. autocoder/common/rulefiles/core/__init__.py +14 -0
  232. autocoder/common/rulefiles/core/manager.py +241 -0
  233. autocoder/common/rulefiles/core/selector.py +805 -0
  234. autocoder/common/rulefiles/models/__init__.py +20 -0
  235. autocoder/common/rulefiles/models/index.py +16 -0
  236. autocoder/common/rulefiles/models/init_rule.py +18 -0
  237. autocoder/common/rulefiles/models/rule_file.py +18 -0
  238. autocoder/common/rulefiles/models/rule_relevance.py +14 -0
  239. autocoder/common/rulefiles/models/summary.py +16 -0
  240. autocoder/common/rulefiles/test_rulefiles.py +776 -0
  241. autocoder/common/rulefiles/utils/__init__.py +34 -0
  242. autocoder/common/rulefiles/utils/monitor.py +86 -0
  243. autocoder/common/rulefiles/utils/parser.py +230 -0
  244. autocoder/common/save_formatted_log.py +67 -10
  245. autocoder/common/search_replace.py +8 -1
  246. autocoder/common/search_replace_patch/__init__.py +24 -0
  247. autocoder/common/search_replace_patch/base.py +115 -0
  248. autocoder/common/search_replace_patch/manager.py +248 -0
  249. autocoder/common/search_replace_patch/patch_replacer.py +304 -0
  250. autocoder/common/search_replace_patch/similarity_replacer.py +306 -0
  251. autocoder/common/search_replace_patch/string_replacer.py +181 -0
  252. autocoder/common/search_replace_patch/tests/__init__.py +3 -0
  253. autocoder/common/search_replace_patch/tests/run_tests.py +126 -0
  254. autocoder/common/search_replace_patch/tests/test_base.py +188 -0
  255. autocoder/common/search_replace_patch/tests/test_empty_line_insert.py +233 -0
  256. autocoder/common/search_replace_patch/tests/test_integration.py +389 -0
  257. autocoder/common/search_replace_patch/tests/test_manager.py +351 -0
  258. autocoder/common/search_replace_patch/tests/test_patch_replacer.py +316 -0
  259. autocoder/common/search_replace_patch/tests/test_regex_replacer.py +306 -0
  260. autocoder/common/search_replace_patch/tests/test_similarity_replacer.py +384 -0
  261. autocoder/common/shell_commands/__init__.py +197 -0
  262. autocoder/common/shell_commands/background_process_notifier.py +346 -0
  263. autocoder/common/shell_commands/command_executor.py +1127 -0
  264. autocoder/common/shell_commands/error_recovery.py +541 -0
  265. autocoder/common/shell_commands/exceptions.py +120 -0
  266. autocoder/common/shell_commands/interactive_executor.py +476 -0
  267. autocoder/common/shell_commands/interactive_pexpect_process.py +623 -0
  268. autocoder/common/shell_commands/interactive_process.py +744 -0
  269. autocoder/common/shell_commands/interactive_session_manager.py +1014 -0
  270. autocoder/common/shell_commands/monitoring.py +529 -0
  271. autocoder/common/shell_commands/process_cleanup.py +386 -0
  272. autocoder/common/shell_commands/process_manager.py +606 -0
  273. autocoder/common/shell_commands/test_interactive_pexpect_process.py +281 -0
  274. autocoder/common/shell_commands/tests/__init__.py +6 -0
  275. autocoder/common/shell_commands/tests/conftest.py +118 -0
  276. autocoder/common/shell_commands/tests/test_background_process_notifier.py +703 -0
  277. autocoder/common/shell_commands/tests/test_command_executor.py +448 -0
  278. autocoder/common/shell_commands/tests/test_error_recovery.py +305 -0
  279. autocoder/common/shell_commands/tests/test_exceptions.py +299 -0
  280. autocoder/common/shell_commands/tests/test_execute_batch.py +588 -0
  281. autocoder/common/shell_commands/tests/test_indented_batch_commands.py +244 -0
  282. autocoder/common/shell_commands/tests/test_integration.py +664 -0
  283. autocoder/common/shell_commands/tests/test_monitoring.py +546 -0
  284. autocoder/common/shell_commands/tests/test_performance.py +632 -0
  285. autocoder/common/shell_commands/tests/test_process_cleanup.py +397 -0
  286. autocoder/common/shell_commands/tests/test_process_manager.py +606 -0
  287. autocoder/common/shell_commands/tests/test_timeout_config.py +343 -0
  288. autocoder/common/shell_commands/tests/test_timeout_manager.py +520 -0
  289. autocoder/common/shell_commands/timeout_config.py +315 -0
  290. autocoder/common/shell_commands/timeout_manager.py +352 -0
  291. autocoder/common/terminal_paste/__init__.py +14 -0
  292. autocoder/common/terminal_paste/demo.py +145 -0
  293. autocoder/common/terminal_paste/demo_paste_functionality.py +95 -0
  294. autocoder/common/terminal_paste/paste_handler.py +200 -0
  295. autocoder/common/terminal_paste/paste_manager.py +118 -0
  296. autocoder/common/terminal_paste/tests/__init__.py +1 -0
  297. autocoder/common/terminal_paste/tests/test_paste_handler.py +182 -0
  298. autocoder/common/terminal_paste/tests/test_paste_manager.py +126 -0
  299. autocoder/common/terminal_paste/utils.py +163 -0
  300. autocoder/common/test_autocoder_args.py +232 -0
  301. autocoder/common/test_env_manager.py +173 -0
  302. autocoder/common/test_env_manager_integration.py +159 -0
  303. autocoder/common/text_similarity/__init__.py +9 -0
  304. autocoder/common/text_similarity/demo.py +216 -0
  305. autocoder/common/text_similarity/examples.py +266 -0
  306. autocoder/common/text_similarity/test_text_similarity.py +306 -0
  307. autocoder/common/text_similarity/text_similarity.py +194 -0
  308. autocoder/common/text_similarity/utils.py +125 -0
  309. autocoder/common/todos/__init__.py +61 -0
  310. autocoder/common/todos/cache/__init__.py +16 -0
  311. autocoder/common/todos/cache/base_cache.py +89 -0
  312. autocoder/common/todos/cache/cache_manager.py +228 -0
  313. autocoder/common/todos/cache/memory_cache.py +225 -0
  314. autocoder/common/todos/config.py +155 -0
  315. autocoder/common/todos/exceptions.py +35 -0
  316. autocoder/common/todos/get_todo_manager.py +161 -0
  317. autocoder/common/todos/manager.py +537 -0
  318. autocoder/common/todos/models.py +239 -0
  319. autocoder/common/todos/storage/__init__.py +14 -0
  320. autocoder/common/todos/storage/base_storage.py +76 -0
  321. autocoder/common/todos/storage/file_storage.py +278 -0
  322. autocoder/common/tokens/__init__.py +15 -0
  323. autocoder/common/tokens/counter.py +44 -2
  324. autocoder/common/tools_manager/__init__.py +17 -0
  325. autocoder/common/tools_manager/examples.py +162 -0
  326. autocoder/common/tools_manager/manager.py +385 -0
  327. autocoder/common/tools_manager/models.py +39 -0
  328. autocoder/common/tools_manager/test_tools_manager.py +303 -0
  329. autocoder/common/tools_manager/utils.py +191 -0
  330. autocoder/common/v2/agent/agentic_callbacks.py +270 -0
  331. autocoder/common/v2/agent/agentic_edit.py +2729 -2052
  332. autocoder/common/v2/agent/agentic_edit_change_manager.py +474 -0
  333. autocoder/common/v2/agent/agentic_edit_tools/__init__.py +43 -2
  334. autocoder/common/v2/agent/agentic_edit_tools/ac_mod_list_tool_resolver.py +279 -0
  335. autocoder/common/v2/agent/agentic_edit_tools/ac_mod_read_tool_resolver.py +40 -0
  336. autocoder/common/v2/agent/agentic_edit_tools/ac_mod_write_tool_resolver.py +52 -0
  337. autocoder/common/v2/agent/agentic_edit_tools/ask_followup_question_tool_resolver.py +8 -0
  338. autocoder/common/v2/agent/agentic_edit_tools/background_task_tool_resolver.py +1167 -0
  339. autocoder/common/v2/agent/agentic_edit_tools/base_tool_resolver.py +2 -2
  340. autocoder/common/v2/agent/agentic_edit_tools/conversation_message_ids_read_tool_resolver.py +214 -0
  341. autocoder/common/v2/agent/agentic_edit_tools/conversation_message_ids_write_tool_resolver.py +299 -0
  342. autocoder/common/v2/agent/agentic_edit_tools/count_tokens_tool_resolver.py +290 -0
  343. autocoder/common/v2/agent/agentic_edit_tools/execute_command_tool_resolver.py +565 -30
  344. autocoder/common/v2/agent/agentic_edit_tools/execute_workflow_tool_resolver.py +485 -0
  345. autocoder/common/v2/agent/agentic_edit_tools/extract_to_text_tool_resolver.py +225 -0
  346. autocoder/common/v2/agent/agentic_edit_tools/lint_report.py +79 -0
  347. autocoder/common/v2/agent/agentic_edit_tools/linter_config_models.py +343 -0
  348. autocoder/common/v2/agent/agentic_edit_tools/linter_enabled_tool_resolver.py +189 -0
  349. autocoder/common/v2/agent/agentic_edit_tools/list_files_tool_resolver.py +169 -101
  350. autocoder/common/v2/agent/agentic_edit_tools/load_extra_document_tool_resolver.py +349 -0
  351. autocoder/common/v2/agent/agentic_edit_tools/read_file_tool_resolver.py +244 -51
  352. autocoder/common/v2/agent/agentic_edit_tools/replace_in_file_tool_resolver.py +667 -147
  353. autocoder/common/v2/agent/agentic_edit_tools/run_named_subagents_tool_resolver.py +691 -0
  354. autocoder/common/v2/agent/agentic_edit_tools/search_files_tool_resolver.py +409 -140
  355. autocoder/common/v2/agent/agentic_edit_tools/session_interactive_tool_resolver.py +115 -0
  356. autocoder/common/v2/agent/agentic_edit_tools/session_start_tool_resolver.py +190 -0
  357. autocoder/common/v2/agent/agentic_edit_tools/session_stop_tool_resolver.py +76 -0
  358. autocoder/common/v2/agent/agentic_edit_tools/test_write_to_file_tool_resolver.py +209 -194
  359. autocoder/common/v2/agent/agentic_edit_tools/todo_read_tool_resolver.py +135 -0
  360. autocoder/common/v2/agent/agentic_edit_tools/todo_write_tool_resolver.py +328 -0
  361. autocoder/common/v2/agent/agentic_edit_tools/use_mcp_tool_resolver.py +2 -2
  362. autocoder/common/v2/agent/agentic_edit_tools/web_crawl_tool_resolver.py +557 -0
  363. autocoder/common/v2/agent/agentic_edit_tools/web_search_tool_resolver.py +600 -0
  364. autocoder/common/v2/agent/agentic_edit_tools/write_to_file_tool_resolver.py +56 -121
  365. autocoder/common/v2/agent/agentic_edit_types.py +386 -10
  366. autocoder/common/v2/agent/runner/__init__.py +31 -0
  367. autocoder/common/v2/agent/runner/base_runner.py +92 -0
  368. autocoder/common/v2/agent/runner/file_based_event_runner.py +217 -0
  369. autocoder/common/v2/agent/runner/sdk_runner.py +182 -0
  370. autocoder/common/v2/agent/runner/terminal_runner.py +396 -0
  371. autocoder/common/v2/agent/runner/tool_display.py +589 -0
  372. autocoder/common/v2/agent/test_agentic_callbacks.py +265 -0
  373. autocoder/common/v2/agent/test_agentic_edit.py +194 -0
  374. autocoder/common/v2/agent/tool_caller/__init__.py +24 -0
  375. autocoder/common/v2/agent/tool_caller/default_tool_resolver_map.py +135 -0
  376. autocoder/common/v2/agent/tool_caller/integration_test.py +172 -0
  377. autocoder/common/v2/agent/tool_caller/plugins/__init__.py +14 -0
  378. autocoder/common/v2/agent/tool_caller/plugins/base_plugin.py +126 -0
  379. autocoder/common/v2/agent/tool_caller/plugins/examples/__init__.py +13 -0
  380. autocoder/common/v2/agent/tool_caller/plugins/examples/logging_plugin.py +164 -0
  381. autocoder/common/v2/agent/tool_caller/plugins/examples/security_filter_plugin.py +198 -0
  382. autocoder/common/v2/agent/tool_caller/plugins/plugin_interface.py +141 -0
  383. autocoder/common/v2/agent/tool_caller/test_tool_caller.py +278 -0
  384. autocoder/common/v2/agent/tool_caller/tool_call_plugin_manager.py +331 -0
  385. autocoder/common/v2/agent/tool_caller/tool_caller.py +337 -0
  386. autocoder/common/v2/agent/tool_caller/usage_example.py +193 -0
  387. autocoder/common/v2/code_agentic_editblock_manager.py +4 -4
  388. autocoder/common/v2/code_auto_generate.py +136 -78
  389. autocoder/common/v2/code_auto_generate_diff.py +135 -79
  390. autocoder/common/v2/code_auto_generate_editblock.py +174 -99
  391. autocoder/common/v2/code_auto_generate_strict_diff.py +151 -71
  392. autocoder/common/v2/code_auto_merge.py +1 -1
  393. autocoder/common/v2/code_auto_merge_editblock.py +13 -1
  394. autocoder/common/v2/code_diff_manager.py +3 -3
  395. autocoder/common/v2/code_editblock_manager.py +4 -14
  396. autocoder/common/v2/code_manager.py +1 -1
  397. autocoder/common/v2/code_strict_diff_manager.py +2 -2
  398. autocoder/common/wrap_llm_hint/__init__.py +10 -0
  399. autocoder/common/wrap_llm_hint/test_wrap_llm_hint.py +1067 -0
  400. autocoder/common/wrap_llm_hint/utils.py +432 -0
  401. autocoder/common/wrap_llm_hint/wrap_llm_hint.py +323 -0
  402. autocoder/completer/__init__.py +8 -0
  403. autocoder/completer/command_completer_v2.py +1051 -0
  404. autocoder/default_project/__init__.py +501 -0
  405. autocoder/dispacher/__init__.py +4 -12
  406. autocoder/dispacher/actions/action.py +165 -7
  407. autocoder/dispacher/actions/plugins/action_regex_project.py +2 -2
  408. autocoder/index/entry.py +117 -125
  409. autocoder/{agent → index/filter}/agentic_filter.py +323 -334
  410. autocoder/index/filter/normal_filter.py +5 -11
  411. autocoder/index/filter/quick_filter.py +1 -1
  412. autocoder/index/index.py +36 -9
  413. autocoder/index/tests/__init__.py +1 -0
  414. autocoder/index/tests/run_tests.py +195 -0
  415. autocoder/index/tests/test_entry.py +303 -0
  416. autocoder/index/tests/test_index_manager.py +314 -0
  417. autocoder/index/tests/test_module_integration.py +300 -0
  418. autocoder/index/tests/test_symbols_utils.py +183 -0
  419. autocoder/inner/__init__.py +4 -0
  420. autocoder/inner/agentic.py +932 -0
  421. autocoder/inner/async_command_handler.py +992 -0
  422. autocoder/inner/conversation_command_handlers.py +623 -0
  423. autocoder/inner/merge_command_handler.py +213 -0
  424. autocoder/inner/queue_command_handler.py +684 -0
  425. autocoder/models.py +95 -266
  426. autocoder/plugins/git_helper_plugin.py +31 -29
  427. autocoder/plugins/token_helper_plugin.py +156 -37
  428. autocoder/pyproject/__init__.py +32 -29
  429. autocoder/rag/agentic_rag.py +215 -75
  430. autocoder/rag/cache/simple_cache.py +1 -2
  431. autocoder/rag/loaders/image_loader.py +1 -1
  432. autocoder/rag/long_context_rag.py +42 -26
  433. autocoder/rag/qa_conversation_strategy.py +1 -1
  434. autocoder/rag/terminal/__init__.py +17 -0
  435. autocoder/rag/terminal/args.py +581 -0
  436. autocoder/rag/terminal/bootstrap.py +61 -0
  437. autocoder/rag/terminal/command_handlers.py +653 -0
  438. autocoder/rag/terminal/formatters/__init__.py +20 -0
  439. autocoder/rag/terminal/formatters/base.py +70 -0
  440. autocoder/rag/terminal/formatters/json_format.py +66 -0
  441. autocoder/rag/terminal/formatters/stream_json.py +95 -0
  442. autocoder/rag/terminal/formatters/text.py +28 -0
  443. autocoder/rag/terminal/init.py +120 -0
  444. autocoder/rag/terminal/utils.py +106 -0
  445. autocoder/rag/test_agentic_rag.py +389 -0
  446. autocoder/rag/test_doc_filter.py +3 -3
  447. autocoder/rag/test_long_context_rag.py +1 -1
  448. autocoder/rag/test_token_limiter.py +517 -10
  449. autocoder/rag/token_counter.py +3 -0
  450. autocoder/rag/token_limiter.py +19 -15
  451. autocoder/rag/tools/__init__.py +26 -2
  452. autocoder/rag/tools/bochaai_example.py +343 -0
  453. autocoder/rag/tools/bochaai_sdk.py +541 -0
  454. autocoder/rag/tools/metaso_example.py +268 -0
  455. autocoder/rag/tools/metaso_sdk.py +417 -0
  456. autocoder/rag/tools/recall_tool.py +28 -7
  457. autocoder/rag/tools/run_integration_tests.py +204 -0
  458. autocoder/rag/tools/test_all_providers.py +318 -0
  459. autocoder/rag/tools/test_bochaai_integration.py +482 -0
  460. autocoder/rag/tools/test_final_integration.py +215 -0
  461. autocoder/rag/tools/test_metaso_integration.py +424 -0
  462. autocoder/rag/tools/test_metaso_real.py +171 -0
  463. autocoder/rag/tools/test_web_crawl_tool.py +639 -0
  464. autocoder/rag/tools/test_web_search_tool.py +509 -0
  465. autocoder/rag/tools/todo_read_tool.py +202 -0
  466. autocoder/rag/tools/todo_write_tool.py +412 -0
  467. autocoder/rag/tools/web_crawl_tool.py +634 -0
  468. autocoder/rag/tools/web_search_tool.py +558 -0
  469. autocoder/rag/tools/web_tools_example.py +119 -0
  470. autocoder/rag/types.py +16 -0
  471. autocoder/rag/variable_holder.py +4 -2
  472. autocoder/rags.py +86 -79
  473. autocoder/regexproject/__init__.py +23 -21
  474. autocoder/run_context.py +9 -0
  475. autocoder/sdk/__init__.py +50 -161
  476. autocoder/sdk/api.py +370 -0
  477. autocoder/sdk/async_runner/__init__.py +26 -0
  478. autocoder/sdk/async_runner/async_executor.py +650 -0
  479. autocoder/sdk/async_runner/async_handler.py +356 -0
  480. autocoder/sdk/async_runner/markdown_processor.py +595 -0
  481. autocoder/sdk/async_runner/task_metadata.py +284 -0
  482. autocoder/sdk/async_runner/worktree_manager.py +438 -0
  483. autocoder/sdk/cli/__init__.py +2 -5
  484. autocoder/sdk/cli/formatters.py +28 -204
  485. autocoder/sdk/cli/handlers.py +77 -44
  486. autocoder/sdk/cli/main.py +158 -170
  487. autocoder/sdk/cli/options.py +95 -22
  488. autocoder/sdk/constants.py +139 -51
  489. autocoder/sdk/core/auto_coder_core.py +484 -267
  490. autocoder/sdk/core/bridge.py +298 -118
  491. autocoder/sdk/exceptions.py +18 -12
  492. autocoder/sdk/formatters/__init__.py +19 -0
  493. autocoder/sdk/formatters/input.py +64 -0
  494. autocoder/sdk/formatters/output.py +247 -0
  495. autocoder/sdk/formatters/stream.py +54 -0
  496. autocoder/sdk/models/__init__.py +6 -5
  497. autocoder/sdk/models/options.py +55 -18
  498. autocoder/sdk/utils/formatters.py +27 -195
  499. autocoder/suffixproject/__init__.py +28 -25
  500. autocoder/terminal/__init__.py +14 -0
  501. autocoder/terminal/app.py +454 -0
  502. autocoder/terminal/args.py +32 -0
  503. autocoder/terminal/bootstrap.py +178 -0
  504. autocoder/terminal/command_processor.py +521 -0
  505. autocoder/terminal/command_registry.py +57 -0
  506. autocoder/terminal/help.py +97 -0
  507. autocoder/terminal/tasks/__init__.py +5 -0
  508. autocoder/terminal/tasks/background.py +77 -0
  509. autocoder/terminal/tasks/task_event.py +70 -0
  510. autocoder/terminal/ui/__init__.py +13 -0
  511. autocoder/terminal/ui/completer.py +268 -0
  512. autocoder/terminal/ui/keybindings.py +75 -0
  513. autocoder/terminal/ui/session.py +41 -0
  514. autocoder/terminal/ui/toolbar.py +64 -0
  515. autocoder/terminal/utils/__init__.py +13 -0
  516. autocoder/terminal/utils/errors.py +18 -0
  517. autocoder/terminal/utils/paths.py +19 -0
  518. autocoder/terminal/utils/shell.py +43 -0
  519. autocoder/terminal_v3/__init__.py +10 -0
  520. autocoder/terminal_v3/app.py +201 -0
  521. autocoder/terminal_v3/handlers/__init__.py +5 -0
  522. autocoder/terminal_v3/handlers/command_handler.py +131 -0
  523. autocoder/terminal_v3/models/__init__.py +6 -0
  524. autocoder/terminal_v3/models/conversation_buffer.py +214 -0
  525. autocoder/terminal_v3/models/message.py +50 -0
  526. autocoder/terminal_v3/models/tool_display.py +247 -0
  527. autocoder/terminal_v3/ui/__init__.py +7 -0
  528. autocoder/terminal_v3/ui/keybindings.py +56 -0
  529. autocoder/terminal_v3/ui/layout.py +141 -0
  530. autocoder/terminal_v3/ui/styles.py +43 -0
  531. autocoder/tsproject/__init__.py +23 -23
  532. autocoder/utils/auto_coder_utils/chat_stream_out.py +1 -1
  533. autocoder/utils/llms.py +88 -80
  534. autocoder/utils/math_utils.py +101 -0
  535. autocoder/utils/model_provider_selector.py +16 -4
  536. autocoder/utils/operate_config_api.py +33 -5
  537. autocoder/utils/thread_utils.py +2 -2
  538. autocoder/version.py +4 -2
  539. autocoder/workflow_agents/__init__.py +84 -0
  540. autocoder/workflow_agents/agent.py +143 -0
  541. autocoder/workflow_agents/exceptions.py +573 -0
  542. autocoder/workflow_agents/executor.py +489 -0
  543. autocoder/workflow_agents/loader.py +737 -0
  544. autocoder/workflow_agents/runner.py +267 -0
  545. autocoder/workflow_agents/types.py +172 -0
  546. autocoder/workflow_agents/utils.py +434 -0
  547. autocoder/workflow_agents/workflow_manager.py +211 -0
  548. auto_coder-0.1.400.dist-info/METADATA +0 -396
  549. auto_coder-0.1.400.dist-info/RECORD +0 -425
  550. auto_coder-0.1.400.dist-info/licenses/LICENSE +0 -201
  551. autocoder/auto_coder_server.py +0 -672
  552. autocoder/benchmark.py +0 -138
  553. autocoder/common/ac_style_command_parser/example.py +0 -7
  554. autocoder/common/cleaner.py +0 -31
  555. autocoder/common/command_completer_v2.py +0 -615
  556. autocoder/common/directory_cache/__init__.py +0 -1
  557. autocoder/common/directory_cache/cache.py +0 -192
  558. autocoder/common/directory_cache/test_cache.py +0 -190
  559. autocoder/common/file_checkpoint/examples.py +0 -217
  560. autocoder/common/llm_friendly_package_example.py +0 -138
  561. autocoder/common/llm_friendly_package_test.py +0 -63
  562. autocoder/common/pull_requests/test_module.py +0 -1
  563. autocoder/common/rulefiles/autocoderrules_utils.py +0 -484
  564. autocoder/common/text.py +0 -30
  565. autocoder/common/v2/agent/agentic_edit_tools/list_package_info_tool_resolver.py +0 -42
  566. autocoder/common/v2/agent/agentic_edit_tools/test_execute_command_tool_resolver.py +0 -70
  567. autocoder/common/v2/agent/agentic_edit_tools/test_search_files_tool_resolver.py +0 -163
  568. autocoder/common/v2/agent/agentic_tool_display.py +0 -183
  569. autocoder/plugins/dynamic_completion_example.py +0 -148
  570. autocoder/plugins/sample_plugin.py +0 -160
  571. autocoder/sdk/cli/__main__.py +0 -26
  572. autocoder/sdk/cli/completion_wrapper.py +0 -38
  573. autocoder/sdk/cli/install_completion.py +0 -301
  574. autocoder/sdk/models/messages.py +0 -209
  575. autocoder/sdk/session/__init__.py +0 -32
  576. autocoder/sdk/session/session.py +0 -106
  577. autocoder/sdk/session/session_manager.py +0 -56
  578. {auto_coder-0.1.400.dist-info → auto_coder-2.0.0.dist-info}/top_level.txt +0 -0
  579. /autocoder/{sdk/example.py → common/agent_query_queue/__init__.py} +0 -0
@@ -0,0 +1,595 @@
1
+
2
+
3
+ """
4
+ Markdown 处理器模块
5
+
6
+ 提供智能 Markdown 解析和分割功能,支持多种分割模式。
7
+ """
8
+
9
+ import re
10
+ import yaml
11
+ import hashlib
12
+ from enum import Enum
13
+ from dataclasses import dataclass, field
14
+ from typing import List, Dict, Any, Optional, Callable
15
+ from pathlib import Path
16
+ from autocoder.common.international import get_message, get_message_with_format
17
+
18
+
19
class SplitMode(Enum):
    """Strategies for dividing Markdown content into separate documents."""

    # Split on a literal delimiter string (compatibility mode).
    DELIMITER = "delimiter"
    # Split at H1 headings.
    HEADING1 = "h1"
    # Split at H2 headings.
    HEADING2 = "h2"
    # Split at H3 headings.
    HEADING3 = "h3"
    # Split at any heading.
    ANY_HEADING = "any"
    # Split on YAML front matter.
    FRONT_MATTER = "frontmatter"
    # Split using a custom regular-expression pattern.
    CUSTOM_PATTERN = "custom"
28
+
29
+
30
@dataclass
class SplitterConfig:
    """Tunable settings consumed by the Markdown splitter."""

    # Custom regular-expression pattern.
    pattern: str = ""
    # Minimum document length.
    min_length: int = 50
    # Maximum document length.
    max_length: int = 10000
    # Overlap size, used when a long document is split into pieces.
    overlap_size: int = 100
    # Whether context should be preserved.
    preserve_context: bool = True
    # Optional user-supplied function that splits raw text into strings.
    custom_splitter: Optional[Callable[[str], List[str]]] = None
39
+
40
+
41
@dataclass
class DocumentPart:
    """One piece of a Markdown document produced by a splitting step."""

    # Text of this piece.
    content: str
    # Title associated with this piece.
    title: str
    # Heading level recorded for this piece.
    level: int = 1
    # Arbitrary key/value data attached to this piece (fresh dict per instance).
    metadata: Dict[str, Any] = field(default_factory=dict)
48
+
49
+
50
@dataclass
class Document:
    """A Markdown document emitted by the processor."""

    # Name of the file the content came from.
    original_file: str
    # Zero-based position of this document among those produced.
    index: int
    # Text of the document.
    content: str
    # Generated temporary file name for this document.
    temp_filename: str
    # Title of the document.
    title: str
    # Heading level recorded for the document.
    heading_level: int = 1
    # Arbitrary key/value data attached to the document (fresh dict per instance).
    metadata: Dict[str, Any] = field(default_factory=dict)
60
+
61
+
62
+ class MarkdownProcessor:
63
+ """Markdown 处理器,用于解析和分割 Markdown 内容"""
64
+
65
def __init__(self):
    """Create a processor with its default splitting behaviour."""
    # Length, overlap and custom-splitter settings live in one config object.
    self.config = SplitterConfig()
    # Heading-level bounds consulted when the mode is ANY_HEADING.
    self.min_heading_level, self.max_heading_level = 1, 6
    # Literal separator used by delimiter-based splitting.
    self.delimiter = "==="
    # Split at H1 headings unless reconfigured.
    self.split_mode = SplitMode.HEADING1
72
+
73
def process_content(self, content: str, filename: str = "stdin") -> List[Document]:
    """
    Split Markdown content and wrap each piece in a ``Document``.

    The steps run in this order:

    1. If the content looks like a bundle of several documents, try to parse
       it as such; a failure is reported and treated as "nothing found".
    2. Otherwise (or after a failure) split by headings, falling back to the
       delimiter when heading splitting yields at most one part or raises.
       In delimiter mode the delimiter is used directly.
    3. A configured custom splitter replaces whatever was found so far.
    4. If nothing was produced, the whole content becomes a single part.
    5. Length constraints are applied and the parts become ``Document`` objects.

    Args:
        content: Markdown text to process.
        filename: Name of the source file; used for ``original_file`` and as
            the basis of the generated temporary file names.

    Returns:
        The list of documents produced from ``content``.
    """
    parts = []

    # Step 1: multi-document detection.
    if self._contains_multiple_documents(content):
        print(get_message("detected_multi_document_structure"))
        try:
            parts = self._parse_multiple_documents(content)
        except Exception as exc:
            print(get_message_with_format("multi_document_parse_failed_fallback", error=str(exc)))
            parts = []

    # Step 2: regular splitting when step 1 produced nothing.
    if not parts:
        if self.split_mode == SplitMode.DELIMITER:
            parts = self._split_by_delimiter(content)
        else:
            try:
                parts = self._split_by_headings(content)
                if len(parts) <= 1:
                    # No usable heading structure: fall back to the delimiter.
                    parts = self._split_by_delimiter(content)
            except Exception:
                # Heading parsing failed: fall back to the delimiter.
                parts = self._split_by_delimiter(content)

    # Step 3: a custom splitter, when configured, overrides earlier results.
    custom_splitter = self.config.custom_splitter
    if custom_splitter:
        print(get_message("using_custom_splitter"))
        parts = self._convert_to_document_parts(custom_splitter(content))

    # Step 4: guarantee at least one part.
    if not parts:
        parts = [DocumentPart(
            content=content.strip(),
            title=self._extract_title(content),
            level=1
        )]

    # Step 5: enforce length limits, then build the Document objects.
    parts = self._apply_length_constraints(parts)
    base_name = self._get_base_name(filename)
    total = len(parts)

    return [
        Document(
            original_file=filename,
            index=position,
            content=part.content,
            title=part.title,
            heading_level=part.level,
            temp_filename=self._generate_temp_filename(base_name, position, total, part.content),
            metadata=part.metadata
        )
        for position, part in enumerate(parts)
    ]
144
+
145
+ def _contains_multiple_documents(self, content: str) -> bool:
146
+ """检测内容是否包含多个独立文档"""
147
+ # 检测 YAML front matter 分隔符
148
+ front_matter_pattern = re.compile(r'^---\s*$', re.MULTILINE)
149
+ matches = front_matter_pattern.findall(content)
150
+ if len(matches) >= 3: # 至少有3个分隔符才认为是多文档
151
+ return True
152
+
153
+ # 检测连续的空行分隔(可能是多文档)
154
+ empty_line_pattern = re.compile(r'\n\s*\n\s*\n')
155
+ if len(empty_line_pattern.findall(content)) >= 2:
156
+ # 进一步检查是否有标题结构
157
+ heading_pattern = re.compile(r'^#{1,6}\s+.+$', re.MULTILINE)
158
+ headings = heading_pattern.findall(content)
159
+ return len(headings) >= 2
160
+
161
+ return False
162
+
163
+ def _parse_multiple_documents(self, content: str) -> List[DocumentPart]:
164
+ """解析多文档结构"""
165
+ parts = []
166
+
167
+ # 尝试按 YAML front matter 分割
168
+ if "---" in content:
169
+ yaml_parts = self._split_by_front_matter(content)
170
+ if len(yaml_parts) > 1:
171
+ parts = yaml_parts
172
+
173
+ # 如果没有找到 YAML 分割,抛出异常
174
+ if not parts:
175
+ raise ValueError(get_message("cannot_parse_multi_document_structure"))
176
+
177
+ return parts
178
+
179
+ def _split_by_front_matter(self, content: str) -> List[DocumentPart]:
180
+ """按 YAML front matter 分割"""
181
+ doc_parts = []
182
+ lines = content.split('\n')
183
+ current_doc = []
184
+ current_yaml = []
185
+ in_yaml = False
186
+ in_content = False
187
+
188
+ for line in lines:
189
+ trimmed = line.strip()
190
+
191
+ if trimmed == "---":
192
+ if not in_yaml and not in_content:
193
+ # 开始新的 YAML block
194
+ in_yaml = True
195
+ continue
196
+ elif in_yaml and not in_content:
197
+ # YAML block 结束,内容开始
198
+ in_yaml = False
199
+ in_content = True
200
+ continue
201
+ elif in_content:
202
+ # 当前文档结束,保存并开始新文档
203
+ if current_doc or current_yaml:
204
+ self._add_front_matter_doc(doc_parts, '\n'.join(current_yaml), '\n'.join(current_doc))
205
+
206
+ # 重置状态
207
+ current_doc = []
208
+ current_yaml = []
209
+ in_yaml = True
210
+ in_content = False
211
+ continue
212
+
213
+ if in_yaml:
214
+ current_yaml.append(line)
215
+ elif in_content:
216
+ current_doc.append(line)
217
+ else:
218
+ # 没有 YAML header 的情况,直接当作内容处理
219
+ current_doc.append(line)
220
+ in_content = True
221
+
222
+ # 添加最后一个文档
223
+ if current_doc or current_yaml:
224
+ self._add_front_matter_doc(doc_parts, '\n'.join(current_yaml), '\n'.join(current_doc))
225
+
226
+ # 如果没有找到任何文档,返回整个内容作为一个文档
227
+ if not doc_parts:
228
+ doc_parts = [DocumentPart(
229
+ content=content.strip(),
230
+ title=self._extract_title(content),
231
+ level=1,
232
+ metadata={}
233
+ )]
234
+
235
+ return doc_parts
236
+
237
+ def _add_front_matter_doc(self, doc_parts: List[DocumentPart], yaml_content: str, markdown_content: str):
238
+ """添加一个 front matter 文档"""
239
+ metadata = self._parse_yaml_metadata(yaml_content)
240
+ content = markdown_content.strip()
241
+
242
+ title = self._extract_title(content)
243
+ if 'title' in metadata and metadata['title']:
244
+ title = str(metadata['title'])
245
+
246
+ if content or metadata:
247
+ doc_parts.append(DocumentPart(
248
+ content=content,
249
+ title=title,
250
+ level=1,
251
+ metadata=metadata
252
+ ))
253
+
254
+ def _parse_yaml_metadata(self, yaml_content: str) -> Dict[str, Any]:
255
+ """解析 YAML 元数据"""
256
+ if not yaml_content.strip():
257
+ return {}
258
+
259
+ try:
260
+ return yaml.safe_load(yaml_content) or {}
261
+ except yaml.YAMLError:
262
+ # 简单解析失败时的备用方案
263
+ metadata = {}
264
+ lines = yaml_content.split('\n')
265
+
266
+ for line in lines:
267
+ line = line.strip()
268
+ if not line or line.startswith('#'):
269
+ continue
270
+
271
+ if ':' in line:
272
+ parts = line.split(':', 1)
273
+ if len(parts) == 2:
274
+ key = parts[0].strip()
275
+ value = parts[1].strip().strip('"\'')
276
+ metadata[key] = value
277
+
278
+ return metadata
279
+
280
+ def _convert_to_document_parts(self, parts: List[str]) -> List[DocumentPart]:
281
+ """将字符串数组转换为 DocumentPart"""
282
+ doc_parts = []
283
+ for part in parts:
284
+ if part.strip():
285
+ doc_parts.append(DocumentPart(
286
+ content=part.strip(),
287
+ title=self._extract_title(part),
288
+ level=1
289
+ ))
290
+ return doc_parts
291
+
292
+ def _apply_length_constraints(self, parts: List[DocumentPart]) -> List[DocumentPart]:
293
+ """应用长度约束和重叠配置"""
294
+ result = []
295
+ too_short_parts = []
296
+
297
+ for part in parts:
298
+ # 如果文档太短,先保存起来
299
+ if len(part.content) < self.config.min_length:
300
+ too_short_parts.append(part)
301
+ continue
302
+
303
+ # 如果文档太长,分割
304
+ if len(part.content) > self.config.max_length:
305
+ sub_parts = self._split_long_document(part)
306
+ result.extend(sub_parts)
307
+ else:
308
+ result.append(part)
309
+
310
+ # 如果所有文档都被过滤掉了(因为太短),至少保留一个最长的
311
+ if not result and too_short_parts:
312
+ longest = max(too_short_parts, key=lambda x: len(x.content))
313
+ result.append(longest)
314
+
315
+ return result
316
+
317
+ def _split_long_document(self, part: DocumentPart) -> List[DocumentPart]:
318
+ """分割过长的文档"""
319
+ parts = []
320
+ content = part.content
321
+ max_len = self.config.max_length
322
+ overlap = self.config.overlap_size
323
+
324
+ # 安全检查:防止无限循环
325
+ max_iterations = 100
326
+ iterations = 0
327
+
328
+ while len(content) > max_len and iterations < max_iterations:
329
+ iterations += 1
330
+
331
+ # 找到合适的分割点
332
+ split_pos = self._find_best_split_position(content, max_len)
333
+
334
+ # 安全检查
335
+ if split_pos <= 0:
336
+ split_pos = max_len // 2
337
+ if split_pos >= len(content):
338
+ break
339
+
340
+ # 创建当前部分
341
+ current_part = DocumentPart(
342
+ content=content[:split_pos],
343
+ title=f"{part.title} (第{len(parts)+1}部分)",
344
+ level=part.level,
345
+ metadata=part.metadata.copy()
346
+ )
347
+ parts.append(current_part)
348
+
349
+ # 计算下一部分的起始位置(考虑重叠)
350
+ next_start = max(0, split_pos - overlap)
351
+ if next_start >= split_pos:
352
+ next_start = split_pos
353
+
354
+ if next_start >= len(content):
355
+ break
356
+
357
+ content = content[next_start:]
358
+
359
+ if len(content) <= overlap:
360
+ break
361
+
362
+ # 添加最后一部分
363
+ if len(content) > self.config.min_length:
364
+ parts.append(DocumentPart(
365
+ content=content,
366
+ title=f"{part.title} (第{len(parts)+1}部分)",
367
+ level=part.level,
368
+ metadata=part.metadata.copy()
369
+ ))
370
+
371
+ # 如果没有成功分割,返回原文档
372
+ if not parts:
373
+ return [part]
374
+
375
+ return parts
376
+
377
+ def _find_best_split_position(self, content: str, max_pos: int) -> int:
378
+ """找到最佳分割位置"""
379
+ if max_pos >= len(content):
380
+ return len(content)
381
+
382
+ # 优先在句号后分割
383
+ for i in range(max_pos - 1, max(0, max_pos - 100), -1):
384
+ if i < len(content) and content[i] == '.' and i + 1 < len(content) and content[i + 1] == ' ':
385
+ return i + 1
386
+
387
+ # 其次在换行符处分割
388
+ for i in range(max_pos - 1, max(0, max_pos - 100), -1):
389
+ if i < len(content) and content[i] == '\n':
390
+ return i + 1
391
+
392
+ # 最后在空格处分割
393
+ for i in range(max_pos - 1, max(0, max_pos - 50), -1):
394
+ if i < len(content) and content[i] == ' ':
395
+ return i + 1
396
+
397
+ return max_pos
398
+
399
def _split_by_headings(self, content: str) -> List[DocumentPart]:
    """Split Markdown content at headings of the configured level(s).

    A line whose stripped text starts with ``#`` is a heading candidate;
    ``_should_split_at_level`` decides whether it starts a new part. Text
    before the first splitting heading becomes a part of its own, with a
    title extracted from its content and level 1.

    Lines inside fenced code blocks (opened by at least three backticks or
    tildes) are never treated as headings, so ``# comment`` lines in code
    samples do not split the document. A fence that is never closed runs to
    the end of the content.

    Args:
        content: Markdown text to split.

    Returns:
        The parts found, or a single part holding the whole content when
        nothing was collected.
    """
    parts = []
    current_part = DocumentPart(content="", title="", level=1)
    current_lines = []
    open_fence = None  # marker string of the fence we are inside, if any

    def close_part(part, lines):
        # Finalise a part from its collected lines and store it.
        part.content = '\n'.join(lines)
        if not part.title:
            part.title = self._extract_title(part.content)
            part.level = 1
        parts.append(part)

    for line in content.split('\n'):
        stripped = line.strip()
        fence = re.match(r'(`{3,}|~{3,})(.*)$', stripped)

        if open_fence is not None:
            # A closing fence uses the same character, is at least as long
            # as the opening one, and carries no other text.
            if (fence
                    and fence.group(1)[0] == open_fence[0]
                    and len(fence.group(1)) >= len(open_fence)
                    and not fence.group(2).strip()):
                open_fence = None
            current_lines.append(line)
            continue

        # Backticks after a backtick run mean an inline code span, not a fence.
        if fence and not (fence.group(1)[0] == '`' and '`' in fence.group(2)):
            open_fence = fence.group(1)
            current_lines.append(line)
            continue

        if stripped.startswith('#'):
            level = self._get_heading_level(line)
            title = self._extract_title_from_line(line)

            if self._should_split_at_level(level):
                # Store what was collected so far, then start a new part
                # whose first line is the heading itself.
                if current_lines:
                    close_part(current_part, current_lines)
                current_part = DocumentPart(content="", title=title, level=level)
                current_lines = [line]
                continue

        # Ordinary line, or a heading that does not trigger a split.
        current_lines.append(line)

    if current_lines:
        close_part(current_part, current_lines)

    if not parts:
        parts = [DocumentPart(
            content=content,
            title=self._extract_title(content),
            level=1
        )]

    return parts
453
+
454
+ def _get_heading_level(self, line: str) -> int:
455
+ """获取标题级别"""
456
+ trimmed = line.strip()
457
+ level = 0
458
+ for char in trimmed:
459
+ if char == '#':
460
+ level += 1
461
+ else:
462
+ break
463
+ return level
464
+
465
+ def _extract_title_from_line(self, line: str) -> str:
466
+ """从标题行提取标题文本"""
467
+ title = re.sub(r'^#+\s*', '', line.strip())
468
+ title = title.strip()
469
+ return title if title else "Untitled"
470
+
471
def _should_split_at_level(self, level: int) -> bool:
    """Tell whether a heading of ``level`` starts a new part in the current mode.

    HEADING1 splits only at level 1, HEADING2 at levels up to 2, HEADING3 at
    levels up to 3, and ANY_HEADING at levels inside the configured
    min/max range. Every other mode never splits at headings.
    """
    mode = self.split_mode

    if mode == SplitMode.ANY_HEADING:
        return self.min_heading_level <= level <= self.max_heading_level
    if mode == SplitMode.HEADING1:
        return level == 1
    if mode == SplitMode.HEADING2:
        return level <= 2
    if mode == SplitMode.HEADING3:
        return level <= 3
    return False
483
+
484
+ def _split_by_delimiter(self, content: str) -> List[DocumentPart]:
485
+ """按分隔符分割内容(向后兼容)"""
486
+ parts = content.split(self.delimiter)
487
+ result = []
488
+
489
+ for part in parts:
490
+ trimmed = part.strip()
491
+ if trimmed:
492
+ result.append(DocumentPart(
493
+ content=trimmed,
494
+ title=self._extract_title(trimmed),
495
+ level=1
496
+ ))
497
+
498
+ return result
499
+
500
+ def _extract_title(self, content: str) -> str:
501
+ """从内容中提取标题"""
502
+ lines = content.split('\n')
503
+ for line in lines:
504
+ line = line.strip()
505
+ if line.startswith('#'):
506
+ # 移除 # 符号和前后空格
507
+ title = re.sub(r'^#+\s*', '', line)
508
+ title = title.strip()
509
+ if title:
510
+ return title
511
+
512
+ # 如果没有找到标题,使用前50个字符
513
+ if len(content) > 50:
514
+ return content[:50] + "..."
515
+ return content
516
+
517
+ def _get_base_name(self, filename: str) -> str:
518
+ """获取文件的基本名称(不包含扩展名)"""
519
+ if not filename or filename == "stdin":
520
+ return "stdin"
521
+
522
+ return Path(filename).stem
523
+
524
+ def _generate_temp_filename(self, base_name: str, index: int, total: int, content: str) -> str:
525
+ """生成临时文件名,基于内容MD5哈希"""
526
+ # 生成内容的MD5哈希(取前8位)
527
+ content_hash = hashlib.md5(content.encode('utf-8')).hexdigest()[:8]
528
+
529
+ if total == 1:
530
+ return f"{base_name}_{content_hash}.md"
531
+
532
+ return f"{base_name}_{index+1:02d}_{content_hash}.md"
533
+
534
+ def _sanitize_filename(self, title: str) -> str:
535
+ """清理文件名,移除不安全字符"""
536
+ # 移除或替换不安全的文件名字符
537
+ safe = re.sub(r'[<>:"/\\|?*\s]+', '_', title)
538
+
539
+ # 移除多余的下划线
540
+ safe = re.sub(r'_+', '_', safe)
541
+
542
+ # 移除开头和结尾的下划线
543
+ safe = safe.strip('_')
544
+
545
+ # 限制长度
546
+ if len(safe) > 50:
547
+ safe = safe[:50]
548
+
549
+ return safe.lower()
550
+
551
def validate_content(self, content: str) -> None:
    """Check that the Markdown content is not blank.

    Raises:
        ValueError: When ``content`` is empty or contains only whitespace.
    """
    if content.strip():
        return
    raise ValueError(get_message("content_empty"))
555
+
556
def get_document_info(self, doc: Document) -> str:
    """Return a one-line summary of a document.

    The summary lists the title (with a placeholder when empty), heading
    level, source file, 1-based part number, temporary file name, and a
    preview of the content limited to 100 characters plus ``"..."``.
    """
    body = doc.content
    preview = body if len(body) <= 100 else body[:100] + "..."
    title = doc.title or "无标题"

    return (f"标题: {title} (H{doc.heading_level}), 文件: {doc.original_file}, "
            f"部分: {doc.index+1}, 临时文件: {doc.temp_filename}, 内容预览: {preview}")
566
+
567
def set_split_mode(self, mode: SplitMode):
    """Select the splitting strategy used by ``process_content``."""
    self.split_mode = mode
570
+
571
def set_delimiter(self, delimiter: str):
    """Set a custom delimiter and switch to delimiter mode.

    An empty delimiter is ignored and leaves the processor unchanged.
    """
    if not delimiter:
        return
    self.delimiter = delimiter
    self.split_mode = SplitMode.DELIMITER
576
+
577
def set_heading_level_range(self, min_level: int, max_level: int):
    """Set the heading-level range consulted in ANY_HEADING mode.

    The range is applied only when ``1 <= min_level <= max_level <= 6``;
    any other combination is ignored.
    """
    if not (1 <= min_level <= max_level <= 6):
        return
    self.min_heading_level = min_level
    self.max_heading_level = max_level
582
+
583
def set_custom_splitter(self, splitter: Callable[[str], List[str]]):
    """Register a function that splits raw content into a list of strings."""
    config = self.config
    config.custom_splitter = splitter
586
+
587
def set_length_constraints(self, min_length: int, max_length: int):
    """Store the minimum and maximum document lengths in the configuration."""
    config = self.config
    config.min_length = min_length
    config.max_length = max_length
591
+
592
def set_overlap_size(self, size: int):
    """Store the overlap size used when long documents are split."""
    config = self.config
    config.overlap_size = size
595
+