cecli-dev 0.93.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (366) hide show
  1. cecli/__init__.py +20 -0
  2. cecli/__main__.py +4 -0
  3. cecli/_version.py +34 -0
  4. cecli/args.py +1092 -0
  5. cecli/args_formatter.py +228 -0
  6. cecli/change_tracker.py +133 -0
  7. cecli/coders/__init__.py +38 -0
  8. cecli/coders/agent_coder.py +1872 -0
  9. cecli/coders/architect_coder.py +63 -0
  10. cecli/coders/ask_coder.py +8 -0
  11. cecli/coders/base_coder.py +3993 -0
  12. cecli/coders/chat_chunks.py +116 -0
  13. cecli/coders/context_coder.py +52 -0
  14. cecli/coders/copypaste_coder.py +269 -0
  15. cecli/coders/editblock_coder.py +656 -0
  16. cecli/coders/editblock_fenced_coder.py +9 -0
  17. cecli/coders/editblock_func_coder.py +140 -0
  18. cecli/coders/editor_diff_fenced_coder.py +8 -0
  19. cecli/coders/editor_editblock_coder.py +8 -0
  20. cecli/coders/editor_whole_coder.py +8 -0
  21. cecli/coders/help_coder.py +15 -0
  22. cecli/coders/patch_coder.py +705 -0
  23. cecli/coders/search_replace.py +757 -0
  24. cecli/coders/shell.py +37 -0
  25. cecli/coders/single_wholefile_func_coder.py +101 -0
  26. cecli/coders/udiff_coder.py +428 -0
  27. cecli/coders/udiff_simple.py +12 -0
  28. cecli/coders/wholefile_coder.py +143 -0
  29. cecli/coders/wholefile_func_coder.py +133 -0
  30. cecli/commands/__init__.py +192 -0
  31. cecli/commands/add.py +226 -0
  32. cecli/commands/agent.py +51 -0
  33. cecli/commands/architect.py +46 -0
  34. cecli/commands/ask.py +44 -0
  35. cecli/commands/chat_mode.py +0 -0
  36. cecli/commands/clear.py +37 -0
  37. cecli/commands/code.py +46 -0
  38. cecli/commands/command_prefix.py +44 -0
  39. cecli/commands/commit.py +52 -0
  40. cecli/commands/context.py +47 -0
  41. cecli/commands/context_blocks.py +124 -0
  42. cecli/commands/context_management.py +51 -0
  43. cecli/commands/copy.py +62 -0
  44. cecli/commands/copy_context.py +81 -0
  45. cecli/commands/core.py +287 -0
  46. cecli/commands/diff.py +68 -0
  47. cecli/commands/drop.py +217 -0
  48. cecli/commands/editor.py +78 -0
  49. cecli/commands/exit.py +55 -0
  50. cecli/commands/git.py +57 -0
  51. cecli/commands/help.py +140 -0
  52. cecli/commands/history_search.py +40 -0
  53. cecli/commands/lint.py +109 -0
  54. cecli/commands/list_sessions.py +56 -0
  55. cecli/commands/load.py +85 -0
  56. cecli/commands/load_session.py +48 -0
  57. cecli/commands/load_skill.py +68 -0
  58. cecli/commands/ls.py +75 -0
  59. cecli/commands/map.py +37 -0
  60. cecli/commands/map_refresh.py +35 -0
  61. cecli/commands/model.py +118 -0
  62. cecli/commands/models.py +41 -0
  63. cecli/commands/multiline_mode.py +38 -0
  64. cecli/commands/paste.py +91 -0
  65. cecli/commands/quit.py +32 -0
  66. cecli/commands/read_only.py +267 -0
  67. cecli/commands/read_only_stub.py +270 -0
  68. cecli/commands/reasoning_effort.py +70 -0
  69. cecli/commands/remove_skill.py +68 -0
  70. cecli/commands/report.py +40 -0
  71. cecli/commands/reset.py +88 -0
  72. cecli/commands/run.py +99 -0
  73. cecli/commands/save.py +49 -0
  74. cecli/commands/save_session.py +43 -0
  75. cecli/commands/settings.py +69 -0
  76. cecli/commands/test.py +58 -0
  77. cecli/commands/think_tokens.py +74 -0
  78. cecli/commands/tokens.py +207 -0
  79. cecli/commands/undo.py +145 -0
  80. cecli/commands/utils/__init__.py +0 -0
  81. cecli/commands/utils/base_command.py +131 -0
  82. cecli/commands/utils/helpers.py +142 -0
  83. cecli/commands/utils/registry.py +53 -0
  84. cecli/commands/utils/save_load_manager.py +98 -0
  85. cecli/commands/voice.py +78 -0
  86. cecli/commands/weak_model.py +123 -0
  87. cecli/commands/web.py +87 -0
  88. cecli/deprecated_args.py +185 -0
  89. cecli/diffs.py +129 -0
  90. cecli/dump.py +29 -0
  91. cecli/editor.py +147 -0
  92. cecli/exceptions.py +115 -0
  93. cecli/format_settings.py +26 -0
  94. cecli/help.py +119 -0
  95. cecli/help_pats.py +19 -0
  96. cecli/helpers/__init__.py +9 -0
  97. cecli/helpers/copypaste.py +123 -0
  98. cecli/helpers/coroutines.py +8 -0
  99. cecli/helpers/file_searcher.py +142 -0
  100. cecli/helpers/model_providers.py +552 -0
  101. cecli/helpers/plugin_manager.py +81 -0
  102. cecli/helpers/profiler.py +162 -0
  103. cecli/helpers/requests.py +77 -0
  104. cecli/helpers/similarity.py +98 -0
  105. cecli/helpers/skills.py +577 -0
  106. cecli/history.py +186 -0
  107. cecli/io.py +1782 -0
  108. cecli/linter.py +304 -0
  109. cecli/llm.py +101 -0
  110. cecli/main.py +1280 -0
  111. cecli/mcp/__init__.py +154 -0
  112. cecli/mcp/oauth.py +250 -0
  113. cecli/mcp/server.py +278 -0
  114. cecli/mdstream.py +243 -0
  115. cecli/models.py +1255 -0
  116. cecli/onboarding.py +301 -0
  117. cecli/prompts/__init__.py +0 -0
  118. cecli/prompts/agent.yml +71 -0
  119. cecli/prompts/architect.yml +35 -0
  120. cecli/prompts/ask.yml +31 -0
  121. cecli/prompts/base.yml +99 -0
  122. cecli/prompts/context.yml +60 -0
  123. cecli/prompts/copypaste.yml +5 -0
  124. cecli/prompts/editblock.yml +143 -0
  125. cecli/prompts/editblock_fenced.yml +106 -0
  126. cecli/prompts/editblock_func.yml +25 -0
  127. cecli/prompts/editor_diff_fenced.yml +115 -0
  128. cecli/prompts/editor_editblock.yml +121 -0
  129. cecli/prompts/editor_whole.yml +46 -0
  130. cecli/prompts/help.yml +37 -0
  131. cecli/prompts/patch.yml +110 -0
  132. cecli/prompts/single_wholefile_func.yml +24 -0
  133. cecli/prompts/udiff.yml +106 -0
  134. cecli/prompts/udiff_simple.yml +13 -0
  135. cecli/prompts/utils/__init__.py +0 -0
  136. cecli/prompts/utils/prompt_registry.py +167 -0
  137. cecli/prompts/utils/system.py +56 -0
  138. cecli/prompts/wholefile.yml +50 -0
  139. cecli/prompts/wholefile_func.yml +24 -0
  140. cecli/queries/tree-sitter-language-pack/README.md +7 -0
  141. cecli/queries/tree-sitter-language-pack/arduino-tags.scm +5 -0
  142. cecli/queries/tree-sitter-language-pack/c-tags.scm +12 -0
  143. cecli/queries/tree-sitter-language-pack/chatito-tags.scm +16 -0
  144. cecli/queries/tree-sitter-language-pack/clojure-tags.scm +12 -0
  145. cecli/queries/tree-sitter-language-pack/commonlisp-tags.scm +127 -0
  146. cecli/queries/tree-sitter-language-pack/cpp-tags.scm +18 -0
  147. cecli/queries/tree-sitter-language-pack/csharp-tags.scm +32 -0
  148. cecli/queries/tree-sitter-language-pack/d-tags.scm +26 -0
  149. cecli/queries/tree-sitter-language-pack/dart-tags.scm +97 -0
  150. cecli/queries/tree-sitter-language-pack/elisp-tags.scm +5 -0
  151. cecli/queries/tree-sitter-language-pack/elixir-tags.scm +59 -0
  152. cecli/queries/tree-sitter-language-pack/elm-tags.scm +22 -0
  153. cecli/queries/tree-sitter-language-pack/gleam-tags.scm +41 -0
  154. cecli/queries/tree-sitter-language-pack/go-tags.scm +49 -0
  155. cecli/queries/tree-sitter-language-pack/java-tags.scm +26 -0
  156. cecli/queries/tree-sitter-language-pack/javascript-tags.scm +96 -0
  157. cecli/queries/tree-sitter-language-pack/lua-tags.scm +39 -0
  158. cecli/queries/tree-sitter-language-pack/matlab-tags.scm +10 -0
  159. cecli/queries/tree-sitter-language-pack/ocaml-tags.scm +115 -0
  160. cecli/queries/tree-sitter-language-pack/ocaml_interface-tags.scm +101 -0
  161. cecli/queries/tree-sitter-language-pack/pony-tags.scm +39 -0
  162. cecli/queries/tree-sitter-language-pack/properties-tags.scm +5 -0
  163. cecli/queries/tree-sitter-language-pack/python-tags.scm +24 -0
  164. cecli/queries/tree-sitter-language-pack/r-tags.scm +27 -0
  165. cecli/queries/tree-sitter-language-pack/racket-tags.scm +12 -0
  166. cecli/queries/tree-sitter-language-pack/ruby-tags.scm +69 -0
  167. cecli/queries/tree-sitter-language-pack/rust-tags.scm +63 -0
  168. cecli/queries/tree-sitter-language-pack/solidity-tags.scm +43 -0
  169. cecli/queries/tree-sitter-language-pack/swift-tags.scm +54 -0
  170. cecli/queries/tree-sitter-language-pack/udev-tags.scm +20 -0
  171. cecli/queries/tree-sitter-languages/README.md +24 -0
  172. cecli/queries/tree-sitter-languages/c-tags.scm +12 -0
  173. cecli/queries/tree-sitter-languages/c_sharp-tags.scm +52 -0
  174. cecli/queries/tree-sitter-languages/cpp-tags.scm +18 -0
  175. cecli/queries/tree-sitter-languages/dart-tags.scm +92 -0
  176. cecli/queries/tree-sitter-languages/elisp-tags.scm +8 -0
  177. cecli/queries/tree-sitter-languages/elixir-tags.scm +59 -0
  178. cecli/queries/tree-sitter-languages/elm-tags.scm +22 -0
  179. cecli/queries/tree-sitter-languages/fortran-tags.scm +18 -0
  180. cecli/queries/tree-sitter-languages/go-tags.scm +36 -0
  181. cecli/queries/tree-sitter-languages/haskell-tags.scm +5 -0
  182. cecli/queries/tree-sitter-languages/hcl-tags.scm +77 -0
  183. cecli/queries/tree-sitter-languages/java-tags.scm +26 -0
  184. cecli/queries/tree-sitter-languages/javascript-tags.scm +96 -0
  185. cecli/queries/tree-sitter-languages/julia-tags.scm +60 -0
  186. cecli/queries/tree-sitter-languages/kotlin-tags.scm +30 -0
  187. cecli/queries/tree-sitter-languages/matlab-tags.scm +10 -0
  188. cecli/queries/tree-sitter-languages/ocaml-tags.scm +115 -0
  189. cecli/queries/tree-sitter-languages/ocaml_interface-tags.scm +104 -0
  190. cecli/queries/tree-sitter-languages/php-tags.scm +32 -0
  191. cecli/queries/tree-sitter-languages/python-tags.scm +22 -0
  192. cecli/queries/tree-sitter-languages/ql-tags.scm +26 -0
  193. cecli/queries/tree-sitter-languages/ruby-tags.scm +69 -0
  194. cecli/queries/tree-sitter-languages/rust-tags.scm +63 -0
  195. cecli/queries/tree-sitter-languages/scala-tags.scm +64 -0
  196. cecli/queries/tree-sitter-languages/typescript-tags.scm +44 -0
  197. cecli/queries/tree-sitter-languages/zig-tags.scm +20 -0
  198. cecli/reasoning_tags.py +82 -0
  199. cecli/repo.py +626 -0
  200. cecli/repomap.py +1368 -0
  201. cecli/report.py +260 -0
  202. cecli/resources/__init__.py +3 -0
  203. cecli/resources/model-metadata.json +25751 -0
  204. cecli/resources/model-settings.yml +2394 -0
  205. cecli/resources/providers.json +67 -0
  206. cecli/run_cmd.py +143 -0
  207. cecli/scrape.py +295 -0
  208. cecli/sendchat.py +250 -0
  209. cecli/sessions.py +281 -0
  210. cecli/special.py +203 -0
  211. cecli/tools/__init__.py +72 -0
  212. cecli/tools/command.py +103 -0
  213. cecli/tools/command_interactive.py +113 -0
  214. cecli/tools/context_manager.py +175 -0
  215. cecli/tools/delete_block.py +154 -0
  216. cecli/tools/delete_line.py +120 -0
  217. cecli/tools/delete_lines.py +144 -0
  218. cecli/tools/extract_lines.py +281 -0
  219. cecli/tools/finished.py +35 -0
  220. cecli/tools/git_branch.py +132 -0
  221. cecli/tools/git_diff.py +49 -0
  222. cecli/tools/git_log.py +43 -0
  223. cecli/tools/git_remote.py +39 -0
  224. cecli/tools/git_show.py +37 -0
  225. cecli/tools/git_status.py +32 -0
  226. cecli/tools/grep.py +242 -0
  227. cecli/tools/indent_lines.py +195 -0
  228. cecli/tools/insert_block.py +263 -0
  229. cecli/tools/list_changes.py +71 -0
  230. cecli/tools/load_skill.py +51 -0
  231. cecli/tools/ls.py +77 -0
  232. cecli/tools/remove_skill.py +51 -0
  233. cecli/tools/replace_all.py +113 -0
  234. cecli/tools/replace_line.py +135 -0
  235. cecli/tools/replace_lines.py +180 -0
  236. cecli/tools/replace_text.py +186 -0
  237. cecli/tools/show_numbered_context.py +137 -0
  238. cecli/tools/thinking.py +52 -0
  239. cecli/tools/undo_change.py +82 -0
  240. cecli/tools/update_todo_list.py +148 -0
  241. cecli/tools/utils/base_tool.py +64 -0
  242. cecli/tools/utils/helpers.py +359 -0
  243. cecli/tools/utils/output.py +119 -0
  244. cecli/tools/utils/registry.py +145 -0
  245. cecli/tools/view_files_matching.py +138 -0
  246. cecli/tools/view_files_with_symbol.py +117 -0
  247. cecli/tui/__init__.py +83 -0
  248. cecli/tui/app.py +971 -0
  249. cecli/tui/io.py +566 -0
  250. cecli/tui/styles.tcss +117 -0
  251. cecli/tui/widgets/__init__.py +19 -0
  252. cecli/tui/widgets/completion_bar.py +331 -0
  253. cecli/tui/widgets/file_list.py +76 -0
  254. cecli/tui/widgets/footer.py +165 -0
  255. cecli/tui/widgets/input_area.py +320 -0
  256. cecli/tui/widgets/key_hints.py +16 -0
  257. cecli/tui/widgets/output.py +354 -0
  258. cecli/tui/widgets/status_bar.py +279 -0
  259. cecli/tui/worker.py +160 -0
  260. cecli/urls.py +16 -0
  261. cecli/utils.py +499 -0
  262. cecli/versioncheck.py +90 -0
  263. cecli/voice.py +90 -0
  264. cecli/waiting.py +38 -0
  265. cecli/watch.py +316 -0
  266. cecli/watch_prompts.py +12 -0
  267. cecli/website/Gemfile +8 -0
  268. cecli/website/_includes/blame.md +162 -0
  269. cecli/website/_includes/get-started.md +22 -0
  270. cecli/website/_includes/help-tip.md +5 -0
  271. cecli/website/_includes/help.md +24 -0
  272. cecli/website/_includes/install.md +5 -0
  273. cecli/website/_includes/keys.md +4 -0
  274. cecli/website/_includes/model-warnings.md +67 -0
  275. cecli/website/_includes/multi-line.md +22 -0
  276. cecli/website/_includes/python-m-aider.md +5 -0
  277. cecli/website/_includes/recording.css +228 -0
  278. cecli/website/_includes/recording.md +34 -0
  279. cecli/website/_includes/replit-pipx.md +9 -0
  280. cecli/website/_includes/works-best.md +1 -0
  281. cecli/website/_sass/custom/custom.scss +103 -0
  282. cecli/website/docs/config/adv-model-settings.md +2498 -0
  283. cecli/website/docs/config/agent-mode.md +320 -0
  284. cecli/website/docs/config/aider_conf.md +548 -0
  285. cecli/website/docs/config/api-keys.md +90 -0
  286. cecli/website/docs/config/custom-commands.md +187 -0
  287. cecli/website/docs/config/dotenv.md +493 -0
  288. cecli/website/docs/config/editor.md +127 -0
  289. cecli/website/docs/config/mcp.md +210 -0
  290. cecli/website/docs/config/model-aliases.md +173 -0
  291. cecli/website/docs/config/options.md +890 -0
  292. cecli/website/docs/config/reasoning.md +210 -0
  293. cecli/website/docs/config/skills.md +172 -0
  294. cecli/website/docs/config/tui.md +126 -0
  295. cecli/website/docs/config.md +44 -0
  296. cecli/website/docs/faq.md +379 -0
  297. cecli/website/docs/git.md +76 -0
  298. cecli/website/docs/index.md +47 -0
  299. cecli/website/docs/install/codespaces.md +39 -0
  300. cecli/website/docs/install/docker.md +48 -0
  301. cecli/website/docs/install/optional.md +100 -0
  302. cecli/website/docs/install/replit.md +8 -0
  303. cecli/website/docs/install.md +115 -0
  304. cecli/website/docs/languages.md +264 -0
  305. cecli/website/docs/legal/contributor-agreement.md +111 -0
  306. cecli/website/docs/legal/privacy.md +104 -0
  307. cecli/website/docs/llms/anthropic.md +77 -0
  308. cecli/website/docs/llms/azure.md +48 -0
  309. cecli/website/docs/llms/bedrock.md +132 -0
  310. cecli/website/docs/llms/cohere.md +34 -0
  311. cecli/website/docs/llms/deepseek.md +32 -0
  312. cecli/website/docs/llms/gemini.md +49 -0
  313. cecli/website/docs/llms/github.md +111 -0
  314. cecli/website/docs/llms/groq.md +36 -0
  315. cecli/website/docs/llms/lm-studio.md +39 -0
  316. cecli/website/docs/llms/ollama.md +75 -0
  317. cecli/website/docs/llms/openai-compat.md +39 -0
  318. cecli/website/docs/llms/openai.md +58 -0
  319. cecli/website/docs/llms/openrouter.md +78 -0
  320. cecli/website/docs/llms/other.md +117 -0
  321. cecli/website/docs/llms/vertex.md +50 -0
  322. cecli/website/docs/llms/warnings.md +10 -0
  323. cecli/website/docs/llms/xai.md +53 -0
  324. cecli/website/docs/llms.md +54 -0
  325. cecli/website/docs/more/analytics.md +127 -0
  326. cecli/website/docs/more/edit-formats.md +116 -0
  327. cecli/website/docs/more/infinite-output.md +192 -0
  328. cecli/website/docs/more-info.md +8 -0
  329. cecli/website/docs/recordings/auto-accept-architect.md +31 -0
  330. cecli/website/docs/recordings/dont-drop-original-read-files.md +35 -0
  331. cecli/website/docs/recordings/index.md +21 -0
  332. cecli/website/docs/recordings/model-accepts-settings.md +69 -0
  333. cecli/website/docs/recordings/tree-sitter-language-pack.md +80 -0
  334. cecli/website/docs/repomap.md +112 -0
  335. cecli/website/docs/scripting.md +100 -0
  336. cecli/website/docs/sessions.md +213 -0
  337. cecli/website/docs/troubleshooting/aider-not-found.md +24 -0
  338. cecli/website/docs/troubleshooting/edit-errors.md +76 -0
  339. cecli/website/docs/troubleshooting/imports.md +62 -0
  340. cecli/website/docs/troubleshooting/models-and-keys.md +54 -0
  341. cecli/website/docs/troubleshooting/support.md +79 -0
  342. cecli/website/docs/troubleshooting/token-limits.md +96 -0
  343. cecli/website/docs/troubleshooting/warnings.md +12 -0
  344. cecli/website/docs/troubleshooting.md +11 -0
  345. cecli/website/docs/usage/browser.md +57 -0
  346. cecli/website/docs/usage/caching.md +49 -0
  347. cecli/website/docs/usage/commands.md +133 -0
  348. cecli/website/docs/usage/conventions.md +119 -0
  349. cecli/website/docs/usage/copypaste.md +136 -0
  350. cecli/website/docs/usage/images-urls.md +48 -0
  351. cecli/website/docs/usage/lint-test.md +118 -0
  352. cecli/website/docs/usage/modes.md +211 -0
  353. cecli/website/docs/usage/not-code.md +179 -0
  354. cecli/website/docs/usage/notifications.md +87 -0
  355. cecli/website/docs/usage/tips.md +79 -0
  356. cecli/website/docs/usage/tutorials.md +30 -0
  357. cecli/website/docs/usage/voice.md +121 -0
  358. cecli/website/docs/usage/watch.md +294 -0
  359. cecli/website/docs/usage.md +102 -0
  360. cecli/website/share/index.md +101 -0
  361. cecli_dev-0.93.1.dist-info/METADATA +549 -0
  362. cecli_dev-0.93.1.dist-info/RECORD +366 -0
  363. cecli_dev-0.93.1.dist-info/WHEEL +5 -0
  364. cecli_dev-0.93.1.dist-info/entry_points.txt +4 -0
  365. cecli_dev-0.93.1.dist-info/licenses/LICENSE.txt +202 -0
  366. cecli_dev-0.93.1.dist-info/top_level.txt +1 -0
cecli/repomap.py ADDED
@@ -0,0 +1,1368 @@
1
+ import math
2
+ import os
3
+ import re
4
+ import shutil
5
+ import sqlite3
6
+ import sys
7
+ import time
8
+ import warnings
9
+ from collections import defaultdict, namedtuple
10
+ from importlib import resources
11
+ from pathlib import Path
12
+
13
+ import tree_sitter
14
+ from diskcache import Cache
15
+ from grep_ast import TreeContext, filename_to_lang
16
+ from pygments.lexers import guess_lexer_for_filename
17
+ from pygments.token import Token
18
+
19
+ from cecli.dump import dump
20
+ from cecli.helpers.similarity import (
21
+ cosine_similarity,
22
+ create_bigram_vector,
23
+ normalize_vector,
24
+ )
25
+ from cecli.special import filter_important_files
26
+ from cecli.tools.utils.helpers import ToolError
27
+
28
+ # tree_sitter is throwing a FutureWarning
29
+ warnings.simplefilter("ignore", category=FutureWarning)
30
+ from grep_ast.tsl import USING_TSL_PACK, get_language, get_parser # noqa: E402
31
+
32
+
33
# Tag records carry defaults for the trailing optional fields so that cache
# entries pickled under the old (shorter) namedtuple definition still load.
class TagBase(
    namedtuple(
        "TagBase",
        "rel_fname fname line name kind specific_kind start_line end_line start_byte end_byte",
    )
):
    """One code tag (a definition or reference) extracted from a source file."""

    __slots__ = ()

    def __new__(cls, rel_fname, fname, line, name, kind,
                specific_kind=None, start_line=None, end_line=None,
                start_byte=None, end_byte=None):
        # Old cached objects may omit the trailing fields; defaulting them to
        # None keeps those entries constructible.
        return super().__new__(cls, rel_fname, fname, line, name, kind,
                               specific_kind, start_line, end_line,
                               start_byte, end_byte)


# Public alias used throughout the module.
Tag = TagBase
73
+
74
+
75
# Exceptions that indicate a broken or unusable on-disk tags cache.
SQLITE_ERRORS = (sqlite3.OperationalError, sqlite3.DatabaseError, OSError)

# Bumping the version invalidates previously written tag caches; the
# tree-sitter language pack gets its own cache version.
CACHE_VERSION = 9 if USING_TSL_PACK else 7

UPDATING_REPO_MAP_MESSAGE = "Updating repo map"
83
+
84
+
85
class RepoMap:
    """Builds a ranked symbol map of the repository for use as LLM context."""

    # Versioned cache directory: bumping CACHE_VERSION invalidates stale caches.
    TAGS_CACHE_DIR = f".cecli/tags.cache.v{CACHE_VERSION}"

    # Files already warned about; class-level, so shared across instances.
    warned_files = set()

    # Class variable to store initial ranked tags results
    _initial_ranked_tags = None
    _initial_ident_to_files = None

    # Define kinds that typically represent definitions across languages
    # Used by AgentCoder to filter tags for the symbol outline
    definition_kinds = {
        "class",
        "struct",
        "enum",
        "interface",
        "trait",  # Structure definitions
        "function",
        "method",
        "constructor",  # Function/method definitions
        "module",
        "namespace",  # Module/namespace definitions
        "constant",
        "variable",  # Top-level/class variable definitions (consider refining)
        "type",  # Type definitions
        # Add more based on tree-sitter queries if needed
    }
112
+
113
+ @staticmethod
114
+ def get_file_stub(fname, io):
115
+ """Generate a complete structural outline of a source code file.
116
+
117
+ Args:
118
+ fname (str): Absolute path to the source file
119
+ io: InputOutput instance for file operations
120
+
121
+ Returns:
122
+ str: Formatted outline showing the file's structure
123
+ """
124
+ # Use cached instance if available
125
+ if not hasattr(RepoMap, "_stub_instance"):
126
+ RepoMap._stub_instance = RepoMap(map_tokens=0, io=io)
127
+
128
+ rm = RepoMap._stub_instance
129
+
130
+ rel_fname = rm.get_rel_fname(fname)
131
+
132
+ # Reuse existing tag parsing
133
+ tags = rm.get_tags(fname, rel_fname)
134
+ if not tags:
135
+ return "# No outline available"
136
+
137
+ # Get all definition lines
138
+ lois = [tag.line for tag in tags if tag.kind == "def"]
139
+
140
+ # Reuse existing tree rendering
141
+ outline = rm.render_tree(fname, rel_fname, lois)
142
+
143
+ return f"{outline}"
144
+
145
+ def __init__(
146
+ self,
147
+ map_tokens=1024,
148
+ map_cache_dir=".",
149
+ main_model=None,
150
+ io=None,
151
+ repo_content_prefix=None,
152
+ verbose=False,
153
+ max_context_window=None,
154
+ map_mul_no_files=8,
155
+ refresh="auto",
156
+ max_code_line_length=100,
157
+ repo_root=None,
158
+ use_memory_cache=False,
159
+ use_enhanced_map=False,
160
+ ):
161
+ self.io = io
162
+ self.verbose = verbose
163
+ self.refresh = refresh
164
+ self.use_enhanced_map = use_enhanced_map
165
+
166
+ self.map_cache_dir = map_cache_dir
167
+ # Prefer an explicit repo root (eg per-test repo), fallback to CWD
168
+ self.root = repo_root or os.getcwd()
169
+
170
+ # Allow opting into an in-memory tags cache to avoid disk/SQLite locks
171
+ if use_memory_cache:
172
+ self.TAGS_CACHE = dict()
173
+ else:
174
+ self.load_tags_cache()
175
+ self.cache_threshold = 0.95
176
+
177
+ self.max_map_tokens = map_tokens
178
+ self.map_mul_no_files = map_mul_no_files
179
+ self.max_context_window = max_context_window
180
+
181
+ self.max_code_line_length = max_code_line_length
182
+
183
+ self.repo_content_prefix = repo_content_prefix
184
+
185
+ self.main_model = main_model
186
+
187
+ self.tree_cache = {}
188
+ self.tree_context_cache = {}
189
+ self.map_cache = {}
190
+ self.map_processing_time = 0
191
+ self.last_map = None
192
+
193
+ # Initialize cache for mentioned identifiers similarity
194
+ self._last_mentioned_idents = None
195
+ self._last_mentioned_idents_vector = None
196
+ self._has_last_mentioned_idents = False
197
+ self._mentioned_ident_similarity = 0.8
198
+
199
+ if self.verbose:
200
+ self.io.tool_output(f"RepoMap loaded entries from tags cache: {len(self.TAGS_CACHE)}")
201
+ self.io.tool_output(
202
+ f"RepoMap initialized with map_mul_no_files: {self.map_mul_no_files}"
203
+ )
204
+ self.io.tool_output(f"RepoMap initialized with map_cache_dir: {self.map_cache_dir}")
205
+ self.io.tool_output(f"RepoMap assumes repo root is: {self.root}")
206
+
207
+ def token_count(self, text):
208
+ len_text = len(text)
209
+ if len_text < 200:
210
+ return self.main_model.token_count(text)
211
+
212
+ lines = text.splitlines(keepends=True)
213
+ num_lines = len(lines)
214
+ step = num_lines // 100 or 1
215
+ lines = lines[::step]
216
+ sample_text = "".join(lines)
217
+ sample_tokens = self.main_model.token_count(sample_text)
218
+ est_tokens = sample_tokens / len(sample_text) * len_text
219
+ return est_tokens
220
+
221
+ def get_repo_map(
222
+ self,
223
+ chat_files,
224
+ other_files,
225
+ mentioned_fnames=None,
226
+ mentioned_idents=None,
227
+ force_refresh=False,
228
+ ):
229
+ if self.max_map_tokens <= 0:
230
+ return
231
+ if not other_files:
232
+ return
233
+ if not mentioned_fnames:
234
+ mentioned_fnames = set()
235
+ if not mentioned_idents:
236
+ mentioned_idents = set()
237
+
238
+ max_map_tokens = self.max_map_tokens
239
+
240
+ # With no files in the chat, give a bigger view of the entire repo
241
+ padding = 4096
242
+ if max_map_tokens and self.max_context_window:
243
+ target = min(
244
+ int(max_map_tokens * self.map_mul_no_files),
245
+ self.max_context_window - padding,
246
+ )
247
+ else:
248
+ target = 0
249
+ if not chat_files and self.max_context_window and target > 0:
250
+ max_map_tokens = target
251
+
252
+ try:
253
+ files_listing = self.get_ranked_tags_map(
254
+ chat_files,
255
+ other_files,
256
+ max_map_tokens,
257
+ mentioned_fnames,
258
+ mentioned_idents,
259
+ force_refresh,
260
+ )
261
+ except RecursionError:
262
+ self.io.tool_error("Disabling repo map, git repo too large?")
263
+ self.max_map_tokens = 0
264
+ return
265
+
266
+ if not files_listing:
267
+ return
268
+
269
+ if self.verbose:
270
+ num_tokens = self.token_count(files_listing)
271
+ self.io.tool_output(f"Repo-map: {num_tokens / 1024:.1f} k-tokens")
272
+
273
+ if chat_files:
274
+ other = "other "
275
+ else:
276
+ other = ""
277
+
278
+ if self.repo_content_prefix:
279
+ repo_content = self.repo_content_prefix.format(other=other)
280
+ else:
281
+ repo_content = ""
282
+
283
+ repo_content += files_listing
284
+
285
+ return repo_content
286
+
287
+ def get_rel_fname(self, fname):
288
+ try:
289
+ return os.path.relpath(fname, self.root)
290
+ except ValueError:
291
+ # Issue #1288: ValueError: path is on mount 'C:', start on mount 'D:'
292
+ # Just return the full fname.
293
+ return fname
294
+
295
+ def tags_cache_error(self, original_error=None):
296
+ """Handle SQLite errors by trying to recreate cache, falling back to dict if needed"""
297
+
298
+ if self.verbose and original_error:
299
+ self.io.tool_warning(f"Tags cache error: {str(original_error)}")
300
+
301
+ if isinstance(getattr(self, "TAGS_CACHE", None), dict):
302
+ return
303
+
304
+ path = Path(self.map_cache_dir) / self.TAGS_CACHE_DIR
305
+
306
+ # Try to recreate the cache
307
+ try:
308
+ # Delete existing cache dir
309
+ if path.exists():
310
+ shutil.rmtree(path)
311
+
312
+ # Try to create new cache
313
+ new_cache = Cache(path)
314
+
315
+ # Test that it works
316
+ test_key = "test"
317
+ new_cache[test_key] = "test"
318
+ _ = new_cache[test_key]
319
+ del new_cache[test_key]
320
+
321
+ # If we got here, the new cache works
322
+ self.TAGS_CACHE = new_cache
323
+ return
324
+
325
+ except SQLITE_ERRORS as e:
326
+ # If anything goes wrong, warn and fall back to dict
327
+ self.io.tool_warning(
328
+ f"Unable to use tags cache at {path}, falling back to memory cache"
329
+ )
330
+ if self.verbose:
331
+ self.io.tool_warning(f"Cache recreation error: {str(e)}")
332
+
333
+ self.TAGS_CACHE = dict()
334
+
335
+ def load_tags_cache(self):
336
+ path = Path(self.map_cache_dir) / self.TAGS_CACHE_DIR
337
+ try:
338
+ self.TAGS_CACHE = Cache(path)
339
+ except SQLITE_ERRORS as e:
340
+ self.tags_cache_error(e)
341
+
342
    def save_tags_cache(self):
        # Intentional no-op: the diskcache backend persists entries as they are
        # written, so there is nothing to flush. Kept as an explicit hook so
        # callers have a stable API if an eager-save backend is added later.
        pass
344
+
345
+ def get_mtime(self, fname):
346
+ try:
347
+ return os.path.getmtime(fname)
348
+ except FileNotFoundError:
349
+ self.io.tool_warning(f"File not found error: {fname}")
350
+
351
    def _compute_file_summary(self, tags, rel_fname):
        """Compute file-level summary from tags.

        Args:
            tags: Iterable of Tag records for one file.
            rel_fname: Repo-relative filename (currently unused here).

        Returns:
            dict with "defines" (set), "references" (name -> count dict),
            and "imports" (set).
        """
        defines = set()
        references = defaultdict(int)
        imports = set()

        for tag in tags:
            if tag.kind == "def":
                defines.add(tag.name)
            elif tag.kind == "ref":
                references[tag.name] += 1
            # NOTE(review): in the flattened source the nesting of this check
            # is ambiguous; reconstructed at loop level so any tag whose
            # specific_kind is "import" is counted, regardless of kind --
            # confirm against the original formatting.
            if tag.specific_kind == "import":
                imports.add(tag.name)

        return {"defines": defines, "references": dict(references), "imports": imports}
366
+
367
    def _get_cached_summary(self, fname, file_mtime):
        """Get cached summary for a file if available and up-to-date.

        Args:
            fname: Absolute path used as the cache key.
            file_mtime: Current mtime; a cached entry must match it exactly.

        Returns:
            The summary dict, or None on a cache miss / stale entry.
        """
        cache_key = fname
        try:
            val = self.TAGS_CACHE.get(cache_key)  # Issue #1308
        except SQLITE_ERRORS as e:
            # Repair the cache (or fall back to a dict) and retry once.
            self.tags_cache_error(e)
            val = self.TAGS_CACHE.get(cache_key)

        if val is not None and val.get("mtime") == file_mtime:
            # Handle backward compatibility: old cache entries won't have "summary"
            summary = val.get("summary")
            if summary is None:
                # Compute summary from cached data
                data = val.get("data")
                if data is not None:
                    rel_fname = self.get_rel_fname(fname)
                    summary = self._compute_file_summary(data, rel_fname)
                    # Update cache with summary for future use
                    val["summary"] = summary
                    self.TAGS_CACHE[cache_key] = val
            return summary
        return None
390
+
391
    def get_tags(self, fname, rel_fname):
        """Return the Tag list for *fname*, served from cache when fresh.

        On a cache hit (matching mtime) the cached tags are returned; SQLite
        errors trigger a cache repair and one retry, and malformed old cache
        entries force a refresh. On a miss the file is re-parsed and the cache
        entry (tags + summary) is rewritten.
        """
        # Check if the file is in the cache and if the modification time has not changed
        file_mtime = self.get_mtime(fname)
        if file_mtime is None:
            # File vanished; nothing to tag.
            return []

        cache_key = fname
        try:
            val = self.TAGS_CACHE.get(cache_key)  # Issue #1308
        except SQLITE_ERRORS as e:
            # Repair the cache (or fall back to a dict) and retry once.
            self.tags_cache_error(e)
            val = self.TAGS_CACHE.get(cache_key)

        if val is not None and val.get("mtime") == file_mtime:
            try:
                # Get the cached data
                data = self.TAGS_CACHE[cache_key]["data"]

                # Let our Tag class handle compatibility with old cache formats
                # No need for special handling as TagBase.__new__ will supply default specific_kind

                return data
            except SQLITE_ERRORS as e:
                self.tags_cache_error(e)
                return self.TAGS_CACHE[cache_key]["data"]
            except (TypeError, AttributeError) as e:
                # If we hit an error related to missing fields in old cached Tag objects,
                # force a cache refresh for this file
                if self.verbose:
                    self.io.tool_warning(f"Cache format error for {fname}, refreshing: {e}")
                # Return empty list to trigger cache refresh
                return []

        # miss!
        data = list(self.get_tags_raw(fname, rel_fname))

        # Compute file summary
        summary = self._compute_file_summary(data, rel_fname)

        # Update the cache
        try:
            self.TAGS_CACHE[cache_key] = {"mtime": file_mtime, "data": data, "summary": summary}
            self.save_tags_cache()
        except SQLITE_ERRORS as e:
            # Repair and retry the write once before giving up.
            self.tags_cache_error(e)
            self.TAGS_CACHE[cache_key] = {"mtime": file_mtime, "data": data, "summary": summary}

        return data
439
+
440
    def get_symbol_definition_location(self, file_path, symbol_name):
        """
        Finds the unique definition location (start/end line) for a symbol in a file.

        Args:
            file_path (str): The relative path to the file.
            symbol_name (str): The name of the symbol to find.

        Returns:
            tuple: (start_line, end_line) (0-based) if a unique definition is found.

        Raises:
            ToolError: If the symbol is not found, not unique, or not a definition.
        """
        abs_path = self.io.root_abs_path(file_path)  # Assuming io has this helper or similar
        rel_path = self.get_rel_fname(abs_path)  # Ensure we use consistent relative path

        tags = self.get_tags(abs_path, rel_path)
        if not tags:
            raise ToolError(f"Symbol '{symbol_name}' not found in '{file_path}' (no tags).")

        definitions = []
        for tag in tags:
            # Check if it's a definition and the name matches
            if tag.kind == "def" and tag.name == symbol_name:
                # Ensure we have valid location info
                if tag.start_line is not None and tag.end_line is not None and tag.start_line >= 0:
                    definitions.append(tag)

        if not definitions:
            # Check if it exists as a non-definition tag
            non_defs = [tag for tag in tags if tag.name == symbol_name and tag.kind != "def"]
            if non_defs:
                raise ToolError(
                    f"Symbol '{symbol_name}' found in '{file_path}', but not as a unique definition"
                    f" (found as {non_defs[0].kind})."
                )
            else:
                raise ToolError(f"Symbol '{symbol_name}' definition not found in '{file_path}'.")

        if len(definitions) > 1:
            # Provide more context about ambiguity if possible
            lines = sorted([d.start_line + 1 for d in definitions])  # 1-based for user message
            raise ToolError(
                f"Symbol '{symbol_name}' is ambiguous in '{file_path}'. Found definitions on lines:"
                f" {', '.join(map(str, lines))}."
            )

        # Unique definition found
        definition_tag = definitions[0]
        return definition_tag.start_line, definition_tag.end_line
492
+
493
def shared_path_components(self, path1_str, path2_str):
    """
    Distance between two paths based on shared leading components.

    Computed as len(p1) + len(p2) - 2 * shared, so identical paths score 0
    and totally unrelated paths score the sum of their lengths.
    Lower is closer.
    """
    parts_a = Path(path1_str).parts
    parts_b = Path(path2_str).parts

    # Count how many leading components the two paths have in common.
    shared = 0
    for left, right in zip(parts_a, parts_b):
        if left != right:
            break
        shared += 1

    return len(parts_a) + len(parts_b) - 2 * shared
513
+
514
def check_import_match(self, definer, imports):
    """
    Decide whether any import string plausibly refers to *definer*.

    Each import is split on '.', '/' and '\\' and compared as a contiguous
    sub-sequence of the definer's path parts (file extension stripped).
    A suffix match always counts (standard module aliasing); a match in the
    middle counts only when the import has at least two parts.
    """
    parts = list(Path(definer).parts)
    if not parts:
        return False

    # Strip the extension from the final path component.
    parts[-1] = os.path.splitext(parts[-1])[0]

    for imp in imports:
        pieces = [piece for piece in re.split(r"[.\\/]", imp) if piece]
        if len(pieces) > len(parts):
            continue

        # Slide the import over the definer's parts looking for a match.
        for start in range(len(parts) - len(pieces) + 1):
            if parts[start : start + len(pieces)] != pieces:
                continue
            # Suffix match: standard aliasing.
            if start + len(pieces) == len(parts):
                return True
            # Partial/middle match: require enough specificity (>= 2 parts).
            if len(pieces) >= 2:
                return True
    return False
540
+
541
def get_tags_raw(self, fname, rel_fname):
    """
    Parse *fname* with tree-sitter and yield Tag records for every
    definition and reference captured by the language's tags query.

    Yields nothing (returns early) when the language is unknown, the
    parser/query is unavailable, or the file is empty/unreadable.
    When the query produced defs but no refs, falls back to pygments
    to backfill reference tags (with no location info).
    """
    lang = filename_to_lang(fname)
    if not lang:
        return

    try:
        language = get_language(lang)
        parser = get_parser(lang)
    except Exception as err:
        # Best-effort: unsupported/broken grammars just skip the file.
        if self.verbose:
            print(f"Skipping file {fname}: {err}")
        return

    query_scm = get_scm_fname(lang)
    if not query_scm.exists():
        return
    query_scm = query_scm.read_text()

    code = self.io.read_text(fname)
    if not code:
        return
    tree = parser.parse(bytes(code, "utf-8"))

    # Run the tags queries
    # NOTE(review): this selects the tree-sitter query API by *Python*
    # version; the Query/QueryCursor API presumably depends on the
    # tree-sitter package version instead — confirm this gate is intended.
    if sys.version_info >= (3, 10):
        query = tree_sitter.Query(language, query_scm)
        cursor = tree_sitter.QueryCursor(query)
        captures = cursor.captures(tree.root_node)
    else:
        query = language.query(query_scm)
        captures = query.captures(tree.root_node)

    saw = set()
    # The TSL pack returns {tag_name: [nodes]}; the legacy API returns
    # an iterable of (node, tag_name) pairs. Normalize both shapes.
    if USING_TSL_PACK:
        all_nodes = []
        for tag, nodes in captures.items():
            all_nodes += [(node, tag) for node in nodes]
    else:
        all_nodes = list(captures)

    for node, tag in all_nodes:
        if tag.startswith("name.definition."):
            kind = "def"
        elif tag.startswith("name.reference."):
            kind = "ref"
        else:
            continue

        saw.add(kind)

        # Extract specific kind from the tag, e.g., 'function' from 'name.definition.function'
        specific_kind = tag.split(".")[-1] if "." in tag else None

        result = Tag(
            rel_fname=rel_fname,
            fname=fname,
            name=node.text.decode("utf-8"),
            kind=kind,
            specific_kind=specific_kind,
            line=node.start_point[0],  # Legacy line number
            start_line=node.start_point[0],
            end_line=node.end_point[0],
            start_byte=node.start_byte,
            end_byte=node.end_byte,
        )

        yield result

    if "ref" in saw:
        return
    if "def" not in saw:
        return

    # We saw defs, without any refs
    # Some tags files only provide defs (cpp, for example)
    # Use pygments to backfill refs

    try:
        lexer = guess_lexer_for_filename(fname, code)
    except Exception:  # On Windows, bad ref to time.clock which is deprecated?
        # self.io.tool_error(f"Error lexing {fname}")
        return

    tokens = list(lexer.get_tokens(code))
    tokens = [token[1] for token in tokens if token[0] in Token.Name]

    for token in tokens:
        yield Tag(
            rel_fname=rel_fname,
            fname=fname,
            name=token,
            kind="ref",
            specific_kind="name",  # Default for pygments fallback
            line=-1,  # Pygments doesn't give precise locations easily
            start_line=-1,
            end_line=-1,
            start_byte=-1,
            end_byte=-1,
        )
640
+
641
def get_ranked_tags(
    self, chat_fnames, other_fnames, mentioned_fnames, mentioned_idents, progress=True
):
    """
    Rank repo symbols by building a file-dependency graph and running
    PageRank over it.

    Phases: (1) scan every file, collecting defines/references/imports
    (from cached summaries when available); (2) build a directed graph
    with referencer -> definer edges weighted by identifier heuristics
    and path proximity; (3) run PageRank (personalized toward chat /
    mentioned files); (4) distribute each node's rank across its out
    edges and emit Tag objects sorted by accumulated rank, followed by
    bare (fname,) entries for files without ranked tags.
    """
    import rustworkx

    defines = defaultdict(set)
    references = defaultdict(lambda: defaultdict(int))
    total_ref_count = defaultdict(int)  # Track total references per identifier
    definitions = defaultdict(set)
    file_imports = defaultdict(set)
    import_ast_mode = False

    personalization = dict()

    fnames = set(chat_fnames).union(set(other_fnames))
    chat_rel_fnames = set()

    fnames = sorted(fnames)

    # Default personalization for unspecified files is 1/num_nodes
    # NOTE(review): this divides by len(fnames) — raises ZeroDivisionError
    # when both chat_fnames and other_fnames are empty; confirm callers
    # never invoke this with no files.
    personalize = 100 / len(fnames)

    fname_to_parts = {}
    fname_to_suffix = {}

    try:
        cache_size = len(self.TAGS_CACHE)
    except SQLITE_ERRORS as e:
        # Corrupt/locked sqlite cache: reset it and retry once.
        self.tags_cache_error(e)
        cache_size = len(self.TAGS_CACHE)

    if len(fnames) - cache_size > 100:
        self.io.tool_output(
            "Initial repo scan can be slow in larger repos, but only happens once."
        )
        self.io.update_spinner("Scanning repo")
        showing_bar = True
    else:
        showing_bar = False

    num_fnames = len(fnames)
    fname_index = 0
    for fname in fnames:
        if self.verbose:
            self.io.tool_output(f"Processing {fname}")
        if progress:
            if showing_bar:
                fname_index += 1
                self.io.update_spinner(f"Scanning repo: {fname_index}/{num_fnames}")
            else:
                self.io.update_spinner(f"{UPDATING_REPO_MAP_MESSAGE}: {fname}")

        try:
            file_ok = os.path.isfile(fname)
        except OSError:
            file_ok = False

        if not file_ok:
            if fname not in self.warned_files:
                self.io.tool_warning(f"Repo-map can't include {fname}")
                self.io.tool_output(
                    "Has it been deleted from the file system but not from git?"
                )
                self.warned_files.add(fname)
            continue

        # dump(fname)
        rel_fname = self.get_rel_fname(fname)
        current_pers = 0.0  # Start with 0 personalization score

        if fname in chat_fnames:
            current_pers += personalize
            chat_rel_fnames.add(rel_fname)

        if rel_fname in mentioned_fnames:
            # Use max to avoid double counting if in chat_fnames and mentioned_fnames
            current_pers = max(current_pers, personalize)

        # Check path components against mentioned_idents
        path_obj = Path(rel_fname)
        fname_to_parts[rel_fname] = path_obj.parts
        fname_to_suffix[rel_fname] = path_obj.suffix
        path_components = set(path_obj.parts)
        basename_with_ext = path_obj.name
        basename_without_ext, _ = os.path.splitext(basename_with_ext)
        components_to_check = path_components.union({basename_with_ext, basename_without_ext})

        matched_idents = components_to_check.intersection(mentioned_idents)
        if matched_idents:
            # Add personalization *once* if any path component matches a mentioned ident
            current_pers += personalize

        if current_pers > 0:
            personalization[rel_fname] = current_pers  # Assign the final calculated value

        # Get file mtime and check for cached summary
        file_mtime = self.get_mtime(fname)
        summary = None
        if file_mtime is not None:
            summary = self._get_cached_summary(fname, file_mtime)

        if summary is not None:
            # Use cached summary for defines and references
            for ident in summary["defines"]:
                defines[ident].add(rel_fname)
            for ident, count in summary["references"].items():
                references[ident][rel_fname] += count
                total_ref_count[ident] += count
            for imp in summary["imports"]:
                file_imports[rel_fname].add(imp)

            # Still need to parse tags for definitions (Tag objects)
            # But only if this file has definitions
            if summary["defines"]:
                tags = list(self.get_tags(fname, rel_fname))
                if tags is not None:
                    for tag in tags:
                        if tag.kind == "def":
                            key = (rel_fname, tag.name)
                            definitions[key].add(tag)
        else:
            # No cached summary, parse all tags
            tags = list(self.get_tags(fname, rel_fname))
            if tags is None:
                continue

            for tag in tags:
                if tag.kind == "def":
                    defines[tag.name].add(rel_fname)
                    key = (rel_fname, tag.name)
                    definitions[key].add(tag)

                elif tag.kind == "ref":
                    references[tag.name][rel_fname] += 1
                    total_ref_count[tag.name] += 1

                if tag.specific_kind == "import":
                    file_imports[rel_fname].add(tag.name)

    self.io.profile("Process Files")

    if self.use_enhanced_map and len(file_imports) > 0:
        import_ast_mode = True

    if len(references) == 0:
        # No refs at all (defs-only repo): treat every define as one
        # self-reference so the graph still has edges.
        # Convert defines to the new references structure: dict of dicts with counts
        references = {}
        for ident, files in defines.items():
            references[ident] = {file: 1 for file in files}
            total_ref_count[ident] = len(files)  # Each file has count 1

    idents = set(defines.keys()).intersection(set(references.keys()))

    G = rustworkx.PyDiGraph(multigraph=True)

    # Collect all unique file names that will be nodes
    all_files = set()
    for files in defines.values():
        all_files.update(files)
    for ref_dict in references.values():
        all_files.update(ref_dict.keys())
    all_files.update(file_imports.keys())
    all_files.update(personalization.keys())

    # Add all nodes and create mapping from file name to node index
    file_to_node = {}
    node_to_file = {}
    for fname in sorted(all_files):
        node_idx = G.add_node(fname)
        file_to_node[fname] = node_idx
        node_to_file[node_idx] = fname

    # Add a small self-edge for every definition that has no references
    # Helps with tree-sitter 0.23.2 with ruby, where "def greet(name)"
    # isn't counted as a def AND a ref. tree-sitter 0.24.0 does.

    unreferenced_weight = 2**-32 / (len(idents) + 1)
    for ident in defines.keys():
        if ident in references:
            continue
        for definer in defines[ident]:
            definer_idx = file_to_node[definer]
            G.add_edge(
                definer_idx, definer_idx, {"weight": unreferenced_weight, "ident": ident}
            )

    for ident in idents:
        if progress:
            self.io.update_spinner(f"{UPDATING_REPO_MAP_MESSAGE}: {ident}")

        definers = defines[ident]

        mul = 1.0

        is_snake = ("_" in ident) and any(c.isalpha() for c in ident)
        is_kebab = ("-" in ident) and any(c.isalpha() for c in ident)
        is_camel = any(c.isupper() for c in ident) and any(c.islower() for c in ident)
        if ident in mentioned_idents:
            mul *= 16

        # Prioritize function-like identifiers
        if (
            (is_snake or is_kebab or is_camel)
            and len(ident) >= 8
            and "test" not in ident.lower()
        ):
            mul *= 16

        # Downplay repetitive definitions in case of common boiler plate
        # Scale down logarithmically given the increasing number of references in a codebase
        # Ideally, this will help downweight boiler plate in frameworks, interfaces, and abstract classes
        if len(defines[ident]) > 4:
            exp = min(len(defines[ident]), 32)
            mul *= math.log2((4 / (2**exp)) + 1)

        # Calculate multiplier: log(number of unique file references * total references ^ 2)
        # Used to balance the number of times an identifier appears with its number of refs per file
        # Penetration in code base is important
        # So is the frequency
        # And the logarithm keeps them from scaling out of bounds forever
        # Combined with the above downweighting
        # There should be a push/pull that balances repetitiveness of identifier defs
        # With absolute number of references throughout a codebase
        unique_file_refs = len(references[ident])
        total_refs = total_ref_count[ident]
        ext_mul = round(math.log2(unique_file_refs * total_refs**2 + 1))

        for referencer, num_refs in references[ident].items():
            relevant_definers = [] if import_ast_mode else definers

            # A referencer should not link to any definiers of an identifier it also defines
            if referencer in definers:
                relevant_definers = [referencer]
            elif import_ast_mode:
                if referencer in file_imports:
                    matches = [
                        d
                        for d in definers
                        if self.check_import_match(d, file_imports[referencer])
                    ]
                    if matches:
                        relevant_definers = matches

            for definer in relevant_definers:
                # dump(referencer, definer, num_refs, mul)
                # Only add edge if file extensions match
                referencer_ext = fname_to_suffix[referencer]
                definer_ext = fname_to_suffix[definer]
                if referencer_ext != definer_ext:
                    continue

                use_mul = mul * ext_mul

                if referencer in chat_rel_fnames:
                    use_mul *= 64
                elif referencer == definer:
                    use_mul *= num_refs / 128

                # scale down so high freq (low value) mentions don't dominate
                # num_refs = math.sqrt(num_refs)

                p1 = fname_to_parts[referencer]
                p2 = fname_to_parts[definer]

                # Count common leading parts
                common_count = 0
                for c1, c2 in zip(p1, p2):
                    if c1 == c2:
                        common_count += 1
                    else:
                        break

                path_distance = len(p1) + len(p2) - (2 * common_count)

                # Edges decay exponentially with path distance between files.
                weight = use_mul * 2 ** (-1 * path_distance)
                referencer_idx = file_to_node[referencer]
                definer_idx = file_to_node[definer]
                G.add_edge(
                    referencer_idx,
                    definer_idx,
                    {"weight": weight, "key": ident, "ident": ident},
                )

    self.io.profile("Build Graph")

    self.io.profile("PERSONALIZATION START")
    # Convert personalization from file names to node indices
    if personalization:
        pers_node = {file_to_node[fname]: val for fname, val in personalization.items()}
        pers_args = dict(personalization=pers_node, dangling=pers_node)
    else:
        pers_args = dict()
    self.io.profile("PERSONALIZATION END")
    try:
        ranked = rustworkx.pagerank(G, weight_fn=lambda edge: edge["weight"], **pers_args)
    except ZeroDivisionError:
        # Issue #1536
        try:
            ranked = rustworkx.pagerank(G, weight_fn=lambda edge: edge["weight"])
        except ZeroDivisionError:
            self.io.profile("zero")
            return []
        except Exception as e:
            self.io.profile(e)
    except Exception as e:
        # NOTE(review): these two broad handlers only log; if they fire,
        # `ranked` is never assigned and the loop below raises NameError.
        # Confirm whether they should return [] like the ZeroDivision path.
        self.io.profile(e)

    self.io.profile("PageRank")

    # distribute the rank from each source node, across all of its out edges
    ranked_definitions = defaultdict(float)
    for src in G.node_indices():
        if progress:
            self.io.update_spinner(f"{UPDATING_REPO_MAP_MESSAGE}: {src}")

        src_rank = ranked[src]
        total_weight = sum(data["weight"] for _src, _dst, data in G.out_edges(src))
        # dump(src, src_rank, total_weight)
        for _src, dst, data in G.out_edges(src):
            data["rank"] = src_rank * data["weight"] / total_weight
            ident = data["ident"]
            fname = node_to_file[dst]
            ranked_definitions[(fname, ident)] += data["rank"]

    self.io.profile("Distribute Rank")

    ranked_tags = []
    ranked_definitions = sorted(
        ranked_definitions.items(), reverse=True, key=lambda x: (x[1], x[0])
    )

    # with open('defs.txt', 'w') as out_file:
    #     import pprint
    #     printer = pprint.PrettyPrinter(indent=2, stream=out_file)
    #     printer.pprint(ranked_definitions)

    for (fname, ident), rank in ranked_definitions:
        # print(f"{rank:.03f} {fname} {ident}")
        if fname in chat_rel_fnames:
            continue
        ranked_tags += list(definitions.get((fname, ident), []))

    rel_other_fnames_without_tags = set(self.get_rel_fname(fname) for fname in other_fnames)

    fnames_already_included = set(rt[0] for rt in ranked_tags)

    # Append bare (fname,) entries, highest-ranked files first, for files
    # that produced no ranked tags.
    top_rank = sorted([(rank, node_idx) for (node_idx, rank) in ranked.items()], reverse=True)
    for rank, node_idx in top_rank:
        fname = node_to_file[node_idx]
        if fname in rel_other_fnames_without_tags:
            rel_other_fnames_without_tags.remove(fname)
        if fname not in fnames_already_included:
            ranked_tags.append((fname,))

    for fname in rel_other_fnames_without_tags:
        ranked_tags.append((fname,))

    return ranked_tags
999
+
1000
def get_ranked_tags_map(
    self,
    chat_fnames,
    other_fnames=None,
    max_map_tokens=None,
    mentioned_fnames=None,
    mentioned_idents=None,
    force_refresh=False,
):
    """
    Return the repo map, serving a cached result when the refresh policy
    allows it; otherwise compute one and record how long it took.
    """
    other_fnames = other_fnames or list()
    max_map_tokens = max_map_tokens or self.max_map_tokens
    mentioned_fnames = mentioned_fnames or set()
    mentioned_idents = mentioned_idents or set()

    # Build the cache key from the inputs that affect the map.
    key_parts = [
        tuple(sorted(chat_fnames)) if chat_fnames else None,
        len(other_fnames) if other_fnames else None,
        max_map_tokens,
    ]

    if self.refresh == "auto":
        # In auto mode the mentioned files/idents also shape the key;
        # idents go through a similarity check to preserve cache hits.
        key_parts.append(tuple(sorted(mentioned_fnames)) if mentioned_fnames else None)
        key_parts.append(self._get_mentioned_idents_cache_component(mentioned_idents))

    cache_key = hash(str(tuple(key_parts)))

    use_cache = False
    if not force_refresh:
        # Manual mode: always serve the previous map if one exists.
        if self.refresh == "manual" and self.last_map:
            return self.last_map

        # Policy -> whether the map_cache may be consulted.
        use_cache = {
            "always": False,
            "files": True,
            "auto": self.map_processing_time > 1.0,
        }.get(self.refresh, False)

        if use_cache and cache_key in self.map_cache:
            return self.map_cache[cache_key]

    # Cache miss (or forced refresh): compute and time the map build.
    started = time.time()
    result = self.get_ranked_tags_map_uncached(
        chat_fnames, other_fnames, max_map_tokens, mentioned_fnames, mentioned_idents
    )
    self.map_processing_time = time.time() - started

    self.map_cache[cache_key] = result
    self.last_map = result

    return result
1066
+
1067
def get_ranked_tags_map_uncached(
    self,
    chat_fnames,
    other_fnames=None,
    max_map_tokens=None,
    mentioned_fnames=None,
    mentioned_idents=None,
):
    """
    Compute the repo-map text from scratch.

    Ranks tags, prepends "special" important files that weren't ranked,
    then binary-searches over how many ranked tags to render so the
    resulting tree is as close as possible to max_map_tokens (accepting
    within 15% error early).  Returns the best rendered tree, or None
    if nothing fit under the budget.
    """
    self.io.profile("Start Rank Tags Map Uncached", start=True)

    if not other_fnames:
        other_fnames = list()
    if not max_map_tokens:
        max_map_tokens = self.max_map_tokens
    if not mentioned_fnames:
        mentioned_fnames = set()
    if not mentioned_idents:
        mentioned_idents = set()

    self.io.update_spinner(UPDATING_REPO_MAP_MESSAGE)

    ranked_tags = self.get_ranked_tags(
        chat_fnames, other_fnames, mentioned_fnames, mentioned_idents, True
    )

    self.io.profile("Finish Getting Ranked Tags")

    # Important files (README, configs, ...) not already ranked get
    # bare (fname,) entries at the front of the list.
    other_rel_fnames = sorted(set(self.get_rel_fname(fname) for fname in other_fnames))
    special_fnames = filter_important_files(other_rel_fnames)
    ranked_tags_fnames = set(tag[0] for tag in ranked_tags)
    special_fnames = [fn for fn in special_fnames if fn not in ranked_tags_fnames]
    special_fnames = [(fn,) for fn in special_fnames]

    ranked_tags = special_fnames + ranked_tags

    num_tags = len(ranked_tags)
    lower_bound = 0
    upper_bound = num_tags
    best_tree = None
    best_tree_tokens = 0

    chat_rel_fnames = set(self.get_rel_fname(fname) for fname in chat_fnames)

    # Fresh render cache per map build (mtime-keyed entries would
    # otherwise accumulate across calls).
    self.tree_cache = dict()

    # Start near the expected tag count (~25 tokens per tag heuristic).
    middle = min(int(max_map_tokens // 25), num_tags)
    while lower_bound <= upper_bound:
        # dump(lower_bound, middle, upper_bound)

        if middle > 1500:
            show_tokens = f"{middle / 1000.0:.1f}K"
        else:
            show_tokens = str(middle)

        self.io.update_spinner(f"{UPDATING_REPO_MAP_MESSAGE}: {show_tokens} tokens")

        tree = self.to_tree(ranked_tags[:middle], chat_rel_fnames)
        num_tokens = self.token_count(tree)

        pct_err = abs(num_tokens - max_map_tokens) / max_map_tokens
        ok_err = 0.15
        # Keep the largest tree under budget; accept anything within 15%.
        if (num_tokens <= max_map_tokens and num_tokens > best_tree_tokens) or pct_err < ok_err:
            best_tree = tree
            best_tree_tokens = num_tokens

            if pct_err < ok_err:
                break

        if num_tokens < max_map_tokens:
            lower_bound = middle + 1
        else:
            upper_bound = middle - 1

        middle = int((lower_bound + upper_bound) // 2)

    self.io.profile("Calculate Best Tree")

    return best_tree
1145
+
1146
# Class-level default for the rendered-tree cache; get_ranked_tags_map_uncached
# replaces it with a fresh per-instance dict before each map build.
tree_cache = dict()
1147
+
1148
def render_tree(self, abs_fname, rel_fname, lois):
    """
    Render the lines-of-interest (*lois*) of a file as a context tree.

    Two caches are consulted: tree_cache keyed by (rel_fname, lois, mtime)
    for the final rendered string, and tree_context_cache keyed by
    rel_fname (invalidated on mtime change) for the parsed TreeContext.
    """
    mtime = self.get_mtime(abs_fname)
    key = (rel_fname, tuple(sorted(lois)), mtime)

    if key in self.tree_cache:
        return self.tree_cache[key]

    # (Re)build the TreeContext when the file is new or has changed on disk.
    if (
        rel_fname not in self.tree_context_cache
        or self.tree_context_cache[rel_fname]["mtime"] != mtime
    ):
        code = self.io.read_text(abs_fname) or ""
        # TreeContext expects newline-terminated input.
        if not code.endswith("\n"):
            code += "\n"

        context = TreeContext(
            rel_fname,
            code,
            color=False,
            line_number=False,
            child_context=False,
            last_line=False,
            margin=0,
            mark_lois=False,
            loi_pad=0,
            # header_max=30,
            show_top_of_file_parent_scope=False,
        )
        self.tree_context_cache[rel_fname] = {"context": context, "mtime": mtime}

    # The cached context is mutated in place: reset its lines of interest
    # before formatting this particular set of lois.
    context = self.tree_context_cache[rel_fname]["context"]
    context.lines_of_interest = set()
    context.add_lines_of_interest(lois)
    context.add_context()
    res = context.format()
    self.tree_cache[key] = res
    return res
1185
+
1186
def to_tree(self, tags, chat_rel_fnames):
    """
    Render a list of ranked tags (Tag objects and bare (fname,) tuples)
    into the repo-map text, skipping files already in the chat.

    Tags are grouped by file; Tag entries get a rendered code tree of
    their lines of interest, while bare-tuple entries just emit the
    filename.
    """
    if not tags:
        return ""

    cur_fname = None
    cur_abs_fname = None
    lois = None  # lines of interest for the file currently being grouped
    output = ""

    # add a bogus tag at the end so we trip the this_fname != cur_fname...
    dummy_tag = (None,)
    for tag in sorted(tags) + [dummy_tag]:
        this_rel_fname = tag[0]
        if this_rel_fname in chat_rel_fnames:
            continue

        # ... here ... to output the final real entry in the list
        if this_rel_fname != cur_fname:
            if lois is not None:
                output += "\n"
                output += cur_fname + ":\n"

                # truncate long lines, in case we get minified js or something else crazy
                output += truncate_long_lines(
                    self.render_tree(cur_abs_fname, cur_fname, lois), self.max_code_line_length
                )

                lois = None
            elif cur_fname:
                # Previous entry was a bare (fname,) tuple: name only, no tree.
                output += "\n" + cur_fname + "\n"
            if type(tag) is Tag:
                lois = []
                cur_abs_fname = tag.fname
            cur_fname = this_rel_fname

        if lois is not None:
            lois.append(tag.line)

    return output
1225
+
1226
def _get_mentioned_idents_cache_component(self, mentioned_idents):
    """
    Determine the cache key component for mentioned_idents using similarity comparison.

    This method compares the current mentioned_idents with the previous ones using
    cosine similarity. If the similarity is high enough, it returns the previous
    cache key component to maintain cache hits. Otherwise, it updates the stored
    values and returns the current mentioned_idents.

    The similarity threshold adapts: consecutive hits tighten it (up to 0.9),
    consecutive misses loosen it (down to 0.5).

    Args:
        mentioned_idents (set): Current set of mentioned identifiers

    Returns:
        tuple or None: Cache key component for mentioned_idents
    """
    if not mentioned_idents:
        # Nothing mentioned: clear the comparison state entirely.
        self._last_mentioned_idents = None
        self._last_mentioned_idents_vector = None
        self._has_last_mentioned_idents = False
        return None

    current_mentioned_idents = tuple(mentioned_idents)

    # Check if we have a previous cached value to compare against
    if self._has_last_mentioned_idents:
        # Create vector for current mentioned_idents
        # (create_bigram_vector / normalize_vector / cosine_similarity are
        # module-level helpers defined elsewhere in this file.)
        current_vector = create_bigram_vector(current_mentioned_idents)
        current_vector_norm = normalize_vector(current_vector)

        # Calculate cosine similarity
        similarity = cosine_similarity(self._last_mentioned_idents_vector, current_vector_norm)
        # If similarity is high enough, use the previous cache key component
        if similarity >= self._mentioned_ident_similarity:
            # Use the previous mentioned_idents for cache key to maintain cache hit
            cache_key_component = self._last_mentioned_idents

            # Make similarity more strict the more consecutive cache hits
            self._mentioned_ident_similarity = min(
                0.9, self._mentioned_ident_similarity + 0.025
            )
        else:
            # Similarity is too low, use current mentioned_idents
            cache_key_component = current_mentioned_idents

            # Update stored values
            self._last_mentioned_idents = current_mentioned_idents
            self._last_mentioned_idents_vector = current_vector_norm

            # Make similarity less strict the more consecutive cache misses
            self._mentioned_ident_similarity = max(
                0.5, self._mentioned_ident_similarity - 0.025
            )
    else:
        # First time or no previous value, use current mentioned_idents
        cache_key_component = current_mentioned_idents
        current_vector = create_bigram_vector(current_mentioned_idents)

        # Store for future comparisons
        self._last_mentioned_idents = current_mentioned_idents
        self._last_mentioned_idents_vector = normalize_vector(current_vector)

    self._has_last_mentioned_idents = True
    return cache_key_component
1289
+
1290
+
1291
def truncate_long_lines(text, max_length):
    """Clip each line of *text* to *max_length* chars; result ends with a newline."""
    clipped = (line[:max_length] for line in text.splitlines())
    return "\n".join(clipped) + "\n"
1293
+
1294
+
1295
def find_src_files(directory):
    """Return every file under *directory*; a non-directory path is returned as-is."""
    if not os.path.isdir(directory):
        return [directory]

    # Flatten the walk into full paths, preserving os.walk order.
    return [
        os.path.join(root, name)
        for root, _dirs, names in os.walk(directory)
        for name in names
    ]
1304
+
1305
+
1306
def get_scm_fname(lang):
    """
    Locate the bundled tree-sitter tags query (.scm) for *lang*.

    Prefers the tree-sitter-language-pack queries when that pack is in
    use, falling back to the tree-sitter-languages set.  Returns None
    when the package resources cannot be resolved.
    """
    if USING_TSL_PACK:
        try:
            candidate = resources.files(__package__).joinpath(
                "queries",
                "tree-sitter-language-pack",
                f"{lang}-tags.scm",
            )
            if candidate.exists():
                return candidate
        except KeyError:
            pass

    # Fall back to the tree-sitter-languages query set.
    try:
        return resources.files(__package__).joinpath(
            "queries",
            "tree-sitter-languages",
            f"{lang}-tags.scm",
        )
    except KeyError:
        return
1331
+
1332
+
1333
def get_supported_languages_md():
    """Build a markdown table of languages with repo-map / linter support."""
    from grep_ast.parsers import PARSERS

    res = """
| Language | File extension | Repo map | Linter |
|:--------:|:--------------:|:--------:|:------:|
"""
    # PARSERS maps extension -> language; present rows sorted by language.
    for lang, ext in sorted((lang, ex) for ex, lang in PARSERS.items()):
        fn = get_scm_fname(lang)
        repo_map = "✓" if fn and os.path.exists(fn) else ""
        linter_support = "✓"
        res += f"| {lang:20} | {ext:20} | {repo_map:^8} | {linter_support:^6} |\n"

    res += "\n"

    return res
1351
+
1352
+
1353
if __name__ == "__main__":
    # CLI entry point: build and print a repo map for the paths given on
    # the command line.  Directories are expanded to their contained files;
    # plain paths are used directly.  All paths become chat files.
    # (Removed dead `fnames = sys.argv[1:]` assignment — it was never read;
    # the loop below re-reads sys.argv[1:] itself.)
    chat_fnames = []
    other_fnames = []
    for fname in sys.argv[1:]:
        if os.path.isdir(fname):
            chat_fnames += find_src_files(fname)
        else:
            chat_fnames.append(fname)

    rm = RepoMap(root=".")
    repo_map = rm.get_ranked_tags_map(chat_fnames, other_fnames)

    dump(len(repo_map))
    print(repo_map)