coderay 1.2.0__tar.gz → 1.2.1__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (120) hide show
  1. {coderay-1.2.0/src/coderay.egg-info → coderay-1.2.1}/PKG-INFO +2 -2
  2. {coderay-1.2.0 → coderay-1.2.1}/README.md +1 -1
  3. {coderay-1.2.0 → coderay-1.2.1}/pyproject.toml +1 -1
  4. coderay-1.2.1/src/coderay/__init__.py +1 -0
  5. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/core/defaults/default.coderay.toml +2 -2
  6. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/embedding/README.md +21 -13
  7. {coderay-1.2.0 → coderay-1.2.1/src/coderay.egg-info}/PKG-INFO +2 -2
  8. coderay-1.2.0/src/coderay/__init__.py +0 -1
  9. {coderay-1.2.0 → coderay-1.2.1}/LICENSE +0 -0
  10. {coderay-1.2.0 → coderay-1.2.1}/MANIFEST.in +0 -0
  11. {coderay-1.2.0 → coderay-1.2.1}/NOTICE +0 -0
  12. {coderay-1.2.0 → coderay-1.2.1}/setup.cfg +0 -0
  13. {coderay-1.2.0 → coderay-1.2.1}/src/README.md +0 -0
  14. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/chunking/README.md +0 -0
  15. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/chunking/__init__.py +0 -0
  16. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/chunking/chunker.py +0 -0
  17. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/cli/README.md +0 -0
  18. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/cli/__init__.py +0 -0
  19. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/cli/commands.py +0 -0
  20. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/cli/search_input.py +0 -0
  21. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/core/README.md +0 -0
  22. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/core/__init__.py +0 -0
  23. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/core/config.py +0 -0
  24. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/core/defaults/__init__.py +0 -0
  25. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/core/errors.py +0 -0
  26. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/core/index_workspace.py +0 -0
  27. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/core/lock.py +0 -0
  28. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/core/models.py +0 -0
  29. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/core/timing.py +0 -0
  30. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/core/utils.py +0 -0
  31. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/embedding/__init__.py +0 -0
  32. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/embedding/backend_resolve.py +0 -0
  33. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/embedding/base.py +0 -0
  34. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/embedding/format.py +0 -0
  35. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/embedding/local.py +0 -0
  36. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/embedding/mlx_backend.py +0 -0
  37. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/embedding/prefixes.py +0 -0
  38. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/README.md +0 -0
  39. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/__init__.py +0 -0
  40. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/builder.py +0 -0
  41. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/code_graph.py +0 -0
  42. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/extractors/__init__.py +0 -0
  43. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/extractors/base.py +0 -0
  44. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/extractors/js_ts/__init__.py +0 -0
  45. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/extractors/js_ts/extractor.py +0 -0
  46. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/extractors/python/__init__.py +0 -0
  47. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/extractors/python/extractor.py +0 -0
  48. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/facts.py +0 -0
  49. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/graph_builder.py +0 -0
  50. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/handlers/__init__.py +0 -0
  51. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/handlers/assignment_binder.py +0 -0
  52. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/handlers/call_emitter.py +0 -0
  53. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/handlers/decorator_emitter.py +0 -0
  54. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/handlers/definition_binder.py +0 -0
  55. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/handlers/definition_emitter.py +0 -0
  56. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/handlers/helpers.py +0 -0
  57. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/handlers/js_ts/__init__.py +0 -0
  58. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/handlers/js_ts/import_binder.py +0 -0
  59. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/handlers/js_ts/import_emitter.py +0 -0
  60. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/handlers/python/__init__.py +0 -0
  61. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/handlers/python/assignment_binder.py +0 -0
  62. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/handlers/python/function_binder.py +0 -0
  63. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/handlers/python/import_binder.py +0 -0
  64. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/handlers/python/import_emitter.py +0 -0
  65. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/handlers/python/with_binder.py +0 -0
  66. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/handlers/typed_annotations.py +0 -0
  67. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/handlers/typed_params.py +0 -0
  68. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/impact.py +0 -0
  69. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/language_plugin.py +0 -0
  70. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/lowering/__init__.py +0 -0
  71. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/lowering/callee_resolver.py +0 -0
  72. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/lowering/callee_strategy.py +0 -0
  73. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/lowering/cst_helpers.py +0 -0
  74. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/lowering/name_bindings.py +0 -0
  75. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/materialise.py +0 -0
  76. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/passes/__init__.py +0 -0
  77. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/passes/python.py +0 -0
  78. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/passes/resolve_bare_phantoms.py +0 -0
  79. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/pipeline.py +0 -0
  80. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/project_index.py +0 -0
  81. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/refs.py +0 -0
  82. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/graph/utils.py +0 -0
  83. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/mcp_server/README.md +0 -0
  84. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/mcp_server/__init__.py +0 -0
  85. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/mcp_server/errors.py +0 -0
  86. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/mcp_server/server.py +0 -0
  87. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/parsing/README.md +0 -0
  88. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/parsing/base.py +0 -0
  89. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/parsing/conventions.py +0 -0
  90. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/parsing/cst_kind.py +0 -0
  91. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/parsing/cst_traversal.py +0 -0
  92. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/parsing/languages.py +0 -0
  93. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/pipeline/README.md +0 -0
  94. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/pipeline/__init__.py +0 -0
  95. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/pipeline/indexer.py +0 -0
  96. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/pipeline/watcher.py +0 -0
  97. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/retrieval/README.md +0 -0
  98. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/retrieval/__init__.py +0 -0
  99. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/retrieval/boosting.py +0 -0
  100. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/retrieval/models.py +0 -0
  101. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/retrieval/search.py +0 -0
  102. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/skeleton/README.md +0 -0
  103. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/skeleton/__init__.py +0 -0
  104. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/skeleton/extractor.py +0 -0
  105. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/skeleton/path_range.py +0 -0
  106. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/state/README.md +0 -0
  107. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/state/__init__.py +0 -0
  108. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/state/machine.py +0 -0
  109. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/state/version.py +0 -0
  110. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/storage/README.md +0 -0
  111. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/storage/__init__.py +0 -0
  112. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/storage/lancedb.py +0 -0
  113. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/vcs/README.md +0 -0
  114. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/vcs/__init__.py +0 -0
  115. {coderay-1.2.0 → coderay-1.2.1}/src/coderay/vcs/git.py +0 -0
  116. {coderay-1.2.0 → coderay-1.2.1}/src/coderay.egg-info/SOURCES.txt +0 -0
  117. {coderay-1.2.0 → coderay-1.2.1}/src/coderay.egg-info/dependency_links.txt +0 -0
  118. {coderay-1.2.0 → coderay-1.2.1}/src/coderay.egg-info/entry_points.txt +0 -0
  119. {coderay-1.2.0 → coderay-1.2.1}/src/coderay.egg-info/requires.txt +0 -0
  120. {coderay-1.2.0 → coderay-1.2.1}/src/coderay.egg-info/top_level.txt +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: coderay
3
- Version: 1.2.0
3
+ Version: 1.2.1
4
4
  Summary: X-ray your codebase — semantic search, code graphs, file skeletons, and MCP server
5
5
  Author-email: Bogdan Copocean <bogdancopocean@gmail.com>
6
6
  License-Expression: MIT
@@ -162,7 +162,7 @@ which coderay-mcp
162
162
  - **Languages** — Python, JavaScript, and TypeScript — [`parsing/README.md`](src/coderay/parsing/README.md)
163
163
  - **Multi-repo / monorepo** — roots, aliases, optional `include` subtrees — [`core/README.md`](src/coderay/core/README.md)
164
164
  - **Hybrid search** — vector + BM25 (RRF), optional boosting — [`retrieval/README.md`](src/coderay/retrieval/README.md)
165
- - **Embeddings** — fastembed (CPU) or MLX on Apple Silicon — [`embedding/README.md`](src/coderay/embedding/README.md)
165
+ - **Embeddings** — fastembed (CPU) or MLX on Apple Silicon. Defaults to MiniLM L6 for speed; configure BGE in `.coderay.toml` for stronger (heavier) vectors — [`embedding/README.md`](src/coderay/embedding/README.md)
166
166
  - **Watch** — incremental re-index; `.coderay.toml` is the source of truth for what’s indexed
167
167
 
168
168
 
@@ -109,7 +109,7 @@ which coderay-mcp
109
109
  - **Languages** — Python, JavaScript, and TypeScript — [`parsing/README.md`](src/coderay/parsing/README.md)
110
110
  - **Multi-repo / monorepo** — roots, aliases, optional `include` subtrees — [`core/README.md`](src/coderay/core/README.md)
111
111
  - **Hybrid search** — vector + BM25 (RRF), optional boosting — [`retrieval/README.md`](src/coderay/retrieval/README.md)
112
- - **Embeddings** — fastembed (CPU) or MLX on Apple Silicon — [`embedding/README.md`](src/coderay/embedding/README.md)
112
+ - **Embeddings** — fastembed (CPU) or MLX on Apple Silicon. Defaults to MiniLM L6 for speed; configure BGE in `.coderay.toml` for stronger (heavier) vectors — [`embedding/README.md`](src/coderay/embedding/README.md)
113
113
  - **Watch** — incremental re-index; `.coderay.toml` is the source of truth for what’s indexed
114
114
 
115
115
 
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
4
4
 
5
5
  [project]
6
6
  name = "coderay"
7
- version = "1.2.0"
7
+ version = "1.2.1"
8
8
  description = "X-ray your codebase — semantic search, code graphs, file skeletons, and MCP server"
9
9
  readme = "README.md"
10
10
  license = "MIT"
@@ -0,0 +1 @@
1
+ __version__ = "1.2.1"
@@ -38,13 +38,13 @@ backend = "auto"
38
38
 
39
39
  [embedder.fastembed]
40
40
  # Default embedder. Runs on CPU.
41
- model_name = "BAAI/bge-small-en-v1.5"
41
+ model_name = "sentence-transformers/all-MiniLM-L6-v2"
42
42
  dimensions = 384
43
43
  batch_size = 64
44
44
 
45
45
  [embedder.mlx]
46
46
  # Apple Silicon embedder (MLX/Metal; device depends on runtime).
47
- model_name = "mlx-community/bge-small-en-v1.5-bf16"
47
+ model_name = "mlx-community/all-MiniLM-L6-v2-4bit"
48
48
  dimensions = 384
49
49
  batch_size = 256
50
50
 
@@ -27,25 +27,33 @@ Maps code chunks to dense vectors for storage and query.
27
27
  Run `coderay build --full` after any change to `[embedder]` config. Vectors
28
28
  from different models are not compatible.
29
29
 
30
- ## If indexing is slow
30
+ ## Defaults and trade-offs
31
31
 
32
- The default model (BGE Small, ~67MB via fastembed / ~25MB via MLX bf16) is a
33
- good balance of speed and retrieval quality. If your repo is large and the first
34
- build takes too long, consider a lighter model:
32
+ The default is **MiniLM L6** (`sentence-transformers/all-MiniLM-L6-v2` on CPU,
33
+ `mlx-community/all-MiniLM-L6-v2-4bit` on MLX): fast indexing and good enough
34
+ semantic search for most workflows. For **stronger embeddings** (often better
35
+ retrieval on code), switch to **BGE Small** — expect a heavier download and more
36
+ compute than MiniLM.
35
37
 
36
- | Model | Backend | Size | Dimensions | Trade-off |
37
- |-------|---------|------|------------|-----------|
38
- | `BAAI/bge-small-en-v1.5` | fastembed | ~67MB | 384 | **Default.** Best retrieval quality in this size class. |
39
- | `sentence-transformers/all-MiniLM-L6-v2` | fastembed | ~90MB | 384 | Widely used, slightly lower code retrieval quality than BGE Small. Larger download. |
40
- | `mlx-community/bge-small-en-v1.5-4bit` | mlx | ~19MB | 384 | 4-bit quantised BGE Small. Fast on Apple Silicon, minimal download. Small quality delta vs bf16 — untested on code retrieval specifically. |
41
- | `mlx-community/all-MiniLM-L6-v2-4bit` | mlx | ~13MB | 384 | Smallest option. Fastest cold start. Noticeably lower retrieval quality for code; best suited for quick experimentation. |
38
+ | Model | Backend | Size (approx.) | Dimensions | Notes |
39
+ |-------|---------|----------------|------------|-------|
40
+ | `sentence-transformers/all-MiniLM-L6-v2` | fastembed | ~90MB | 384 | **Default.** Fast; widely used. |
41
+ | `BAAI/bge-small-en-v1.5` | fastembed | ~67MB | 384 | Heavier quality focus; strong retrieval in this size class. |
42
+ | `mlx-community/all-MiniLM-L6-v2-bf16` | mlx | ~45MB | 384 | bf16 MiniLM on MLX; larger download than the 4-bit default. |
43
+ | `mlx-community/bge-small-en-v1.5-bf16` | mlx | ~25MB | 384 | BGE on MLX; better embeddings than MiniLM, more work per batch. |
44
+ | `mlx-community/bge-small-en-v1.5-4bit` | mlx | ~19MB | 384 | 4-bit BGE; smaller download, small quality delta vs bf16. |
45
+ | `mlx-community/all-MiniLM-L6-v2-4bit` | mlx | ~13MB | 384 | **Default** on Apple Silicon with `coderay[mlx]`. Smallest; fastest cold start; lower retrieval quality for code. |
42
46
 
43
- To switch, update `.coderay.toml` and run `coderay build --full`:
47
+ To use BGE instead of the defaults, edit `.coderay.toml` and run `coderay build --full`:
44
48
 
45
49
  ```toml
46
- # Example: lighter MLX model on Apple Silicon
50
+ [embedder.fastembed]
51
+ model_name = "BAAI/bge-small-en-v1.5"
52
+ dimensions = 384
53
+ batch_size = 64
54
+
47
55
  [embedder.mlx]
48
- model_name = "mlx-community/bge-small-en-v1.5-4bit"
56
+ model_name = "mlx-community/bge-small-en-v1.5-bf16"
49
57
  dimensions = 384
50
58
  batch_size = 256
51
59
  ```
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: coderay
3
- Version: 1.2.0
3
+ Version: 1.2.1
4
4
  Summary: X-ray your codebase — semantic search, code graphs, file skeletons, and MCP server
5
5
  Author-email: Bogdan Copocean <bogdancopocean@gmail.com>
6
6
  License-Expression: MIT
@@ -162,7 +162,7 @@ which coderay-mcp
162
162
  - **Languages** — Python, JavaScript, and TypeScript — [`parsing/README.md`](src/coderay/parsing/README.md)
163
163
  - **Multi-repo / monorepo** — roots, aliases, optional `include` subtrees — [`core/README.md`](src/coderay/core/README.md)
164
164
  - **Hybrid search** — vector + BM25 (RRF), optional boosting — [`retrieval/README.md`](src/coderay/retrieval/README.md)
165
- - **Embeddings** — fastembed (CPU) or MLX on Apple Silicon — [`embedding/README.md`](src/coderay/embedding/README.md)
165
+ - **Embeddings** — fastembed (CPU) or MLX on Apple Silicon. Defaults to MiniLM L6 for speed; configure BGE in `.coderay.toml` for stronger (heavier) vectors — [`embedding/README.md`](src/coderay/embedding/README.md)
166
166
  - **Watch** — incremental re-index; `.coderay.toml` is the source of truth for what’s indexed
167
167
 
168
168
 
@@ -1 +0,0 @@
1
- __version__ = "1.2.0"
File without changes
File without changes
File without changes
File without changes
File without changes
File without changes