mcp-vector-search 0.0.3__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of mcp-vector-search might be problematic. Click here for more details.
- mcp_vector_search-0.0.3/.gitignore +233 -0
- mcp_vector_search-0.0.3/.pre-commit-config.yaml +29 -0
- mcp_vector_search-0.0.3/LICENSE +21 -0
- mcp_vector_search-0.0.3/PKG-INFO +333 -0
- mcp_vector_search-0.0.3/README.md +279 -0
- mcp_vector_search-0.0.3/docs/prd/mcp_vector_search_prd_updated.md +1860 -0
- mcp_vector_search-0.0.3/pyproject.toml +189 -0
- mcp_vector_search-0.0.3/scripts/dev-setup.py +81 -0
- mcp_vector_search-0.0.3/src/mcp_vector_search/__init__.py +9 -0
- mcp_vector_search-0.0.3/src/mcp_vector_search/cli/__init__.py +1 -0
- mcp_vector_search-0.0.3/src/mcp_vector_search/cli/commands/__init__.py +1 -0
- mcp_vector_search-0.0.3/src/mcp_vector_search/cli/commands/config.py +303 -0
- mcp_vector_search-0.0.3/src/mcp_vector_search/cli/commands/index.py +304 -0
- mcp_vector_search-0.0.3/src/mcp_vector_search/cli/commands/init.py +212 -0
- mcp_vector_search-0.0.3/src/mcp_vector_search/cli/commands/search.py +395 -0
- mcp_vector_search-0.0.3/src/mcp_vector_search/cli/commands/status.py +340 -0
- mcp_vector_search-0.0.3/src/mcp_vector_search/cli/commands/watch.py +288 -0
- mcp_vector_search-0.0.3/src/mcp_vector_search/cli/main.py +117 -0
- mcp_vector_search-0.0.3/src/mcp_vector_search/cli/output.py +242 -0
- mcp_vector_search-0.0.3/src/mcp_vector_search/config/__init__.py +1 -0
- mcp_vector_search-0.0.3/src/mcp_vector_search/config/defaults.py +175 -0
- mcp_vector_search-0.0.3/src/mcp_vector_search/config/settings.py +108 -0
- mcp_vector_search-0.0.3/src/mcp_vector_search/core/__init__.py +1 -0
- mcp_vector_search-0.0.3/src/mcp_vector_search/core/database.py +431 -0
- mcp_vector_search-0.0.3/src/mcp_vector_search/core/embeddings.py +250 -0
- mcp_vector_search-0.0.3/src/mcp_vector_search/core/exceptions.py +66 -0
- mcp_vector_search-0.0.3/src/mcp_vector_search/core/indexer.py +310 -0
- mcp_vector_search-0.0.3/src/mcp_vector_search/core/models.py +174 -0
- mcp_vector_search-0.0.3/src/mcp_vector_search/core/project.py +304 -0
- mcp_vector_search-0.0.3/src/mcp_vector_search/core/search.py +324 -0
- mcp_vector_search-0.0.3/src/mcp_vector_search/core/watcher.py +320 -0
- mcp_vector_search-0.0.3/src/mcp_vector_search/mcp/__init__.py +1 -0
- mcp_vector_search-0.0.3/src/mcp_vector_search/parsers/__init__.py +1 -0
- mcp_vector_search-0.0.3/src/mcp_vector_search/parsers/base.py +180 -0
- mcp_vector_search-0.0.3/src/mcp_vector_search/parsers/javascript.py +238 -0
- mcp_vector_search-0.0.3/src/mcp_vector_search/parsers/python.py +407 -0
- mcp_vector_search-0.0.3/src/mcp_vector_search/parsers/registry.py +187 -0
- mcp_vector_search-0.0.3/src/mcp_vector_search/py.typed +1 -0
- mcp_vector_search-0.0.3/tests/__init__.py +1 -0
- mcp_vector_search-0.0.3/uv.lock +3644 -0
|
@@ -0,0 +1,233 @@
|
|
|
1
|
+
# MCP Vector Search specific
|
|
2
|
+
.mcp-vector-search/
|
|
3
|
+
*.db
|
|
4
|
+
*.sqlite
|
|
5
|
+
*.sqlite3
|
|
6
|
+
|
|
7
|
+
# Python
|
|
8
|
+
__pycache__/
|
|
9
|
+
*.py[cod]
|
|
10
|
+
*$py.class
|
|
11
|
+
*.so
|
|
12
|
+
.Python
|
|
13
|
+
build/
|
|
14
|
+
develop-eggs/
|
|
15
|
+
dist/
|
|
16
|
+
downloads/
|
|
17
|
+
eggs/
|
|
18
|
+
.eggs/
|
|
19
|
+
lib/
|
|
20
|
+
lib64/
|
|
21
|
+
parts/
|
|
22
|
+
sdist/
|
|
23
|
+
var/
|
|
24
|
+
wheels/
|
|
25
|
+
share/python-wheels/
|
|
26
|
+
*.egg-info/
|
|
27
|
+
.installed.cfg
|
|
28
|
+
*.egg
|
|
29
|
+
MANIFEST
|
|
30
|
+
|
|
31
|
+
# PyInstaller
|
|
32
|
+
*.manifest
|
|
33
|
+
*.spec
|
|
34
|
+
|
|
35
|
+
# Installer logs
|
|
36
|
+
pip-log.txt
|
|
37
|
+
pip-delete-this-directory.txt
|
|
38
|
+
|
|
39
|
+
# Unit test / coverage reports
|
|
40
|
+
htmlcov/
|
|
41
|
+
.tox/
|
|
42
|
+
.nox/
|
|
43
|
+
.coverage
|
|
44
|
+
.coverage.*
|
|
45
|
+
.cache
|
|
46
|
+
nosetests.xml
|
|
47
|
+
coverage.xml
|
|
48
|
+
*.cover
|
|
49
|
+
*.py,cover
|
|
50
|
+
.hypothesis/
|
|
51
|
+
.pytest_cache/
|
|
52
|
+
cover/
|
|
53
|
+
|
|
54
|
+
# Translations
|
|
55
|
+
*.mo
|
|
56
|
+
*.pot
|
|
57
|
+
|
|
58
|
+
# Django stuff:
|
|
59
|
+
*.log
|
|
60
|
+
local_settings.py
|
|
61
|
+
db.sqlite3
|
|
62
|
+
db.sqlite3-journal
|
|
63
|
+
|
|
64
|
+
# Flask stuff:
|
|
65
|
+
instance/
|
|
66
|
+
.webassets-cache
|
|
67
|
+
|
|
68
|
+
# Scrapy stuff:
|
|
69
|
+
.scrapy
|
|
70
|
+
|
|
71
|
+
# Sphinx documentation
|
|
72
|
+
docs/_build/
|
|
73
|
+
|
|
74
|
+
# PyBuilder
|
|
75
|
+
.pybuilder/
|
|
76
|
+
target/
|
|
77
|
+
|
|
78
|
+
# Jupyter Notebook
|
|
79
|
+
.ipynb_checkpoints
|
|
80
|
+
|
|
81
|
+
# IPython
|
|
82
|
+
profile_default/
|
|
83
|
+
ipython_config.py
|
|
84
|
+
|
|
85
|
+
# pyenv
|
|
86
|
+
.python-version
|
|
87
|
+
|
|
88
|
+
# pipenv
|
|
89
|
+
Pipfile.lock
|
|
90
|
+
|
|
91
|
+
# poetry
|
|
92
|
+
poetry.lock
|
|
93
|
+
|
|
94
|
+
# pdm
|
|
95
|
+
.pdm.toml
|
|
96
|
+
|
|
97
|
+
# PEP 582
|
|
98
|
+
__pypackages__/
|
|
99
|
+
|
|
100
|
+
# Celery stuff
|
|
101
|
+
celerybeat-schedule
|
|
102
|
+
celerybeat.pid
|
|
103
|
+
|
|
104
|
+
# SageMath parsed files
|
|
105
|
+
*.sage.py
|
|
106
|
+
|
|
107
|
+
# Environments
|
|
108
|
+
.env
|
|
109
|
+
.venv
|
|
110
|
+
env/
|
|
111
|
+
venv/
|
|
112
|
+
ENV/
|
|
113
|
+
env.bak/
|
|
114
|
+
venv.bak/
|
|
115
|
+
|
|
116
|
+
# Spyder project settings
|
|
117
|
+
.spyderproject
|
|
118
|
+
.spyproject
|
|
119
|
+
|
|
120
|
+
# Rope project settings
|
|
121
|
+
.ropeproject
|
|
122
|
+
|
|
123
|
+
# mkdocs documentation
|
|
124
|
+
/site
|
|
125
|
+
|
|
126
|
+
# mypy
|
|
127
|
+
.mypy_cache/
|
|
128
|
+
.dmypy.json
|
|
129
|
+
dmypy.json
|
|
130
|
+
|
|
131
|
+
# Pyre type checker
|
|
132
|
+
.pyre/
|
|
133
|
+
|
|
134
|
+
# pytype static type analyzer
|
|
135
|
+
.pytype/
|
|
136
|
+
|
|
137
|
+
# Cython debug symbols
|
|
138
|
+
cython_debug/
|
|
139
|
+
|
|
140
|
+
# PyCharm
|
|
141
|
+
.idea/
|
|
142
|
+
|
|
143
|
+
# VS Code
|
|
144
|
+
.vscode/
|
|
145
|
+
|
|
146
|
+
# macOS
|
|
147
|
+
.DS_Store
|
|
148
|
+
.AppleDouble
|
|
149
|
+
.LSOverride
|
|
150
|
+
|
|
151
|
+
# Windows
|
|
152
|
+
Thumbs.db
|
|
153
|
+
Thumbs.db:encryptable
|
|
154
|
+
ehthumbs.db
|
|
155
|
+
ehthumbs_vista.db
|
|
156
|
+
*.tmp
|
|
157
|
+
*.temp
|
|
158
|
+
Desktop.ini
|
|
159
|
+
$RECYCLE.BIN/
|
|
160
|
+
|
|
161
|
+
# Linux
|
|
162
|
+
*~
|
|
163
|
+
|
|
164
|
+
# Node.js (for any JS/TS development)
|
|
165
|
+
node_modules/
|
|
166
|
+
npm-debug.log*
|
|
167
|
+
yarn-debug.log*
|
|
168
|
+
yarn-error.log*
|
|
169
|
+
|
|
170
|
+
# Temporary files
|
|
171
|
+
*.tmp
|
|
172
|
+
*.temp
|
|
173
|
+
*.swp
|
|
174
|
+
*.swo
|
|
175
|
+
*~
|
|
176
|
+
|
|
177
|
+
# Test files
|
|
178
|
+
test_*.py
|
|
179
|
+
*_test.py
|
|
180
|
+
debug_*.py
|
|
181
|
+
test_js_project/
|
|
182
|
+
|
|
183
|
+
# UV specific
|
|
184
|
+
.uv/
|
|
185
|
+
|
|
186
|
+
# ChromaDB
|
|
187
|
+
chroma.sqlite3
|
|
188
|
+
chroma/
|
|
189
|
+
|
|
190
|
+
# Logs
|
|
191
|
+
*.log
|
|
192
|
+
logs/
|
|
193
|
+
|
|
194
|
+
# Backup files
|
|
195
|
+
*.bak
|
|
196
|
+
*.backup
|
|
197
|
+
|
|
198
|
+
# OS generated files
|
|
199
|
+
.directory
|
|
200
|
+
.fuse_hidden*
|
|
201
|
+
.nfs*
|
|
202
|
+
|
|
203
|
+
# JetBrains IDEs
|
|
204
|
+
.idea/
|
|
205
|
+
*.iws
|
|
206
|
+
*.iml
|
|
207
|
+
*.ipr
|
|
208
|
+
|
|
209
|
+
# Sublime Text
|
|
210
|
+
*.sublime-project
|
|
211
|
+
*.sublime-workspace
|
|
212
|
+
|
|
213
|
+
# Vim
|
|
214
|
+
*.swp
|
|
215
|
+
*.swo
|
|
216
|
+
*~
|
|
217
|
+
.netrwhist
|
|
218
|
+
|
|
219
|
+
# Emacs
|
|
220
|
+
*~
|
|
221
|
+
\#*\#
|
|
222
|
+
/.emacs.desktop
|
|
223
|
+
/.emacs.desktop.lock
|
|
224
|
+
*.elc
|
|
225
|
+
auto-save-list
|
|
226
|
+
tramp
|
|
227
|
+
.\#*
|
|
228
|
+
|
|
229
|
+
# Archive files
|
|
230
|
+
*.zip
|
|
231
|
+
*.tar.gz
|
|
232
|
+
*.rar
|
|
233
|
+
*.7z
|
|
@@ -0,0 +1,29 @@
|
|
|
1
|
+
repos:
|
|
2
|
+
- repo: https://github.com/pre-commit/pre-commit-hooks
|
|
3
|
+
rev: v4.5.0
|
|
4
|
+
hooks:
|
|
5
|
+
- id: trailing-whitespace
|
|
6
|
+
- id: end-of-file-fixer
|
|
7
|
+
- id: check-yaml
|
|
8
|
+
- id: check-added-large-files
|
|
9
|
+
- id: check-merge-conflict
|
|
10
|
+
- id: debug-statements
|
|
11
|
+
|
|
12
|
+
- repo: https://github.com/psf/black
|
|
13
|
+
rev: 23.12.1
|
|
14
|
+
hooks:
|
|
15
|
+
- id: black
|
|
16
|
+
language_version: python3.11
|
|
17
|
+
|
|
18
|
+
- repo: https://github.com/astral-sh/ruff-pre-commit
|
|
19
|
+
rev: v0.1.9
|
|
20
|
+
hooks:
|
|
21
|
+
- id: ruff
|
|
22
|
+
args: [--fix, --exit-non-zero-on-fix]
|
|
23
|
+
|
|
24
|
+
- repo: https://github.com/pre-commit/mirrors-mypy
|
|
25
|
+
rev: v1.8.0
|
|
26
|
+
hooks:
|
|
27
|
+
- id: mypy
|
|
28
|
+
additional_dependencies: [types-all]
|
|
29
|
+
args: [--strict, --ignore-missing-imports]
|
|
@@ -0,0 +1,21 @@
|
|
|
1
|
+
MIT License
|
|
2
|
+
|
|
3
|
+
Copyright (c) 2024 Robert Matsuoka
|
|
4
|
+
|
|
5
|
+
Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
6
|
+
of this software and associated documentation files (the "Software"), to deal
|
|
7
|
+
in the Software without restriction, including without limitation the rights
|
|
8
|
+
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
9
|
+
copies of the Software, and to permit persons to whom the Software is
|
|
10
|
+
furnished to do so, subject to the following conditions:
|
|
11
|
+
|
|
12
|
+
The above copyright notice and this permission notice shall be included in all
|
|
13
|
+
copies or substantial portions of the Software.
|
|
14
|
+
|
|
15
|
+
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
16
|
+
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
17
|
+
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
18
|
+
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
19
|
+
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
20
|
+
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
|
21
|
+
SOFTWARE.
|
|
@@ -0,0 +1,333 @@
|
|
|
1
|
+
Metadata-Version: 2.4
|
|
2
|
+
Name: mcp-vector-search
|
|
3
|
+
Version: 0.0.3
|
|
4
|
+
Summary: CLI-first semantic code search with MCP integration
|
|
5
|
+
Project-URL: Homepage, https://github.com/bobmatnyc/mcp-vector-search
|
|
6
|
+
Project-URL: Documentation, https://mcp-vector-search.readthedocs.io
|
|
7
|
+
Project-URL: Repository, https://github.com/bobmatnyc/mcp-vector-search
|
|
8
|
+
Project-URL: Bug Tracker, https://github.com/bobmatnyc/mcp-vector-search/issues
|
|
9
|
+
Author-email: Robert Matsuoka <bobmatnyc@gmail.com>
|
|
10
|
+
License: MIT License
|
|
11
|
+
|
|
12
|
+
Copyright (c) 2024 Robert Matsuoka
|
|
13
|
+
|
|
14
|
+
Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
15
|
+
of this software and associated documentation files (the "Software"), to deal
|
|
16
|
+
in the Software without restriction, including without limitation the rights
|
|
17
|
+
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
18
|
+
copies of the Software, and to permit persons to whom the Software is
|
|
19
|
+
furnished to do so, subject to the following conditions:
|
|
20
|
+
|
|
21
|
+
The above copyright notice and this permission notice shall be included in all
|
|
22
|
+
copies or substantial portions of the Software.
|
|
23
|
+
|
|
24
|
+
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
25
|
+
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
26
|
+
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
27
|
+
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
28
|
+
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
29
|
+
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
|
30
|
+
SOFTWARE.
|
|
31
|
+
License-File: LICENSE
|
|
32
|
+
Keywords: code-search,mcp,semantic-search,vector-database
|
|
33
|
+
Classifier: Development Status :: 3 - Alpha
|
|
34
|
+
Classifier: Intended Audience :: Developers
|
|
35
|
+
Classifier: License :: OSI Approved :: MIT License
|
|
36
|
+
Classifier: Programming Language :: Python :: 3.11
|
|
37
|
+
Classifier: Programming Language :: Python :: 3.12
|
|
38
|
+
Classifier: Topic :: Software Development :: Code Generators
|
|
39
|
+
Classifier: Topic :: Software Development :: Libraries :: Python Modules
|
|
40
|
+
Requires-Python: >=3.11
|
|
41
|
+
Requires-Dist: aiofiles>=23.0.0
|
|
42
|
+
Requires-Dist: chromadb>=0.5.0
|
|
43
|
+
Requires-Dist: httpx>=0.25.0
|
|
44
|
+
Requires-Dist: loguru>=0.7.0
|
|
45
|
+
Requires-Dist: pydantic-settings>=2.1.0
|
|
46
|
+
Requires-Dist: pydantic>=2.5.0
|
|
47
|
+
Requires-Dist: rich>=13.0.0
|
|
48
|
+
Requires-Dist: sentence-transformers>=2.2.2
|
|
49
|
+
Requires-Dist: tree-sitter-languages>=1.8.0
|
|
50
|
+
Requires-Dist: tree-sitter>=0.20.1
|
|
51
|
+
Requires-Dist: typer>=0.9.0
|
|
52
|
+
Requires-Dist: watchdog>=3.0.0
|
|
53
|
+
Description-Content-Type: text/markdown
|
|
54
|
+
|
|
55
|
+
# MCP Vector Search
|
|
56
|
+
|
|
57
|
+
🔍 **CLI-first semantic code search with MCP integration**
|
|
58
|
+
|
|
59
|
+
> ⚠️ **Alpha Release (v0.0.3)**: This is an early-stage project under active development. Expect breaking changes and rough edges. Feedback and contributions are welcome!
|
|
60
|
+
|
|
61
|
+
A modern, fast, and intelligent code search tool that understands your codebase through semantic analysis and AST parsing. Built with Python, powered by ChromaDB, and designed for developer productivity.
|
|
62
|
+
|
|
63
|
+
## ✨ Features
|
|
64
|
+
|
|
65
|
+
### 🚀 **Core Capabilities**
|
|
66
|
+
- **Semantic Search**: Find code by meaning, not just keywords
|
|
67
|
+
- **AST-Aware Parsing**: Understands code structure (functions, classes, methods)
|
|
68
|
+
- **Multi-Language Support**: Python, JavaScript, TypeScript (with extensible architecture)
|
|
69
|
+
- **Real-time Indexing**: File watching with automatic index updates
|
|
70
|
+
- **Local-First**: Complete privacy with on-device processing
|
|
71
|
+
- **Zero Configuration**: Auto-detects project structure and languages
|
|
72
|
+
|
|
73
|
+
### 🛠️ **Developer Experience**
|
|
74
|
+
- **CLI-First Design**: Simple commands for immediate productivity
|
|
75
|
+
- **Rich Output**: Syntax highlighting, similarity scores, context
|
|
76
|
+
- **Fast Performance**: Sub-second search responses, efficient indexing
|
|
77
|
+
- **Modern Architecture**: Async-first, type-safe, modular design
|
|
78
|
+
|
|
79
|
+
### 🔧 **Technical Features**
|
|
80
|
+
- **Vector Database**: ChromaDB for efficient similarity search
|
|
81
|
+
- **Embedding Models**: Configurable sentence transformers
|
|
82
|
+
- **Incremental Updates**: Smart file watching and re-indexing
|
|
83
|
+
- **Extensible Parsers**: Plugin architecture for new languages
|
|
84
|
+
- **Configuration Management**: Project-specific settings
|
|
85
|
+
|
|
86
|
+
## 🚀 Quick Start
|
|
87
|
+
|
|
88
|
+
### Installation
|
|
89
|
+
|
|
90
|
+
```bash
|
|
91
|
+
# Install with UV (recommended)
|
|
92
|
+
uv add mcp-vector-search
|
|
93
|
+
|
|
94
|
+
# Or with pip
|
|
95
|
+
pip install mcp-vector-search
|
|
96
|
+
```
|
|
97
|
+
|
|
98
|
+
### Basic Usage
|
|
99
|
+
|
|
100
|
+
```bash
|
|
101
|
+
# Initialize your project
|
|
102
|
+
mcp-vector-search init
|
|
103
|
+
|
|
104
|
+
# Index your codebase
|
|
105
|
+
mcp-vector-search index
|
|
106
|
+
|
|
107
|
+
# Search your code
|
|
108
|
+
mcp-vector-search search "authentication logic"
|
|
109
|
+
mcp-vector-search search "database connection setup"
|
|
110
|
+
mcp-vector-search search "error handling patterns"
|
|
111
|
+
|
|
112
|
+
# Check project status
|
|
113
|
+
mcp-vector-search status
|
|
114
|
+
|
|
115
|
+
# Start file watching (auto-update index)
|
|
116
|
+
mcp-vector-search watch
|
|
117
|
+
```
|
|
118
|
+
|
|
119
|
+
## 📖 Documentation
|
|
120
|
+
|
|
121
|
+
### Commands
|
|
122
|
+
|
|
123
|
+
#### `init` - Initialize Project
|
|
124
|
+
```bash
|
|
125
|
+
# Basic initialization
|
|
126
|
+
mcp-vector-search init
|
|
127
|
+
|
|
128
|
+
# Custom configuration
|
|
129
|
+
mcp-vector-search init --extensions .py,.js,.ts --embedding-model sentence-transformers/all-MiniLM-L6-v2
|
|
130
|
+
|
|
131
|
+
# Force re-initialization
|
|
132
|
+
mcp-vector-search init --force
|
|
133
|
+
```
|
|
134
|
+
|
|
135
|
+
#### `index` - Index Codebase
|
|
136
|
+
```bash
|
|
137
|
+
# Index all files
|
|
138
|
+
mcp-vector-search index
|
|
139
|
+
|
|
140
|
+
# Index specific directory
|
|
141
|
+
mcp-vector-search index /path/to/code
|
|
142
|
+
|
|
143
|
+
# Force re-indexing
|
|
144
|
+
mcp-vector-search index --force
|
|
145
|
+
```
|
|
146
|
+
|
|
147
|
+
#### `search` - Semantic Search
|
|
148
|
+
```bash
|
|
149
|
+
# Basic search
|
|
150
|
+
mcp-vector-search search "function that handles user authentication"
|
|
151
|
+
|
|
152
|
+
# Adjust similarity threshold
|
|
153
|
+
mcp-vector-search search "database queries" --threshold 0.7
|
|
154
|
+
|
|
155
|
+
# Limit results
|
|
156
|
+
mcp-vector-search search "error handling" --limit 10
|
|
157
|
+
|
|
158
|
+
# Search in specific context
|
|
159
|
+
mcp-vector-search search similar "path/to/function.py:25"
|
|
160
|
+
```
|
|
161
|
+
|
|
162
|
+
#### `watch` - File Watching
|
|
163
|
+
```bash
|
|
164
|
+
# Start watching for changes
|
|
165
|
+
mcp-vector-search watch
|
|
166
|
+
|
|
167
|
+
# Check watch status
|
|
168
|
+
mcp-vector-search watch status
|
|
169
|
+
|
|
170
|
+
# Enable/disable watching
|
|
171
|
+
mcp-vector-search watch enable
|
|
172
|
+
mcp-vector-search watch disable
|
|
173
|
+
```
|
|
174
|
+
|
|
175
|
+
#### `status` - Project Information
|
|
176
|
+
```bash
|
|
177
|
+
# Basic status
|
|
178
|
+
mcp-vector-search status
|
|
179
|
+
|
|
180
|
+
# Detailed information
|
|
181
|
+
mcp-vector-search status --verbose
|
|
182
|
+
```
|
|
183
|
+
|
|
184
|
+
#### `config` - Configuration Management
|
|
185
|
+
```bash
|
|
186
|
+
# View configuration
|
|
187
|
+
mcp-vector-search config show
|
|
188
|
+
|
|
189
|
+
# Update settings
|
|
190
|
+
mcp-vector-search config set similarity_threshold 0.8
|
|
191
|
+
mcp-vector-search config set embedding_model microsoft/codebert-base
|
|
192
|
+
|
|
193
|
+
# List available models
|
|
194
|
+
mcp-vector-search config models
|
|
195
|
+
```
|
|
196
|
+
|
|
197
|
+
### Configuration
|
|
198
|
+
|
|
199
|
+
Projects are configured via `.mcp-vector-search/config.json`:
|
|
200
|
+
|
|
201
|
+
```json
|
|
202
|
+
{
|
|
203
|
+
"project_root": "/path/to/project",
|
|
204
|
+
"file_extensions": [".py", ".js", ".ts"],
|
|
205
|
+
"embedding_model": "sentence-transformers/all-MiniLM-L6-v2",
|
|
206
|
+
"similarity_threshold": 0.75,
|
|
207
|
+
"languages": ["python", "javascript", "typescript"],
|
|
208
|
+
"watch_files": true,
|
|
209
|
+
"cache_embeddings": true
|
|
210
|
+
}
|
|
211
|
+
```
|
|
212
|
+
|
|
213
|
+
## 🏗️ Architecture
|
|
214
|
+
|
|
215
|
+
### Core Components
|
|
216
|
+
|
|
217
|
+
- **Parser Registry**: Extensible system for language-specific parsing
|
|
218
|
+
- **Semantic Indexer**: Efficient code chunking and embedding generation
|
|
219
|
+
- **Vector Database**: ChromaDB integration for similarity search
|
|
220
|
+
- **File Watcher**: Real-time monitoring and incremental updates
|
|
221
|
+
- **CLI Interface**: Rich, user-friendly command-line experience
|
|
222
|
+
|
|
223
|
+
### Supported Languages
|
|
224
|
+
|
|
225
|
+
| Language | Status | Features |
|
|
226
|
+
|------------|--------|----------|
|
|
227
|
+
| Python | ✅ Full | Functions, classes, methods, docstrings |
|
|
228
|
+
| JavaScript | ✅ Full | Functions, classes, JSDoc, ES6+ syntax |
|
|
229
|
+
| TypeScript | ✅ Full | Interfaces, types, generics, decorators |
|
|
230
|
+
| Java | 🔄 Planned | Classes, methods, annotations |
|
|
231
|
+
| Go | 🔄 Planned | Functions, structs, interfaces |
|
|
232
|
+
| Rust | 🔄 Planned | Functions, structs, traits |
|
|
233
|
+
|
|
234
|
+
## 🤝 Contributing
|
|
235
|
+
|
|
236
|
+
We welcome contributions! Please see our [Contributing Guide](CONTRIBUTING.md) for details.
|
|
237
|
+
|
|
238
|
+
### Development Setup
|
|
239
|
+
|
|
240
|
+
```bash
|
|
241
|
+
# Clone the repository
|
|
242
|
+
git clone https://github.com/bobmatnyc/mcp-vector-search.git
|
|
243
|
+
cd mcp-vector-search
|
|
244
|
+
|
|
245
|
+
# Install dependencies with UV
|
|
246
|
+
uv sync
|
|
247
|
+
|
|
248
|
+
# Install in development mode
|
|
249
|
+
uv pip install -e .
|
|
250
|
+
|
|
251
|
+
# Run tests
|
|
252
|
+
uv run pytest
|
|
253
|
+
|
|
254
|
+
# Run linting
|
|
255
|
+
uv run ruff check
|
|
256
|
+
uv run mypy src/
|
|
257
|
+
```
|
|
258
|
+
|
|
259
|
+
### Adding Language Support
|
|
260
|
+
|
|
261
|
+
1. Create a new parser in `src/mcp_vector_search/parsers/`
|
|
262
|
+
2. Extend the `BaseParser` class
|
|
263
|
+
3. Register the parser in `parsers/registry.py`
|
|
264
|
+
4. Add tests and documentation
|
|
265
|
+
|
|
266
|
+
## 📊 Performance
|
|
267
|
+
|
|
268
|
+
- **Indexing Speed**: ~1000 files/minute (typical Python project)
|
|
269
|
+
- **Search Latency**: <100ms for most queries
|
|
270
|
+
- **Memory Usage**: ~50MB baseline + ~1MB per 1000 code chunks
|
|
271
|
+
- **Storage**: ~1KB per code chunk (compressed embeddings)
|
|
272
|
+
|
|
273
|
+
## ⚠️ Known Limitations (Alpha)
|
|
274
|
+
|
|
275
|
+
- **Tree-sitter Integration**: Currently using regex fallback parsing (Tree-sitter setup needs improvement)
|
|
276
|
+
- **Search Relevance**: Embedding model may need tuning for code-specific queries
|
|
277
|
+
- **Error Handling**: Some edge cases may not be gracefully handled
|
|
278
|
+
- **Documentation**: API documentation is minimal
|
|
279
|
+
- **Testing**: Limited test coverage, needs real-world validation
|
|
280
|
+
|
|
281
|
+
## 🙏 Feedback Needed
|
|
282
|
+
|
|
283
|
+
We're actively seeking feedback on:
|
|
284
|
+
|
|
285
|
+
- **Search Quality**: How relevant are the search results for your codebase?
|
|
286
|
+
- **Performance**: How does indexing and search speed feel in practice?
|
|
287
|
+
- **Usability**: Is the CLI interface intuitive and helpful?
|
|
288
|
+
- **Language Support**: Which languages would you like to see added next?
|
|
289
|
+
- **Features**: What functionality is missing for your workflow?
|
|
290
|
+
|
|
291
|
+
Please [open an issue](https://github.com/bobmatnyc/mcp-vector-search/issues) or start a [discussion](https://github.com/bobmatnyc/mcp-vector-search/discussions) to share your experience!
|
|
292
|
+
|
|
293
|
+
## 🔮 Roadmap
|
|
294
|
+
|
|
295
|
+
### v0.0.x: Alpha (Current) 🔄
|
|
296
|
+
- [x] Core CLI interface
|
|
297
|
+
- [x] Python/JS/TS parsing
|
|
298
|
+
- [x] ChromaDB integration
|
|
299
|
+
- [x] File watching
|
|
300
|
+
- [x] Basic search functionality
|
|
301
|
+
- [ ] Real-world testing and feedback
|
|
302
|
+
- [ ] Bug fixes and stability improvements
|
|
303
|
+
- [ ] Performance optimizations
|
|
304
|
+
|
|
305
|
+
### v0.1.x: Beta 🔮
|
|
306
|
+
- [ ] Advanced search modes (contextual, similar code)
|
|
307
|
+
- [ ] Additional language support (Java, Go, Rust)
|
|
308
|
+
- [ ] Configuration improvements
|
|
309
|
+
- [ ] Comprehensive testing suite
|
|
310
|
+
- [ ] Documentation improvements
|
|
311
|
+
|
|
312
|
+
### v1.0.x: Stable 🔮
|
|
313
|
+
- [ ] MCP server implementation
|
|
314
|
+
- [ ] IDE extensions (VS Code, JetBrains)
|
|
315
|
+
- [ ] Git integration
|
|
316
|
+
- [ ] Team collaboration features
|
|
317
|
+
- [ ] Production-ready performance
|
|
318
|
+
|
|
319
|
+
## 📄 License
|
|
320
|
+
|
|
321
|
+
MIT License - see [LICENSE](LICENSE) file for details.
|
|
322
|
+
|
|
323
|
+
## 🙏 Acknowledgments
|
|
324
|
+
|
|
325
|
+
- [ChromaDB](https://github.com/chroma-core/chroma) for vector database
|
|
326
|
+
- [Tree-sitter](https://tree-sitter.github.io/) for parsing infrastructure
|
|
327
|
+
- [Sentence Transformers](https://www.sbert.net/) for embeddings
|
|
328
|
+
- [Typer](https://typer.tiangolo.com/) for CLI framework
|
|
329
|
+
- [Rich](https://rich.readthedocs.io/) for beautiful terminal output
|
|
330
|
+
|
|
331
|
+
---
|
|
332
|
+
|
|
333
|
+
**Built with ❤️ for developers who love efficient code search**
|