trelix-langchain 0.5.0__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- trelix_langchain-0.5.0/.gitignore +58 -0
- trelix_langchain-0.5.0/LICENSE +21 -0
- trelix_langchain-0.5.0/PKG-INFO +9 -0
- trelix_langchain-0.5.0/pyproject.toml +16 -0
- trelix_langchain-0.5.0/src/trelix_langchain/__init__.py +4 -0
- trelix_langchain-0.5.0/src/trelix_langchain/retriever.py +49 -0
- trelix_langchain-0.5.0/tests/__init__.py +0 -0
- trelix_langchain-0.5.0/tests/test_retriever.py +218 -0
|
@@ -0,0 +1,58 @@
|
|
|
1
|
+
# Python
|
|
2
|
+
__pycache__/
|
|
3
|
+
*.pyc
|
|
4
|
+
*.pyo
|
|
5
|
+
*.pyd
|
|
6
|
+
.Python
|
|
7
|
+
*.egg-info/
|
|
8
|
+
*.egg
|
|
9
|
+
build/
|
|
10
|
+
.eggs/
|
|
11
|
+
pip-wheel-metadata/
|
|
12
|
+
|
|
13
|
+
# dist/ — ignore generated packaging artefacts; binaries are attached via GitHub Releases.
|
|
14
|
+
dist/
|
|
15
|
+
|
|
16
|
+
# Virtual environments
|
|
17
|
+
.venv/
|
|
18
|
+
venv/
|
|
19
|
+
env/
|
|
20
|
+
ENV/
|
|
21
|
+
|
|
22
|
+
# Trelix index data — never commit these
|
|
23
|
+
.trelix/
|
|
24
|
+
|
|
25
|
+
# Test / coverage artefacts
|
|
26
|
+
.pytest_cache/
|
|
27
|
+
.coverage
|
|
28
|
+
htmlcov/
|
|
29
|
+
.tox/
|
|
30
|
+
|
|
31
|
+
# Ruff / Mypy caches
|
|
32
|
+
.ruff_cache/
|
|
33
|
+
.mypy_cache/
|
|
34
|
+
|
|
35
|
+
# Environment files — secrets must not be committed
|
|
36
|
+
.env
|
|
37
|
+
.env.local
|
|
38
|
+
.env.*.local
|
|
39
|
+
|
|
40
|
+
# Claude Code internal data
|
|
41
|
+
.claude/
|
|
42
|
+
|
|
43
|
+
# uv lockfile (not committed — project uses pip/hatchling)
|
|
44
|
+
uv.lock
|
|
45
|
+
|
|
46
|
+
# Editor / OS
|
|
47
|
+
.DS_Store
|
|
48
|
+
.idea/
|
|
49
|
+
.vscode/
|
|
50
|
+
*.swp
|
|
51
|
+
*.swo
|
|
52
|
+
Thumbs.db
|
|
53
|
+
|
|
54
|
+
# Distribution / packaging
|
|
55
|
+
*.tar.gz
|
|
56
|
+
*.whl
|
|
57
|
+
MANIFEST
|
|
58
|
+
.superpowers/
|
|
@@ -0,0 +1,21 @@
|
|
|
1
|
+
MIT License
|
|
2
|
+
|
|
3
|
+
Copyright (c) 2025 Trelix Contributors
|
|
4
|
+
|
|
5
|
+
Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
6
|
+
of this software and associated documentation files (the "Software"), to deal
|
|
7
|
+
in the Software without restriction, including without limitation the rights
|
|
8
|
+
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
|
9
|
+
copies of the Software, and to permit persons to whom the Software is
|
|
10
|
+
furnished to do so, subject to the following conditions:
|
|
11
|
+
|
|
12
|
+
The above copyright notice and this permission notice shall be included in all
|
|
13
|
+
copies or substantial portions of the Software.
|
|
14
|
+
|
|
15
|
+
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
16
|
+
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
17
|
+
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
18
|
+
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
19
|
+
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
20
|
+
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
|
21
|
+
SOFTWARE.
|
|
@@ -0,0 +1,9 @@
|
|
|
1
|
+
Metadata-Version: 2.4
|
|
2
|
+
Name: trelix-langchain
|
|
3
|
+
Version: 0.5.0
|
|
4
|
+
Summary: LangChain retriever for trelix code intelligence
|
|
5
|
+
Project-URL: Homepage, https://github.com/sairam0424/trelix
|
|
6
|
+
License-File: LICENSE
|
|
7
|
+
Requires-Python: >=3.11
|
|
8
|
+
Requires-Dist: langchain-core>=0.1.0
|
|
9
|
+
Requires-Dist: trelix>=0.4.0
|
|
@@ -0,0 +1,16 @@
|
|
|
1
|
+
[build-system]
|
|
2
|
+
requires = ["hatchling"]
|
|
3
|
+
build-backend = "hatchling.build"
|
|
4
|
+
|
|
5
|
+
[tool.hatch.build.targets.wheel]
|
|
6
|
+
packages = ["src/trelix_langchain"]
|
|
7
|
+
|
|
8
|
+
[project]
|
|
9
|
+
name = "trelix-langchain"
|
|
10
|
+
version = "0.5.0"
|
|
11
|
+
description = "LangChain retriever for trelix code intelligence"
|
|
12
|
+
requires-python = ">=3.11"
|
|
13
|
+
dependencies = ["trelix>=0.4.0", "langchain-core>=0.1.0"]
|
|
14
|
+
|
|
15
|
+
[project.urls]
|
|
16
|
+
Homepage = "https://github.com/sairam0424/trelix"
|
|
@@ -0,0 +1,49 @@
|
|
|
1
|
+
from langchain_core.callbacks import CallbackManagerForRetrieverRun
|
|
2
|
+
from langchain_core.documents import Document
|
|
3
|
+
from langchain_core.retrievers import BaseRetriever
|
|
4
|
+
|
|
5
|
+
|
|
6
|
+
class TrelixRetriever(BaseRetriever):
    """LangChain retriever backed by a trelix ``Retriever``.

    For every query a trelix ``Retriever`` is built from ``repo_path`` and
    ``provider``, asked to ``retrieve`` the query, and at most ``k`` of the
    returned results are converted into LangChain ``Document`` objects.
    """

    # Repository path passed to trelix's ``IndexConfig``.
    repo_path: str
    # Embedder provider name passed to trelix's ``EmbedderConfig``.
    provider: str = "local"
    # Upper bound on the number of documents returned per query.
    k: int = 10

    def _get_trelix_retriever(self):
        """Build a trelix ``Retriever`` configured from this instance's fields."""
        # Function-scope imports: trelix is only imported when a retriever is
        # actually built, not when this module is imported.
        from typing import Literal, cast

        from trelix.core.config import EmbedderConfig, IndexConfig
        from trelix.retrieval.retriever import Retriever

        # ``cast`` only narrows the type for static checkers; it performs no
        # runtime validation of the provider string.
        provider = cast(
            Literal["openai", "azure", "local", "voyage", "local-code"],
            self.provider,
        )
        config = IndexConfig(
            repo_path=self.repo_path,
            embedder=EmbedderConfig(provider=provider),
        )
        return Retriever(config)

    def _get_relevant_documents(
        self,
        query: str,
        *,
        run_manager: CallbackManagerForRetrieverRun,
    ) -> list[Document]:
        """Return up to ``k`` documents for *query*.

        Args:
            query: Text forwarded unchanged to the trelix retriever.
            run_manager: Callback manager supplied by LangChain; not used here.

        Returns:
            One ``Document`` per retained result. ``page_content`` is the
            symbol body; ``metadata`` carries ``source``, ``symbol``,
            ``language``, ``kind``, ``lines`` (``"<start>-<end>"``), ``score``
            and ``retrieval_source``. Empty when ``k`` is zero or negative.
        """
        # A negative ``k`` used as a slice bound would drop results from the
        # tail instead of returning none, so treat every non-positive ``k`` as
        # "no documents" and skip building/querying the trelix retriever.
        if self.k <= 0:
            return []

        ctx = self._get_trelix_retriever().retrieve(query)
        return [
            Document(
                page_content=r.symbol.body,
                metadata={
                    "source": r.file.rel_path,
                    "symbol": r.symbol.qualified_name,
                    "language": r.file.language.value,
                    "kind": r.symbol.kind.value,
                    "lines": f"{r.symbol.line_start!s}-{r.symbol.line_end!s}",
                    "score": r.score,
                    "retrieval_source": r.source,
                },
            )
            for r in ctx.results[: self.k]
        ]
|
|
File without changes
|
|
@@ -0,0 +1,218 @@
|
|
|
1
|
+
"""
|
|
2
|
+
Tests for TrelixRetriever.
|
|
3
|
+
|
|
4
|
+
Strategy:
|
|
5
|
+
- Import / subclass checks run without any trelix index on disk.
|
|
6
|
+
- Functional tests mock out trelix internals so they stay fast and hermetic.
|
|
7
|
+
"""
|
|
8
|
+
|
|
9
|
+
from __future__ import annotations
|
|
10
|
+
|
|
11
|
+
from dataclasses import dataclass, field
|
|
12
|
+
from unittest.mock import MagicMock
|
|
13
|
+
|
|
14
|
+
import pytest
|
|
15
|
+
from langchain_core.documents import Document
|
|
16
|
+
from langchain_core.retrievers import BaseRetriever
|
|
17
|
+
from trelix_langchain import TrelixRetriever
|
|
18
|
+
|
|
19
|
+
# ---------------------------------------------------------------------------
|
|
20
|
+
# Helpers — minimal stubs that mimic trelix data-model shapes
|
|
21
|
+
# ---------------------------------------------------------------------------
|
|
22
|
+
|
|
23
|
+
|
|
24
|
+
@dataclass
class _Language:
    """Stub for the object read as ``file.language``; only ``value`` is provided."""

    value: str = "python"
|
|
27
|
+
|
|
28
|
+
|
|
29
|
+
@dataclass
class _SymbolKind:
    """Stub for the object read as ``symbol.kind``; only ``value`` is provided."""

    value: str = "function"
|
|
32
|
+
|
|
33
|
+
|
|
34
|
+
@dataclass
class _Symbol:
    """Stub symbol carrying the attributes the retriever reads from ``result.symbol``."""

    body: str = "def hello(): pass"
    qualified_name: str = "mymodule.hello"
    # A fresh ``_SymbolKind`` per instance rather than a shared default object.
    kind: _SymbolKind = field(default_factory=_SymbolKind)
    line_start: int = 1
    line_end: int = 3
|
|
41
|
+
|
|
42
|
+
|
|
43
|
+
@dataclass
class _File:
    """Stub file record carrying the attributes the retriever reads from ``result.file``."""

    rel_path: str = "src/mymodule.py"
    # A fresh ``_Language`` per instance rather than a shared default object.
    language: _Language = field(default_factory=_Language)
|
|
47
|
+
|
|
48
|
+
|
|
49
|
+
@dataclass
class _SearchResult:
    """Stub search hit: a symbol, its file, a score and the retrieval source label."""

    symbol: _Symbol = field(default_factory=_Symbol)
    file: _File = field(default_factory=_File)
    score: float = 0.95
    source: str = "vector"
|
|
55
|
+
|
|
56
|
+
|
|
57
|
+
@dataclass
class _RetrievedContext:
    """Stub for the value returned by ``retrieve``; exposes only ``results``."""

    # No default: callers must pass the list of results explicitly.
    results: list
|
|
60
|
+
|
|
61
|
+
|
|
62
|
+
def _make_context(n: int = 3) -> _RetrievedContext:
    """Build a fake retrieved context holding *n* default search results."""
    fake_results = []
    for _ in range(n):
        fake_results.append(_SearchResult())
    return _RetrievedContext(results=fake_results)
|
|
65
|
+
|
|
66
|
+
|
|
67
|
+
# ---------------------------------------------------------------------------
|
|
68
|
+
# 1. Importability
|
|
69
|
+
# ---------------------------------------------------------------------------
|
|
70
|
+
|
|
71
|
+
|
|
72
|
+
def test_import_trelix_retriever():
    """The package root must export the same ``TrelixRetriever`` object."""
    from trelix_langchain import TrelixRetriever as reimported  # noqa: F401

    assert reimported is TrelixRetriever
|
|
77
|
+
|
|
78
|
+
|
|
79
|
+
def test_version_exposed():
    """``__version__`` must exist and agree with the installed distribution.

    The previous hard-coded expectation ("0.4.0") disagreed with the version
    declared in the package metadata (0.5.0). Comparing against the installed
    distribution's metadata keeps the check correct across releases.
    """
    from importlib.metadata import PackageNotFoundError, version

    import trelix_langchain

    assert hasattr(trelix_langchain, "__version__")
    try:
        expected = version("trelix-langchain")
    except PackageNotFoundError:
        # Running from a source tree without an installed distribution:
        # there is no metadata to compare against.
        pytest.skip("trelix-langchain distribution metadata is not installed")
    assert trelix_langchain.__version__ == expected
|
|
84
|
+
|
|
85
|
+
|
|
86
|
+
# ---------------------------------------------------------------------------
|
|
87
|
+
# 2. BaseRetriever subclass
|
|
88
|
+
# ---------------------------------------------------------------------------
|
|
89
|
+
|
|
90
|
+
|
|
91
|
+
def test_is_base_retriever_subclass():
    """``TrelixRetriever`` must derive from LangChain's ``BaseRetriever``."""
    derives_from_base = issubclass(TrelixRetriever, BaseRetriever)
    assert derives_from_base
|
|
93
|
+
|
|
94
|
+
|
|
95
|
+
def test_instantiation_sets_fields():
    """Constructor keyword arguments are stored on the matching fields."""
    retriever = TrelixRetriever(repo_path="/tmp/repo", provider="openai", k=5)
    stored = (retriever.repo_path, retriever.provider, retriever.k)
    assert stored == ("/tmp/repo", "openai", 5)
|
|
100
|
+
|
|
101
|
+
|
|
102
|
+
def test_default_field_values():
    """Omitted fields fall back to ``provider="local"`` and ``k=10``."""
    retriever = TrelixRetriever(repo_path="/tmp/repo")
    assert (retriever.provider, retriever.k) == ("local", 10)
|
|
106
|
+
|
|
107
|
+
|
|
108
|
+
# ---------------------------------------------------------------------------
|
|
109
|
+
# 3. invoke() / _get_relevant_documents() returns Documents with correct metadata
|
|
110
|
+
# ---------------------------------------------------------------------------
|
|
111
|
+
|
|
112
|
+
|
|
113
|
+
def _make_retriever_with_mock(k: int = 10, n_results: int = 3) -> TrelixRetriever:
    """Build a ``TrelixRetriever`` whose inner trelix retriever is a mock.

    The mock's ``retrieve`` returns a fake context with *n_results* results,
    so no trelix index is needed.
    """
    fake_inner = MagicMock()
    fake_inner.retrieve.return_value = _make_context(n_results)

    retriever = TrelixRetriever(repo_path="/tmp/fake-repo", k=k)
    # Replace the factory on this instance only, so the real trelix retriever
    # is never constructed.
    retriever._get_trelix_retriever = lambda: fake_inner  # type: ignore[method-assign]
    return retriever
|
|
120
|
+
|
|
121
|
+
|
|
122
|
+
def test_invoke_returns_list_of_documents():
    """``invoke`` returns a list with one ``Document`` per mocked result."""
    retriever = _make_retriever_with_mock()
    documents = retriever.invoke("find hello function")
    assert isinstance(documents, list)
    assert len(documents) == 3
    for doc in documents:
        assert isinstance(doc, Document)
|
|
128
|
+
|
|
129
|
+
|
|
130
|
+
def test_document_page_content_is_symbol_body():
    """``page_content`` carries the stub symbol's body text."""
    first_doc = _make_retriever_with_mock().invoke("hello")[0]
    assert first_doc.page_content == "def hello(): pass"
|
|
134
|
+
|
|
135
|
+
|
|
136
|
+
def test_document_metadata_source():
    """``metadata["source"]`` is the stub file's relative path."""
    first_doc = _make_retriever_with_mock().invoke("hello")[0]
    assert first_doc.metadata["source"] == "src/mymodule.py"
|
|
140
|
+
|
|
141
|
+
|
|
142
|
+
def test_document_metadata_symbol():
    """``metadata["symbol"]`` is the stub symbol's qualified name."""
    first_doc = _make_retriever_with_mock().invoke("hello")[0]
    assert first_doc.metadata["symbol"] == "mymodule.hello"
|
|
146
|
+
|
|
147
|
+
|
|
148
|
+
def test_document_metadata_language():
    """``metadata["language"]`` is the stub language's ``value``."""
    first_doc = _make_retriever_with_mock().invoke("hello")[0]
    assert first_doc.metadata["language"] == "python"
|
|
152
|
+
|
|
153
|
+
|
|
154
|
+
def test_document_metadata_kind():
    """``metadata["kind"]`` is the stub symbol kind's ``value``."""
    first_doc = _make_retriever_with_mock().invoke("hello")[0]
    assert first_doc.metadata["kind"] == "function"
|
|
158
|
+
|
|
159
|
+
|
|
160
|
+
def test_document_metadata_lines():
    """``metadata["lines"]`` is formatted as ``"<line_start>-<line_end>"``."""
    first_doc = _make_retriever_with_mock().invoke("hello")[0]
    assert first_doc.metadata["lines"] == "1-3"
|
|
164
|
+
|
|
165
|
+
|
|
166
|
+
def test_document_metadata_score():
    """``metadata["score"]`` carries the stub result's score."""
    first_doc = _make_retriever_with_mock().invoke("hello")[0]
    # Approximate comparison because the score is a float.
    assert first_doc.metadata["score"] == pytest.approx(0.95)
|
|
170
|
+
|
|
171
|
+
|
|
172
|
+
def test_document_metadata_retrieval_source():
    """``metadata["retrieval_source"]`` carries the stub result's ``source``."""
    first_doc = _make_retriever_with_mock().invoke("hello")[0]
    assert first_doc.metadata["retrieval_source"] == "vector"
|
|
176
|
+
|
|
177
|
+
|
|
178
|
+
# ---------------------------------------------------------------------------
|
|
179
|
+
# 4. k limits number of returned documents
|
|
180
|
+
# ---------------------------------------------------------------------------
|
|
181
|
+
|
|
182
|
+
|
|
183
|
+
def test_k_limits_results_when_fewer_available():
    """With k=5 and only 3 results available, all 3 are returned."""
    retriever = _make_retriever_with_mock(k=5, n_results=3)
    documents = retriever.invoke("query")
    assert len(documents) == 3
|
|
188
|
+
|
|
189
|
+
|
|
190
|
+
def test_k_limits_results_when_more_available():
    """With k=2 and 5 results available, exactly 2 are returned."""
    retriever = _make_retriever_with_mock(k=2, n_results=5)
    documents = retriever.invoke("query")
    assert len(documents) == 2
|
|
195
|
+
|
|
196
|
+
|
|
197
|
+
def test_k_equals_zero_returns_empty():
    """With k=0 nothing is returned even though results are available."""
    retriever = _make_retriever_with_mock(k=0, n_results=5)
    documents = retriever.invoke("query")
    assert documents == []
|
|
201
|
+
|
|
202
|
+
|
|
203
|
+
def test_k_default_ten_limits_large_result_set():
    """With k=10 and 15 results available, the output is capped at 10."""
    retriever = _make_retriever_with_mock(k=10, n_results=15)
    documents = retriever.invoke("query")
    assert len(documents) == 10
|
|
208
|
+
|
|
209
|
+
|
|
210
|
+
# ---------------------------------------------------------------------------
|
|
211
|
+
# 5. Empty results
|
|
212
|
+
# ---------------------------------------------------------------------------
|
|
213
|
+
|
|
214
|
+
|
|
215
|
+
def test_empty_results_returns_empty_list():
    """An empty result set from the inner retriever yields an empty list."""
    retriever = _make_retriever_with_mock(k=10, n_results=0)
    documents = retriever.invoke("nothing here")
    assert documents == []
|