vexor 0.20.0__py3-none-any.whl → 0.21.1__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- vexor/__init__.py +1 -1
- vexor/api.py +26 -0
- vexor/cache.py +525 -286
- vexor/cli.py +53 -0
- vexor/config.py +54 -1
- vexor/providers/gemini.py +79 -13
- vexor/providers/openai.py +79 -13
- vexor/services/config_service.py +14 -0
- vexor/services/index_service.py +132 -5
- vexor/services/search_service.py +94 -27
- vexor/text.py +10 -0
- {vexor-0.20.0.dist-info → vexor-0.21.1.dist-info}/METADATA +15 -13
- {vexor-0.20.0.dist-info → vexor-0.21.1.dist-info}/RECORD +16 -16
- {vexor-0.20.0.dist-info → vexor-0.21.1.dist-info}/WHEEL +0 -0
- {vexor-0.20.0.dist-info → vexor-0.21.1.dist-info}/entry_points.txt +0 -0
- {vexor-0.20.0.dist-info → vexor-0.21.1.dist-info}/licenses/LICENSE +0 -0
vexor/__init__.py
CHANGED
vexor/api.py
CHANGED
|
@@ -42,6 +42,8 @@ class RuntimeSettings:
|
|
|
42
42
|
model_name: str
|
|
43
43
|
batch_size: int
|
|
44
44
|
embed_concurrency: int
|
|
45
|
+
extract_concurrency: int
|
|
46
|
+
extract_backend: str
|
|
45
47
|
base_url: str | None
|
|
46
48
|
api_key: str | None
|
|
47
49
|
local_cuda: bool
|
|
@@ -90,6 +92,8 @@ def search(
|
|
|
90
92
|
model: str | None = None,
|
|
91
93
|
batch_size: int | None = None,
|
|
92
94
|
embed_concurrency: int | None = None,
|
|
95
|
+
extract_concurrency: int | None = None,
|
|
96
|
+
extract_backend: str | None = None,
|
|
93
97
|
base_url: str | None = None,
|
|
94
98
|
api_key: str | None = None,
|
|
95
99
|
local_cuda: bool | None = None,
|
|
@@ -121,6 +125,8 @@ def search(
|
|
|
121
125
|
model=model,
|
|
122
126
|
batch_size=batch_size,
|
|
123
127
|
embed_concurrency=embed_concurrency,
|
|
128
|
+
extract_concurrency=extract_concurrency,
|
|
129
|
+
extract_backend=extract_backend,
|
|
124
130
|
base_url=base_url,
|
|
125
131
|
api_key=api_key,
|
|
126
132
|
local_cuda=local_cuda,
|
|
@@ -141,6 +147,8 @@ def search(
|
|
|
141
147
|
model_name=settings.model_name,
|
|
142
148
|
batch_size=settings.batch_size,
|
|
143
149
|
embed_concurrency=settings.embed_concurrency,
|
|
150
|
+
extract_concurrency=settings.extract_concurrency,
|
|
151
|
+
extract_backend=settings.extract_backend,
|
|
144
152
|
provider=settings.provider,
|
|
145
153
|
base_url=settings.base_url,
|
|
146
154
|
api_key=settings.api_key,
|
|
@@ -170,6 +178,8 @@ def index(
|
|
|
170
178
|
model: str | None = None,
|
|
171
179
|
batch_size: int | None = None,
|
|
172
180
|
embed_concurrency: int | None = None,
|
|
181
|
+
extract_concurrency: int | None = None,
|
|
182
|
+
extract_backend: str | None = None,
|
|
173
183
|
base_url: str | None = None,
|
|
174
184
|
api_key: str | None = None,
|
|
175
185
|
local_cuda: bool | None = None,
|
|
@@ -190,6 +200,8 @@ def index(
|
|
|
190
200
|
model=model,
|
|
191
201
|
batch_size=batch_size,
|
|
192
202
|
embed_concurrency=embed_concurrency,
|
|
203
|
+
extract_concurrency=extract_concurrency,
|
|
204
|
+
extract_backend=extract_backend,
|
|
193
205
|
base_url=base_url,
|
|
194
206
|
api_key=api_key,
|
|
195
207
|
local_cuda=local_cuda,
|
|
@@ -208,6 +220,8 @@ def index(
|
|
|
208
220
|
model_name=settings.model_name,
|
|
209
221
|
batch_size=settings.batch_size,
|
|
210
222
|
embed_concurrency=settings.embed_concurrency,
|
|
223
|
+
extract_concurrency=settings.extract_concurrency,
|
|
224
|
+
extract_backend=settings.extract_backend,
|
|
211
225
|
provider=settings.provider,
|
|
212
226
|
base_url=settings.base_url,
|
|
213
227
|
api_key=settings.api_key,
|
|
@@ -282,6 +296,8 @@ def _resolve_settings(
|
|
|
282
296
|
model: str | None,
|
|
283
297
|
batch_size: int | None,
|
|
284
298
|
embed_concurrency: int | None,
|
|
299
|
+
extract_concurrency: int | None,
|
|
300
|
+
extract_backend: str | None,
|
|
285
301
|
base_url: str | None,
|
|
286
302
|
api_key: str | None,
|
|
287
303
|
local_cuda: bool | None,
|
|
@@ -313,11 +329,21 @@ def _resolve_settings(
|
|
|
313
329
|
embed_value = (
|
|
314
330
|
embed_concurrency if embed_concurrency is not None else config.embed_concurrency
|
|
315
331
|
)
|
|
332
|
+
extract_value = (
|
|
333
|
+
extract_concurrency
|
|
334
|
+
if extract_concurrency is not None
|
|
335
|
+
else config.extract_concurrency
|
|
336
|
+
)
|
|
337
|
+
extract_backend_value = (
|
|
338
|
+
extract_backend if extract_backend is not None else config.extract_backend
|
|
339
|
+
)
|
|
316
340
|
return RuntimeSettings(
|
|
317
341
|
provider=provider_value,
|
|
318
342
|
model_name=model_name,
|
|
319
343
|
batch_size=batch_value,
|
|
320
344
|
embed_concurrency=embed_value,
|
|
345
|
+
extract_concurrency=extract_value,
|
|
346
|
+
extract_backend=extract_backend_value,
|
|
321
347
|
base_url=base_url if base_url is not None else config.base_url,
|
|
322
348
|
api_key=api_key if api_key is not None else config.api_key,
|
|
323
349
|
local_cuda=bool(local_cuda if local_cuda is not None else config.local_cuda),
|