mb-rag 1.1.37__py3-none-any.whl → 1.1.39__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of mb-rag might be problematic. Click here for more details.
- mb_rag/rag/embeddings.py +12 -7
- mb_rag/version.py +1 -1
- {mb_rag-1.1.37.dist-info → mb_rag-1.1.39.dist-info}/METADATA +1 -1
- {mb_rag-1.1.37.dist-info → mb_rag-1.1.39.dist-info}/RECORD +6 -6
- {mb_rag-1.1.37.dist-info → mb_rag-1.1.39.dist-info}/WHEEL +0 -0
- {mb_rag-1.1.37.dist-info → mb_rag-1.1.39.dist-info}/top_level.txt +0 -0
mb_rag/rag/embeddings.py
CHANGED
|
@@ -325,7 +325,8 @@ class embedding_generator:
|
|
|
325
325
|
# Initialize generator
|
|
326
326
|
gen = embedding_generator(
|
|
327
327
|
model="openai",
|
|
328
|
-
model_type="text-embedding-3-small"
|
|
328
|
+
model_type="text-embedding-3-small",
|
|
329
|
+
collection_name='test'
|
|
329
330
|
)
|
|
330
331
|
|
|
331
332
|
# Generate embeddings
|
|
@@ -335,7 +336,7 @@ class embedding_generator:
|
|
|
335
336
|
)
|
|
336
337
|
|
|
337
338
|
# Load retriever
|
|
338
|
-
retriever = gen.load_retriever('./embeddings')
|
|
339
|
+
retriever = gen.load_retriever('./embeddings', collection_name='test')
|
|
339
340
|
|
|
340
341
|
# Query embeddings
|
|
341
342
|
results = gen.query_embeddings("What is this about?")
|
|
@@ -430,12 +431,13 @@ class embedding_generator:
|
|
|
430
431
|
else:
|
|
431
432
|
return "Vector store not found"
|
|
432
433
|
|
|
433
|
-
def load_embeddings(self, embeddings_folder_path: str):
|
|
434
|
+
def load_embeddings(self, embeddings_folder_path: str,collection_name: str = 'test'):
|
|
434
435
|
"""
|
|
435
436
|
Load embeddings from folder.
|
|
436
437
|
|
|
437
438
|
Args:
|
|
438
439
|
embeddings_folder_path (str): Path to embeddings folder
|
|
440
|
+
collection_name (str): Name of the collection. Default: 'test'
|
|
439
441
|
|
|
440
442
|
Returns:
|
|
441
443
|
Optional[Chroma]: Loaded vector store or None if not found
|
|
@@ -443,7 +445,8 @@ class embedding_generator:
|
|
|
443
445
|
if self.check_file(embeddings_folder_path):
|
|
444
446
|
if self.vector_store_type == 'chroma':
|
|
445
447
|
return Chroma(persist_directory=embeddings_folder_path,
|
|
446
|
-
embedding_function=self.model
|
|
448
|
+
embedding_function=self.model,
|
|
449
|
+
collection_name=collection_name)
|
|
447
450
|
else:
|
|
448
451
|
if self.logger:
|
|
449
452
|
self.logger.info("Embeddings file not found")
|
|
@@ -451,7 +454,8 @@ class embedding_generator:
|
|
|
451
454
|
|
|
452
455
|
def load_retriever(self, embeddings_folder_path: str,
|
|
453
456
|
search_type: List[str] = ["similarity_score_threshold"],
|
|
454
|
-
search_params: List[Dict] = [{"k": 3, "score_threshold": 0.9}]
|
|
457
|
+
search_params: List[Dict] = [{"k": 3, "score_threshold": 0.9}],
|
|
458
|
+
collection_name: str = 'test'):
|
|
455
459
|
"""
|
|
456
460
|
Load retriever with search configuration.
|
|
457
461
|
|
|
@@ -459,6 +463,7 @@ class embedding_generator:
|
|
|
459
463
|
embeddings_folder_path (str): Path to embeddings folder
|
|
460
464
|
search_type (List[str]): List of search types
|
|
461
465
|
search_params (List[Dict]): List of search parameters
|
|
466
|
+
collection_name (str): Name of the collection. Default: 'test'
|
|
462
467
|
|
|
463
468
|
Returns:
|
|
464
469
|
Union[Any, List[Any]]: Single retriever or list of retrievers
|
|
@@ -472,7 +477,7 @@ class embedding_generator:
|
|
|
472
477
|
)
|
|
473
478
|
```
|
|
474
479
|
"""
|
|
475
|
-
db = self.load_embeddings(embeddings_folder_path)
|
|
480
|
+
db = self.load_embeddings(embeddings_folder_path, collection_name)
|
|
476
481
|
if db is not None:
|
|
477
482
|
if self.vector_store_type == 'chroma':
|
|
478
483
|
if len(search_type) != len(search_params):
|
|
@@ -508,7 +513,7 @@ class embedding_generator:
|
|
|
508
513
|
chunk_overlap (int): Overlap between chunks
|
|
509
514
|
"""
|
|
510
515
|
if self.vector_store_type == 'chroma':
|
|
511
|
-
db = self.load_embeddings(embeddings_folder_path)
|
|
516
|
+
db = self.load_embeddings(embeddings_folder_path, collection_name)
|
|
512
517
|
if db is not None:
|
|
513
518
|
docs = self.tokenize(data, text_splitter_type, chunk_size, chunk_overlap)
|
|
514
519
|
db.add_documents(docs)
|
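mb_rag/version.py
CHANGED
(diff body for this file was not captured in this extract)
{mb_rag-1.1.37.dist-info → mb_rag-1.1.39.dist-info}/RECORD
CHANGED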
|
@@ -1,17 +1,17 @@
|
|
|
1
1
|
mb_rag/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
2
|
-
mb_rag/version.py,sha256=
|
|
2
|
+
mb_rag/version.py,sha256=HcQVlfDNzK6DIr0RRqDVdD0Tb_es_b1S3Ta7qd1VAWE,207
|
|
3
3
|
mb_rag/chatbot/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
4
4
|
mb_rag/chatbot/basic.py,sha256=wZ9rZvLtNEZPhaAFkOv0yaPCYiki9goNr77Pyqwfn5g,23139
|
|
5
5
|
mb_rag/chatbot/chains.py,sha256=vDbLX5R29sWN1pcFqJ5fyxJEgMCM81JAikunAEvMC9A,7223
|
|
6
6
|
mb_rag/chatbot/prompts.py,sha256=n1PyiLbU-5fkslRv6aVOzt0dDlwya_cEdQ7kRnRhMuY,1749
|
|
7
7
|
mb_rag/rag/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
8
|
-
mb_rag/rag/embeddings.py,sha256=
|
|
8
|
+
mb_rag/rag/embeddings.py,sha256=MhxG0n7Q0XwPGYIRjCpbSZTlZLyj6Shxo64n347BEWA,27497
|
|
9
9
|
mb_rag/utils/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
|
10
10
|
mb_rag/utils/bounding_box.py,sha256=G0hdDam8QmYtD9lfwMeDHGm-TTo6KZg-yK5ESFL9zaM,8366
|
|
11
11
|
mb_rag/utils/document_extract.py,sha256=vZiFB1RYm1BIEaNA0MveJ5Zp-KEi0ngKjW8xEdtPqXA,12558
|
|
12
12
|
mb_rag/utils/extra.py,sha256=spbFrGgdruNyYQ5PzgvpSIa6Nm0rn9bb4qc8W9g582o,2492
|
|
13
13
|
mb_rag/utils/pdf_extract.py,sha256=cVeMyhnAU4XZxjIZHKMYhrktTjUNOjhx2r_LZKReOZE,15598
|
|
14
|
-
mb_rag-1.1.
|
|
15
|
-
mb_rag-1.1.
|
|
16
|
-
mb_rag-1.1.
|
|
17
|
-
mb_rag-1.1.
|
|
14
|
+
mb_rag-1.1.39.dist-info/METADATA,sha256=MlnqdDCIR0P88B8EiNDnjQQCrI4BMT-5pm1Dlu9B3Og,234
|
|
15
|
+
mb_rag-1.1.39.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
|
|
16
|
+
mb_rag-1.1.39.dist-info/top_level.txt,sha256=FIK1eAa5uYnurgXZquBG-s3PIy-HDTC5yJBW4lTH_pM,7
|
|
17
|
+
mb_rag-1.1.39.dist-info/RECORD,,
|
|
File without changes
|
|
File without changes
|