ddi-fw 0.0.242__tar.gz → 0.0.243__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/PKG-INFO +1 -1
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/pyproject.toml +1 -1
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw/langchain/chroma_storage.py +5 -5
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw/langchain/faiss_storage.py +7 -4
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw.egg-info/PKG-INFO +1 -1
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/README.md +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/setup.cfg +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw/datasets/__init__.py +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw/datasets/core.py +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw/datasets/dataset_splitter.py +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw/datasets/db_utils.py +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw/datasets/setup_._py +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw/langchain/__init__.py +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw/langchain/embeddings.py +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw/langchain/sentence_splitter.py +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw/langchain/storage.py +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw/ml/__init__.py +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw/ml/evaluation_helper.py +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw/ml/ml_helper.py +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw/ml/model_wrapper.py +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw/ml/pytorch_wrapper.py +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw/ml/tensorflow_wrapper.py +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw/ml/tracking_service.py +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw/ner/__init__.py +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw/ner/mmlrestclient.py +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw/ner/ner.py +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw/pipeline/__init__.py +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw/pipeline/multi_modal_combination_strategy.py +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw/pipeline/multi_pipeline.py +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw/pipeline/multi_pipeline_org.py +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw/pipeline/ner_pipeline.py +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw/pipeline/pipeline.py +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw/utils/__init__.py +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw/utils/categorical_data_encoding_checker.py +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw/utils/enums.py +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw/utils/json_helper.py +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw/utils/kaggle.py +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw/utils/numpy_utils.py +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw/utils/package_helper.py +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw/utils/py7zr_helper.py +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw/utils/utils.py +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw/utils/zip_helper.py +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw/vectorization/__init__.py +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw/vectorization/feature_vector_generation.py +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw/vectorization/idf_helper.py +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw.egg-info/SOURCES.txt +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw.egg-info/dependency_links.txt +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw.egg-info/requires.txt +0 -0
- {ddi_fw-0.0.242 → ddi_fw-0.0.243}/src/ddi_fw.egg-info/top_level.txt +0 -0
@@ -89,12 +89,12 @@ class ChromaVectorStoreManager(BaseVectorStoreManager):
|
|
89
89
|
persist_directory: str = Field(default="./chroma_db")
|
90
90
|
text_splitter: Optional[TextSplitter] = None
|
91
91
|
batch_size: int = Field(default=1024)
|
92
|
+
vector_store: Optional[Chroma] | None = None
|
92
93
|
|
93
94
|
class Config:
|
94
95
|
arbitrary_types_allowed = True
|
95
96
|
|
96
97
|
|
97
|
-
|
98
98
|
# def __split_docs(self, documents):
|
99
99
|
# docs = self.text_splitter.split_documents(documents)
|
100
100
|
# return docs
|
@@ -225,8 +225,8 @@ class ChromaVectorStoreManager(BaseVectorStoreManager):
|
|
225
225
|
|
226
226
|
def initialize_embedding_dict(self, **kwargs):
|
227
227
|
column_embedding_configs = kwargs.get("column_embedding_configs")
|
228
|
-
vector_db_persist_directory = kwargs.get("vector_db_persist_directory")
|
229
|
-
vector_db_collection_name = kwargs.get("vector_db_collection_name")
|
228
|
+
# vector_db_persist_directory = kwargs.get("vector_db_persist_directory")
|
229
|
+
# vector_db_collection_name = kwargs.get("vector_db_collection_name")
|
230
230
|
embedding_dict = defaultdict(lambda: defaultdict(list))
|
231
231
|
if column_embedding_configs:
|
232
232
|
for item in column_embedding_configs:
|
@@ -234,8 +234,8 @@ class ChromaVectorStoreManager(BaseVectorStoreManager):
|
|
234
234
|
col_db_dir = item["vector_db_persist_directory"]
|
235
235
|
col_db_collection = item["vector_db_collection_name"]
|
236
236
|
self.__create_or_update_embeddings__(embedding_dict, col_db_dir, col_db_collection, col)
|
237
|
-
elif
|
238
|
-
self.__create_or_update_embeddings__(embedding_dict,
|
237
|
+
elif self.persist_directory:
|
238
|
+
self.__create_or_update_embeddings__(embedding_dict, self.persist_directory, self.collection_name)
|
239
239
|
else:
|
240
240
|
logging.warning("There is no configuration of Embeddings")
|
241
241
|
raise ValueError(
|
@@ -10,9 +10,11 @@ from langchain_core.embeddings import Embeddings
|
|
10
10
|
|
11
11
|
from pydantic import BaseModel, Field
|
12
12
|
from langchain_core.embeddings import Embeddings
|
13
|
+
from langchain_core.vectorstores import VectorStore
|
13
14
|
|
14
15
|
class BaseVectorStoreManager(BaseModel):
|
15
|
-
embeddings: Embeddings
|
16
|
+
embeddings: Optional[Embeddings] = None
|
17
|
+
vector_store: Optional[VectorStore]|None = None
|
16
18
|
|
17
19
|
class Config:
|
18
20
|
arbitrary_types_allowed = True
|
@@ -34,8 +36,7 @@ class BaseVectorStoreManager(BaseModel):
|
|
34
36
|
|
35
37
|
class FaissVectorStoreManager(BaseVectorStoreManager):
|
36
38
|
index: Any = None
|
37
|
-
vector_store:
|
38
|
-
|
39
|
+
vector_store: Optional[FAISS] | None = None
|
39
40
|
class Config:
|
40
41
|
arbitrary_types_allowed = True
|
41
42
|
# def generate_vector_store(self, docs):
|
@@ -73,7 +74,8 @@ class FaissVectorStoreManager(BaseVectorStoreManager):
|
|
73
74
|
- 'skip': skip the document
|
74
75
|
- 'error': raise ValueError
|
75
76
|
"""
|
76
|
-
|
77
|
+
if self.embeddings is None:
|
78
|
+
raise ValueError("Embeddings must be initialized before generating vector store.")
|
77
79
|
# Step 1: Get embedding dimension from a sample input
|
78
80
|
sample_embedding = self.embeddings.embed_query("hello world")
|
79
81
|
dimension = len(sample_embedding)
|
@@ -126,6 +128,7 @@ class FaissVectorStoreManager(BaseVectorStoreManager):
|
|
126
128
|
raise ValueError("No vector store to save.")
|
127
129
|
|
128
130
|
def load(self, path):
|
131
|
+
#self.embeddings
|
129
132
|
self.vector_store = FAISS.load_local(
|
130
133
|
path, self.embeddings, allow_dangerous_deserialization=True
|
131
134
|
)
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|