ddi-fw: ddi_fw-0.0.242-py3-none-any.whl → ddi_fw-0.0.243-py3-none-any.whl

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in their respective public registries.
@@ -89,12 +89,12 @@ class ChromaVectorStoreManager(BaseVectorStoreManager):
89
89
  persist_directory: str = Field(default="./chroma_db")
90
90
  text_splitter: Optional[TextSplitter] = None
91
91
  batch_size: int = Field(default=1024)
92
+ vector_store: Optional[Chroma] | None = None
92
93
 
93
94
  class Config:
94
95
  arbitrary_types_allowed = True
95
96
 
96
97
 
97
-
98
98
  # def __split_docs(self, documents):
99
99
  # docs = self.text_splitter.split_documents(documents)
100
100
  # return docs
@@ -225,8 +225,8 @@ class ChromaVectorStoreManager(BaseVectorStoreManager):
225
225
 
226
226
  def initialize_embedding_dict(self, **kwargs):
227
227
  column_embedding_configs = kwargs.get("column_embedding_configs")
228
- vector_db_persist_directory = kwargs.get("vector_db_persist_directory")
229
- vector_db_collection_name = kwargs.get("vector_db_collection_name")
228
+ # vector_db_persist_directory = kwargs.get("vector_db_persist_directory")
229
+ # vector_db_collection_name = kwargs.get("vector_db_collection_name")
230
230
  embedding_dict = defaultdict(lambda: defaultdict(list))
231
231
  if column_embedding_configs:
232
232
  for item in column_embedding_configs:
@@ -234,8 +234,8 @@ class ChromaVectorStoreManager(BaseVectorStoreManager):
234
234
  col_db_dir = item["vector_db_persist_directory"]
235
235
  col_db_collection = item["vector_db_collection_name"]
236
236
  self.__create_or_update_embeddings__(embedding_dict, col_db_dir, col_db_collection, col)
237
- elif vector_db_persist_directory:
238
- self.__create_or_update_embeddings__(embedding_dict, vector_db_persist_directory, vector_db_collection_name)
237
+ elif self.persist_directory:
238
+ self.__create_or_update_embeddings__(embedding_dict, self.persist_directory, self.collection_name)
239
239
  else:
240
240
  logging.warning("There is no configuration of Embeddings")
241
241
  raise ValueError(
@@ -10,9 +10,11 @@ from langchain_core.embeddings import Embeddings
10
10
 
11
11
  from pydantic import BaseModel, Field
12
12
  from langchain_core.embeddings import Embeddings
13
+ from langchain_core.vectorstores import VectorStore
13
14
 
14
15
  class BaseVectorStoreManager(BaseModel):
15
- embeddings: Embeddings
16
+ embeddings: Optional[Embeddings] = None
17
+ vector_store: Optional[VectorStore]|None = None
16
18
 
17
19
  class Config:
18
20
  arbitrary_types_allowed = True
@@ -34,8 +36,7 @@ class BaseVectorStoreManager(BaseModel):
34
36
 
35
37
  class FaissVectorStoreManager(BaseVectorStoreManager):
36
38
  index: Any = None
37
- vector_store: Any = None
38
-
39
+ vector_store: Optional[FAISS] | None = None
39
40
  class Config:
40
41
  arbitrary_types_allowed = True
41
42
  # def generate_vector_store(self, docs):
@@ -73,7 +74,8 @@ class FaissVectorStoreManager(BaseVectorStoreManager):
73
74
  - 'skip': skip the document
74
75
  - 'error': raise ValueError
75
76
  """
76
-
77
+ if self.embeddings is None:
78
+ raise ValueError("Embeddings must be initialized before generating vector store.")
77
79
  # Step 1: Get embedding dimension from a sample input
78
80
  sample_embedding = self.embeddings.embed_query("hello world")
79
81
  dimension = len(sample_embedding)
@@ -126,6 +128,7 @@ class FaissVectorStoreManager(BaseVectorStoreManager):
126
128
  raise ValueError("No vector store to save.")
127
129
 
128
130
  def load(self, path):
131
+ #self.embeddings
129
132
  self.vector_store = FAISS.load_local(
130
133
  path, self.embeddings, allow_dangerous_deserialization=True
131
134
  )
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: ddi_fw
3
- Version: 0.0.242
3
+ Version: 0.0.243
4
4
  Summary: Do not use :)
5
5
  Author-email: Kıvanç Bayraktar <bayraktarkivanc@gmail.com>
6
6
  Maintainer-email: Kıvanç Bayraktar <bayraktarkivanc@gmail.com>
@@ -4,9 +4,9 @@ ddi_fw/datasets/dataset_splitter.py,sha256=8H8uZTAf8N9LUZeSeHOMawtJFJhnDgUUqFcnl
4
4
  ddi_fw/datasets/db_utils.py,sha256=xRj28U_uXTRPHcz3yIICczFUHXUPiAOZtAj5BM6kH44,6465
5
5
  ddi_fw/datasets/setup_._py,sha256=khYVJuW5PlOY_i_A16F3UbSZ6s6o_ljw33Byw3C-A8E,1047
6
6
  ddi_fw/langchain/__init__.py,sha256=xGNaTEZCUxyc_aT1zvzVWGRfsj-9VXqMvPKtV_G7ChA,399
7
- ddi_fw/langchain/chroma_storage.py,sha256=I8xoqlc2K4gJdOUn5b33mGGMPFKYG3UiptY2HeM34_c,15483
7
+ ddi_fw/langchain/chroma_storage.py,sha256=7LSUhdiPdQHZvKC_NapOeVbHtS71iE5ABZVTrI0YQ-A,15520
8
8
  ddi_fw/langchain/embeddings.py,sha256=eEWy4okcjdhUJHi4N48Wd8XauPXyeaQVLUdNWEvtEcY,6754
9
- ddi_fw/langchain/faiss_storage.py,sha256=H--yYOmHX7nr34THNojqP_qhGXd-kMkhzzWDbMMeoqo,8923
9
+ ddi_fw/langchain/faiss_storage.py,sha256=b-PStwJHeRl9ZYGC7ql5p5ak1Xk2-A6TTEL1UqmhxVI,9220
10
10
  ddi_fw/langchain/sentence_splitter.py,sha256=h_bYElx4Ud1mwDNJfL7mUwvgadwKX3GKlSzu5L2PXzg,280
11
11
  ddi_fw/langchain/storage.py,sha256=OizKyWm74Js7T6Q9kez-ulUoBGzIMFo4R46h4kjUyIM,11200
12
12
  ddi_fw/ml/__init__.py,sha256=FteYEawCkVQOaK-cTv2VrHZ2ZnfeFr31BD6VucO7_DQ,268
@@ -38,7 +38,7 @@ ddi_fw/utils/zip_helper.py,sha256=YRZA4tKZVBJwGQM0_WK6L-y5MoqkKoC-nXuuHK6CU9I,55
38
38
  ddi_fw/vectorization/__init__.py,sha256=LcJOpLVoLvHPDw9phGFlUQGeNcST_zKV-Oi1Pm5h_nE,110
39
39
  ddi_fw/vectorization/feature_vector_generation.py,sha256=QQQGhCti653BdU343Ag1bH_g1fzi2hlic7dgNy7otjE,7694
40
40
  ddi_fw/vectorization/idf_helper.py,sha256=_Gd1dtDSLaw8o-o0JugzSKMt9FpeXewTh4wGEaUd4VQ,2571
41
- ddi_fw-0.0.242.dist-info/METADATA,sha256=jq8Op7HG_u5PE0DjELixnPMKwEl6mUkNtPTyQ5uBWU8,2632
42
- ddi_fw-0.0.242.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
43
- ddi_fw-0.0.242.dist-info/top_level.txt,sha256=PMwHICFZTZtcpzQNPV4UQnfNXYIeLR_Ste-Wfc1h810,7
44
- ddi_fw-0.0.242.dist-info/RECORD,,
41
+ ddi_fw-0.0.243.dist-info/METADATA,sha256=li6Qy_fruHkWcTEbIx2-htRPwPOQOe6Ip4tGhFYJorg,2632
42
+ ddi_fw-0.0.243.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
43
+ ddi_fw-0.0.243.dist-info/top_level.txt,sha256=PMwHICFZTZtcpzQNPV4UQnfNXYIeLR_Ste-Wfc1h810,7
44
+ ddi_fw-0.0.243.dist-info/RECORD,,