ddi-fw 0.0.263__tar.gz → 0.0.264__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (49)
  1. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/PKG-INFO +1 -1
  2. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/pyproject.toml +1 -1
  3. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw/datasets/core.py +1 -1
  4. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw/langchain/faiss_storage.py +45 -1
  5. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw/pipeline/multi_pipeline.py +3 -2
  6. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw.egg-info/PKG-INFO +1 -1
  7. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/README.md +0 -0
  8. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/setup.cfg +0 -0
  9. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw/datasets/__init__.py +0 -0
  10. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw/datasets/dataset_splitter.py +0 -0
  11. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw/datasets/db_utils.py +0 -0
  12. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw/datasets/setup_._py +0 -0
  13. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw/langchain/__init__.py +0 -0
  14. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw/langchain/chroma_storage.py +0 -0
  15. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw/langchain/embeddings.py +0 -0
  16. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw/langchain/sentence_splitter.py +0 -0
  17. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw/langchain/storage.py +0 -0
  18. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw/ml/__init__.py +0 -0
  19. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw/ml/evaluation_helper.py +0 -0
  20. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw/ml/ml_helper.py +0 -0
  21. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw/ml/model_wrapper.py +0 -0
  22. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw/ml/pytorch_wrapper.py +0 -0
  23. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw/ml/tensorflow_wrapper.py +0 -0
  24. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw/ml/tracking_service.py +0 -0
  25. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw/ner/__init__.py +0 -0
  26. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw/ner/mmlrestclient.py +0 -0
  27. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw/ner/ner.py +0 -0
  28. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw/pipeline/__init__.py +0 -0
  29. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw/pipeline/multi_modal_combination_strategy.py +0 -0
  30. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw/pipeline/multi_pipeline_org.py +0 -0
  31. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw/pipeline/ner_pipeline.py +0 -0
  32. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw/pipeline/pipeline.py +0 -0
  33. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw/utils/__init__.py +0 -0
  34. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw/utils/categorical_data_encoding_checker.py +0 -0
  35. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw/utils/enums.py +0 -0
  36. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw/utils/json_helper.py +0 -0
  37. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw/utils/kaggle.py +0 -0
  38. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw/utils/numpy_utils.py +0 -0
  39. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw/utils/package_helper.py +0 -0
  40. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw/utils/py7zr_helper.py +0 -0
  41. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw/utils/utils.py +0 -0
  42. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw/utils/zip_helper.py +0 -0
  43. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw/vectorization/__init__.py +0 -0
  44. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw/vectorization/feature_vector_generation.py +0 -0
  45. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw/vectorization/idf_helper.py +0 -0
  46. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw.egg-info/SOURCES.txt +0 -0
  47. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw.egg-info/dependency_links.txt +0 -0
  48. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw.egg-info/requires.txt +0 -0
  49. {ddi_fw-0.0.263 → ddi_fw-0.0.264}/src/ddi_fw.egg-info/top_level.txt +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: ddi_fw
3
- Version: 0.0.263
3
+ Version: 0.0.264
4
4
  Summary: Do not use :)
5
5
  Author-email: Kıvanç Bayraktar <bayraktarkivanc@gmail.com>
6
6
  Maintainer-email: Kıvanç Bayraktar <bayraktarkivanc@gmail.com>
@@ -6,7 +6,7 @@ build-backend = "setuptools.build_meta"
6
6
 
7
7
  [project]
8
8
  name = "ddi_fw"
9
- version = "0.0.263"
9
+ version = "0.0.264"
10
10
  description = "Do not use :)"
11
11
  readme = "README.md"
12
12
  authors = [
@@ -94,7 +94,7 @@ class BaseDataset(BaseModel, abc.ABC):
94
94
 
95
95
  train_data,test_data = np.stack(train_data.flatten().tolist()), np.stack(test_data.flatten().tolist())
96
96
  column = self.columns[0] if self.columns else 'default'
97
- items.append([f'default', np.nan_to_num(train_data),
97
+ items.append([f'{column}', np.nan_to_num(train_data),
98
98
  y_train_label, np.nan_to_num(test_data), y_test_label])
99
99
  else:
100
100
  for index, column in enumerate(self.columns):
@@ -460,4 +460,48 @@ def generate_embeddings(
460
460
  vector_store_manager.generate_vector_store(docs)
461
461
 
462
462
  # Optionally persist/save
463
- vector_store_manager.save(persist_dir)
463
+ vector_store_manager.save(persist_dir)
464
+
465
+
466
+ import os
467
+ import json
468
+
469
+ def generate_embeddings_for_json_object(
470
+ obj_json: dict,
471
+ vector_store_manager_type: Type[BaseVectorStoreManager],
472
+ persist_root: str = "./embeddings",
473
+ new_model_names: Optional[List] = None,
474
+ docs=None
475
+ ):
476
+ """
477
+ Generate embeddings for all collections in the given JSON object, storing them in a container folder.
478
+
479
+ Args:
480
+ obj_json: JSON object with 'id', 'name', and 'collections' keys.
481
+ vector_store_manager_type: The vector store manager class to use.
482
+ persist_root: Root directory for all embeddings.
483
+ new_model_names: Optional list of model names to filter collections.
484
+ docs: Documents to embed (if needed).
485
+ """
486
+ obj_id = obj_json.get("id")
487
+ obj_name = obj_json.get("name")
488
+ collections = obj_json.get("collections", [])
489
+
490
+ if not obj_id:
491
+ raise ValueError("JSON object must have an 'id' field.")
492
+ if not collections:
493
+ raise ValueError("No collections found in the given JSON object.")
494
+
495
+ # Create container directory for this object
496
+ container_dir = os.path.join(persist_root, str(obj_id))
497
+ os.makedirs(container_dir, exist_ok=True)
498
+
499
+ # Call your existing function
500
+ generate_embeddings(
501
+ docs=docs,
502
+ vector_store_manager_type=vector_store_manager_type,
503
+ config_file=None,
504
+ new_model_names=new_model_names,
505
+ collections=collections,
506
+ persist_directory=container_dir
507
+ )
@@ -149,8 +149,9 @@ class MultiPipeline():
149
149
 
150
150
  # Default model configuration
151
151
  default_model = config.get("default_model", {})
152
- default_model_type = get_import(default_model.get("model_type"))
153
- default_model_params = default_model.get("params", {})
152
+ if default_model:
153
+ default_model_type = get_import(default_model.get("model_type"))
154
+ default_model_params = default_model.get("params", {})
154
155
 
155
156
  multi_modal = config.get("multi_modal")
156
157
 
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: ddi_fw
3
- Version: 0.0.263
3
+ Version: 0.0.264
4
4
  Summary: Do not use :)
5
5
  Author-email: Kıvanç Bayraktar <bayraktarkivanc@gmail.com>
6
6
  Maintainer-email: Kıvanç Bayraktar <bayraktarkivanc@gmail.com>
File without changes
File without changes
File without changes