ddi-fw 0.0.230__tar.gz → 0.0.232__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (112)
  1. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/PKG-INFO +1 -1
  2. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/pyproject.toml +1 -1
  3. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/pipeline/ner_pipeline.py +43 -22
  4. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw.egg-info/PKG-INFO +1 -1
  5. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/README.md +0 -0
  6. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/setup.cfg +0 -0
  7. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/__init__.py +0 -0
  8. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/core.py +0 -0
  9. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/dataset_splitter.py +0 -0
  10. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/db_utils.py +0 -0
  11. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/ddi_mdl/base.py +0 -0
  12. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/ddi_mdl/data/event.db +0 -0
  13. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/ddi_mdl/debug.log +0 -0
  14. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/ddi_mdl/indexes/test_indexes.txt +0 -0
  15. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/ddi_mdl/indexes/train_fold_0.txt +0 -0
  16. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/ddi_mdl/indexes/train_fold_1.txt +0 -0
  17. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/ddi_mdl/indexes/train_fold_2.txt +0 -0
  18. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/ddi_mdl/indexes/train_fold_3.txt +0 -0
  19. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/ddi_mdl/indexes/train_fold_4.txt +0 -0
  20. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/ddi_mdl/indexes/train_indexes.txt +0 -0
  21. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/ddi_mdl/indexes/validation_fold_0.txt +0 -0
  22. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/ddi_mdl/indexes/validation_fold_1.txt +0 -0
  23. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/ddi_mdl/indexes/validation_fold_2.txt +0 -0
  24. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/ddi_mdl/indexes/validation_fold_3.txt +0 -0
  25. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/ddi_mdl/indexes/validation_fold_4.txt +0 -0
  26. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/ddi_mdl/indexes_old/test_indexes.txt +0 -0
  27. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/ddi_mdl/indexes_old/train_fold_0.txt +0 -0
  28. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/ddi_mdl/indexes_old/train_fold_1.txt +0 -0
  29. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/ddi_mdl/indexes_old/train_fold_2.txt +0 -0
  30. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/ddi_mdl/indexes_old/train_fold_3.txt +0 -0
  31. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/ddi_mdl/indexes_old/train_fold_4.txt +0 -0
  32. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/ddi_mdl/indexes_old/train_indexes.txt +0 -0
  33. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/ddi_mdl/indexes_old/validation_fold_0.txt +0 -0
  34. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/ddi_mdl/indexes_old/validation_fold_1.txt +0 -0
  35. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/ddi_mdl/indexes_old/validation_fold_2.txt +0 -0
  36. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/ddi_mdl/indexes_old/validation_fold_3.txt +0 -0
  37. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/ddi_mdl/indexes_old/validation_fold_4.txt +0 -0
  38. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/ddi_mdl/readme.md +0 -0
  39. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/ddi_mdl_text/base.py +0 -0
  40. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/ddi_mdl_text/data/event.db +0 -0
  41. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/ddi_mdl_text/indexes/test_indexes.txt +0 -0
  42. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/ddi_mdl_text/indexes/train_fold_0.txt +0 -0
  43. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/ddi_mdl_text/indexes/train_fold_1.txt +0 -0
  44. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/ddi_mdl_text/indexes/train_fold_2.txt +0 -0
  45. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/ddi_mdl_text/indexes/train_fold_3.txt +0 -0
  46. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/ddi_mdl_text/indexes/train_fold_4.txt +0 -0
  47. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/ddi_mdl_text/indexes/train_indexes.txt +0 -0
  48. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/ddi_mdl_text/indexes/validation_fold_0.txt +0 -0
  49. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/ddi_mdl_text/indexes/validation_fold_1.txt +0 -0
  50. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/ddi_mdl_text/indexes/validation_fold_2.txt +0 -0
  51. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/ddi_mdl_text/indexes/validation_fold_3.txt +0 -0
  52. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/ddi_mdl_text/indexes/validation_fold_4.txt +0 -0
  53. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/mdf_sa_ddi/__init__.py +0 -0
  54. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/mdf_sa_ddi/base.py +0 -0
  55. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/mdf_sa_ddi/df_extraction_cleanxiaoyu50.csv +0 -0
  56. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/mdf_sa_ddi/drug_information_del_noDDIxiaoyu50.csv +0 -0
  57. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/mdf_sa_ddi/indexes/test_indexes.txt +0 -0
  58. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/mdf_sa_ddi/indexes/train_fold_0.txt +0 -0
  59. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/mdf_sa_ddi/indexes/train_fold_1.txt +0 -0
  60. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/mdf_sa_ddi/indexes/train_fold_2.txt +0 -0
  61. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/mdf_sa_ddi/indexes/train_fold_3.txt +0 -0
  62. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/mdf_sa_ddi/indexes/train_fold_4.txt +0 -0
  63. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/mdf_sa_ddi/indexes/train_indexes.txt +0 -0
  64. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/mdf_sa_ddi/indexes/validation_fold_0.txt +0 -0
  65. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/mdf_sa_ddi/indexes/validation_fold_1.txt +0 -0
  66. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/mdf_sa_ddi/indexes/validation_fold_2.txt +0 -0
  67. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/mdf_sa_ddi/indexes/validation_fold_3.txt +0 -0
  68. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/mdf_sa_ddi/indexes/validation_fold_4.txt +0 -0
  69. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/mdf_sa_ddi/mdf-sa-ddi.zip +0 -0
  70. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/datasets/setup_._py +0 -0
  71. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/drugbank/__init__.py +0 -0
  72. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/drugbank/drugbank.xsd +0 -0
  73. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/drugbank/drugbank_parser.py +0 -0
  74. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/drugbank/drugbank_processor.py +0 -0
  75. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/drugbank/drugbank_processor_org.py +0 -0
  76. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/drugbank/event_extractor.py +0 -0
  77. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/langchain/__init__.py +0 -0
  78. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/langchain/embeddings.py +0 -0
  79. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/langchain/sentence_splitter.py +0 -0
  80. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/langchain/storage.py +0 -0
  81. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/ml/__init__.py +0 -0
  82. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/ml/evaluation_helper.py +0 -0
  83. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/ml/ml_helper.py +0 -0
  84. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/ml/model_wrapper.py +0 -0
  85. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/ml/pytorch_wrapper.py +0 -0
  86. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/ml/tensorflow_wrapper.py +0 -0
  87. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/ml/tracking_service.py +0 -0
  88. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/ner/__init__.py +0 -0
  89. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/ner/mmlrestclient.py +0 -0
  90. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/ner/ner.py +0 -0
  91. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/pipeline/__init__.py +0 -0
  92. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/pipeline/multi_modal_combination_strategy.py +0 -0
  93. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/pipeline/multi_pipeline.py +0 -0
  94. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/pipeline/multi_pipeline_org.py +0 -0
  95. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/pipeline/pipeline.py +0 -0
  96. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/utils/__init__.py +0 -0
  97. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/utils/categorical_data_encoding_checker.py +0 -0
  98. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/utils/enums.py +0 -0
  99. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/utils/json_helper.py +0 -0
  100. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/utils/kaggle.py +0 -0
  101. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/utils/numpy_utils.py +0 -0
  102. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/utils/package_helper.py +0 -0
  103. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/utils/py7zr_helper.py +0 -0
  104. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/utils/utils.py +0 -0
  105. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/utils/zip_helper.py +0 -0
  106. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/vectorization/__init__.py +0 -0
  107. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/vectorization/feature_vector_generation.py +0 -0
  108. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw/vectorization/idf_helper.py +0 -0
  109. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw.egg-info/SOURCES.txt +0 -0
  110. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw.egg-info/dependency_links.txt +0 -0
  111. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw.egg-info/requires.txt +0 -0
  112. {ddi_fw-0.0.230 → ddi_fw-0.0.232}/src/ddi_fw.egg-info/top_level.txt +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: ddi_fw
3
- Version: 0.0.230
3
+ Version: 0.0.232
4
4
  Summary: Do not use :)
5
5
  Author-email: Kıvanç Bayraktar <bayraktarkivanc@gmail.com>
6
6
  Maintainer-email: Kıvanç Bayraktar <bayraktarkivanc@gmail.com>
@@ -6,7 +6,7 @@ build-backend = "setuptools.build_meta"
6
6
 
7
7
  [project]
8
8
  name = "ddi_fw"
9
- version = "0.0.230"
9
+ version = "0.0.232"
10
10
  description = "Do not use :)"
11
11
  readme = "README.md"
12
12
  authors = [
@@ -6,6 +6,7 @@ import mlflow
6
6
  from pydantic import BaseModel, Field, model_validator, root_validator, validator
7
7
  from ddi_fw.datasets.core import BaseDataset
8
8
  from ddi_fw.datasets.dataset_splitter import DatasetSplitter
9
+ from ddi_fw.ml.tracking_service import TrackingService
9
10
  from ddi_fw.vectorization.idf_helper import IDF
10
11
  from ddi_fw.ner.ner import CTakesNER
11
12
  from ddi_fw.ml.ml_helper import MultiModalRunner
@@ -33,6 +34,7 @@ class NerParameterSearch(BaseModel):
33
34
  increase_step: float = 0.5
34
35
 
35
36
  # Internal fields (not part of the input)
37
+ _tracking_service: TrackingService | None = None
36
38
  datasets: Dict[str, Any] = Field(default_factory=dict, exclude=True)
37
39
  items: List[Any] = Field(default_factory=list, exclude=True)
38
40
  # ner_df: Optional[Any] = Field(default=None, exclude=True)
@@ -42,6 +44,10 @@ class NerParameterSearch(BaseModel):
42
44
 
43
45
  class Config:
44
46
  arbitrary_types_allowed = True
47
+
48
+ @property
49
+ def tracking_service(self) -> TrackingService | None:
50
+ return self._tracking_service
45
51
 
46
52
  # @root_validator(pre=True)
47
53
  @model_validator(mode="before")
@@ -61,6 +67,9 @@ class NerParameterSearch(BaseModel):
61
67
  return values
62
68
 
63
69
  def build(self):
70
+ self._tracking_service = TrackingService(self.experiment_name,
71
+ backend=self.tracking_library, tracking_params=self.tracking_params)
72
+
64
73
  """Build the datasets and items for the parameter search."""
65
74
  if not isinstance(self.dataset_type, type):
66
75
  raise TypeError("self.dataset_type must be a class, not an instance")
@@ -96,7 +105,9 @@ class NerParameterSearch(BaseModel):
96
105
  "entities": 0,
97
106
  }
98
107
  if self.dataset_additional_config:
99
- kwargs= self.dataset_additional_config
108
+ additional_config= self.dataset_additional_config
109
+ else:
110
+ additional_config={}
100
111
 
101
112
  for threshold in np.arange(min_threshold, max_threshold, self.increase_step):
102
113
  if column.startswith("tui"):
@@ -105,8 +116,8 @@ class NerParameterSearch(BaseModel):
105
116
  thresholds["cui"] = threshold
106
117
  if column.startswith("entities"):
107
118
  thresholds["entities"] = threshold
108
- kwargs['ner']['thresholds'] = thresholds
109
-
119
+ additional_config['ner']['thresholds'] = thresholds
120
+ kwargs = {'additional_config': additional_config}
110
121
  print(f"Loading dataset for column: {column} with threshold: {threshold}")
111
122
  # Create a new dataset instance for each threshold
112
123
  dataset = self.dataset_type(
@@ -122,10 +133,20 @@ class NerParameterSearch(BaseModel):
122
133
  self.datasets[item[0]] = dataset
123
134
 
124
135
  self.items.extend(group_items)
125
-
126
- self.y_test_label = self.items[0][4]
127
- self.train_idx_arr = dataset.train_idx_arr
128
- self.val_idx_arr = dataset.val_idx_arr
136
+
137
+ # Set if y_test_label is None
138
+ # This ensures that y_test_label is set only once for the first dataset
139
+ if self.y_test_label is None:
140
+ self.y_test_label = self.items[0][4]
141
+ self.train_idx_arr = dataset.train_idx_arr
142
+ self.val_idx_arr = dataset.val_idx_arr
143
+
144
+ # Clear memory for the current dataset and items
145
+ del dataset
146
+ del group_items
147
+ import gc
148
+ gc.collect()
149
+
129
150
 
130
151
  # def run(self):
131
152
  # """Run the parameter search."""
@@ -147,18 +168,18 @@ class NerParameterSearch(BaseModel):
147
168
  # result = multi_modal_runner.predict()
148
169
  # return result
149
170
 
150
- def run(self):
151
- if self._tracking_service is None:
152
- logging.warning("Tracking service is not initialized.")
153
- else:
154
- self._tracking_service.setup()
155
-
156
- y_test_label = self.items[0][4]
157
- multi_modal_runner = MultiModalRunner(
158
- library=self.library, multi_modal=self.multi_modal, default_model=self.default_model, tracking_service=self._tracking_service)
159
-
160
- multi_modal_runner.set_data(
161
- self.items, self.train_idx_arr, self.val_idx_arr, y_test_label)
162
- combinations = self.combinations if self.combinations is not None else []
163
- result = multi_modal_runner.predict(combinations)
164
- return result
171
+ def run(self):
172
+ if self._tracking_service is None:
173
+ logging.warning("Tracking service is not initialized.")
174
+ else:
175
+ self._tracking_service.setup()
176
+
177
+ y_test_label = self.items[0][4]
178
+ multi_modal_runner = MultiModalRunner(
179
+ library=self.library, multi_modal=self.multi_modal, default_model=self.default_model, tracking_service=self._tracking_service)
180
+
181
+ multi_modal_runner.set_data(
182
+ self.items, self.train_idx_arr, self.val_idx_arr, y_test_label)
183
+ # combinations = self.combinations if self.combinations is not None else []
184
+ result = multi_modal_runner.predict()
185
+ return result
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: ddi_fw
3
- Version: 0.0.230
3
+ Version: 0.0.232
4
4
  Summary: Do not use :)
5
5
  Author-email: Kıvanç Bayraktar <bayraktarkivanc@gmail.com>
6
6
  Maintainer-email: Kıvanç Bayraktar <bayraktarkivanc@gmail.com>
File without changes
File without changes
File without changes