ddi-fw 0.0.194__tar.gz → 0.0.196__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (110) hide show
  1. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/PKG-INFO +1 -1
  2. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/pyproject.toml +1 -1
  3. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/core.py +4 -3
  4. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/ddi_mdl/base.py +22 -2
  5. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw.egg-info/PKG-INFO +1 -1
  6. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/README.md +0 -0
  7. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/setup.cfg +0 -0
  8. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/__init__.py +0 -0
  9. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/dataset_splitter.py +0 -0
  10. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/db_utils.py +0 -0
  11. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/ddi_mdl/data/event.db +0 -0
  12. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/ddi_mdl/debug.log +0 -0
  13. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/ddi_mdl/indexes/test_indexes.txt +0 -0
  14. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/ddi_mdl/indexes/train_fold_0.txt +0 -0
  15. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/ddi_mdl/indexes/train_fold_1.txt +0 -0
  16. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/ddi_mdl/indexes/train_fold_2.txt +0 -0
  17. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/ddi_mdl/indexes/train_fold_3.txt +0 -0
  18. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/ddi_mdl/indexes/train_fold_4.txt +0 -0
  19. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/ddi_mdl/indexes/train_indexes.txt +0 -0
  20. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/ddi_mdl/indexes/validation_fold_0.txt +0 -0
  21. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/ddi_mdl/indexes/validation_fold_1.txt +0 -0
  22. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/ddi_mdl/indexes/validation_fold_2.txt +0 -0
  23. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/ddi_mdl/indexes/validation_fold_3.txt +0 -0
  24. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/ddi_mdl/indexes/validation_fold_4.txt +0 -0
  25. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/ddi_mdl/indexes_old/test_indexes.txt +0 -0
  26. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/ddi_mdl/indexes_old/train_fold_0.txt +0 -0
  27. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/ddi_mdl/indexes_old/train_fold_1.txt +0 -0
  28. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/ddi_mdl/indexes_old/train_fold_2.txt +0 -0
  29. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/ddi_mdl/indexes_old/train_fold_3.txt +0 -0
  30. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/ddi_mdl/indexes_old/train_fold_4.txt +0 -0
  31. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/ddi_mdl/indexes_old/train_indexes.txt +0 -0
  32. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/ddi_mdl/indexes_old/validation_fold_0.txt +0 -0
  33. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/ddi_mdl/indexes_old/validation_fold_1.txt +0 -0
  34. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/ddi_mdl/indexes_old/validation_fold_2.txt +0 -0
  35. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/ddi_mdl/indexes_old/validation_fold_3.txt +0 -0
  36. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/ddi_mdl/indexes_old/validation_fold_4.txt +0 -0
  37. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/ddi_mdl/readme.md +0 -0
  38. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/ddi_mdl_text/base.py +0 -0
  39. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/ddi_mdl_text/data/event.db +0 -0
  40. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/ddi_mdl_text/indexes/test_indexes.txt +0 -0
  41. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/ddi_mdl_text/indexes/train_fold_0.txt +0 -0
  42. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/ddi_mdl_text/indexes/train_fold_1.txt +0 -0
  43. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/ddi_mdl_text/indexes/train_fold_2.txt +0 -0
  44. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/ddi_mdl_text/indexes/train_fold_3.txt +0 -0
  45. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/ddi_mdl_text/indexes/train_fold_4.txt +0 -0
  46. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/ddi_mdl_text/indexes/train_indexes.txt +0 -0
  47. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/ddi_mdl_text/indexes/validation_fold_0.txt +0 -0
  48. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/ddi_mdl_text/indexes/validation_fold_1.txt +0 -0
  49. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/ddi_mdl_text/indexes/validation_fold_2.txt +0 -0
  50. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/ddi_mdl_text/indexes/validation_fold_3.txt +0 -0
  51. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/ddi_mdl_text/indexes/validation_fold_4.txt +0 -0
  52. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/mdf_sa_ddi/__init__.py +0 -0
  53. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/mdf_sa_ddi/base.py +0 -0
  54. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/mdf_sa_ddi/df_extraction_cleanxiaoyu50.csv +0 -0
  55. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/mdf_sa_ddi/drug_information_del_noDDIxiaoyu50.csv +0 -0
  56. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/mdf_sa_ddi/indexes/test_indexes.txt +0 -0
  57. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/mdf_sa_ddi/indexes/train_fold_0.txt +0 -0
  58. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/mdf_sa_ddi/indexes/train_fold_1.txt +0 -0
  59. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/mdf_sa_ddi/indexes/train_fold_2.txt +0 -0
  60. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/mdf_sa_ddi/indexes/train_fold_3.txt +0 -0
  61. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/mdf_sa_ddi/indexes/train_fold_4.txt +0 -0
  62. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/mdf_sa_ddi/indexes/train_indexes.txt +0 -0
  63. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/mdf_sa_ddi/indexes/validation_fold_0.txt +0 -0
  64. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/mdf_sa_ddi/indexes/validation_fold_1.txt +0 -0
  65. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/mdf_sa_ddi/indexes/validation_fold_2.txt +0 -0
  66. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/mdf_sa_ddi/indexes/validation_fold_3.txt +0 -0
  67. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/mdf_sa_ddi/indexes/validation_fold_4.txt +0 -0
  68. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/mdf_sa_ddi/mdf-sa-ddi.zip +0 -0
  69. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/datasets/setup_._py +0 -0
  70. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/drugbank/__init__.py +0 -0
  71. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/drugbank/drugbank.xsd +0 -0
  72. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/drugbank/drugbank_parser.py +0 -0
  73. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/drugbank/drugbank_processor.py +0 -0
  74. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/drugbank/drugbank_processor_org.py +0 -0
  75. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/drugbank/event_extractor.py +0 -0
  76. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/langchain/__init__.py +0 -0
  77. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/langchain/embeddings.py +0 -0
  78. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/langchain/sentence_splitter.py +0 -0
  79. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/langchain/storage.py +0 -0
  80. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/ml/__init__.py +0 -0
  81. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/ml/evaluation_helper.py +0 -0
  82. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/ml/ml_helper.py +0 -0
  83. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/ml/model_wrapper.py +0 -0
  84. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/ml/pytorch_wrapper.py +0 -0
  85. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/ml/tensorflow_wrapper.py +0 -0
  86. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/ner/__init__.py +0 -0
  87. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/ner/mmlrestclient.py +0 -0
  88. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/ner/ner.py +0 -0
  89. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/pipeline/__init__.py +0 -0
  90. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/pipeline/multi_modal_combination_strategy.py +0 -0
  91. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/pipeline/multi_pipeline.py +0 -0
  92. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/pipeline/ner_pipeline.py +0 -0
  93. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/pipeline/pipeline.py +0 -0
  94. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/utils/__init__.py +0 -0
  95. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/utils/categorical_data_encoding_checker.py +0 -0
  96. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/utils/enums.py +0 -0
  97. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/utils/json_helper.py +0 -0
  98. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/utils/kaggle.py +0 -0
  99. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/utils/numpy_utils.py +0 -0
  100. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/utils/package_helper.py +0 -0
  101. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/utils/py7zr_helper.py +0 -0
  102. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/utils/utils.py +0 -0
  103. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/utils/zip_helper.py +0 -0
  104. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/vectorization/__init__.py +0 -0
  105. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/vectorization/feature_vector_generation.py +0 -0
  106. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw/vectorization/idf_helper.py +0 -0
  107. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw.egg-info/SOURCES.txt +0 -0
  108. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw.egg-info/dependency_links.txt +0 -0
  109. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw.egg-info/requires.txt +0 -0
  110. {ddi_fw-0.0.194 → ddi_fw-0.0.196}/src/ddi_fw.egg-info/top_level.txt +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: ddi_fw
3
- Version: 0.0.194
3
+ Version: 0.0.196
4
4
  Summary: Do not use :)
5
5
  Author-email: Kıvanç Bayraktar <bayraktarkivanc@gmail.com>
6
6
  Maintainer-email: Kıvanç Bayraktar <bayraktarkivanc@gmail.com>
@@ -6,7 +6,7 @@ build-backend = "setuptools.build_meta"
6
6
 
7
7
  [project]
8
8
  name = "ddi_fw"
9
- version = "0.0.194"
9
+ version = "0.0.196"
10
10
  description = "Do not use :)"
11
11
  readme = "README.md"
12
12
  authors = [
@@ -258,7 +258,7 @@ class BaseDataset(BaseModel):
258
258
  # return X_train, X_test, y_train, y_test, folds
259
259
 
260
260
 
261
- class TextDatasetMixin(BaseDataset):
261
+ class TextDatasetMixin(BaseModel):
262
262
  embedding_size: Optional[int] = None
263
263
  embedding_dict: Dict[str, Any] | None = Field(
264
264
  default_factory=dict, description="Dictionary for embeddings")
@@ -346,9 +346,10 @@ class TextDatasetMixin(BaseDataset):
346
346
  else:
347
347
  print(
348
348
  f"There is no configuration of Embeddings")
349
+ self.embedding_dict = embedding_dict
349
350
 
350
- else:
351
- embedding_dict = self.embedding_dict
351
+ # else:
352
+ # embedding_dict = self.embedding_dict
352
353
  # TODO make generic
353
354
  # embedding_size = list(embedding_dict['all_text'].values())[
354
355
  # 0][0].shape
@@ -1,6 +1,6 @@
1
1
  import pathlib
2
2
  from typing import List, Optional, Tuple
3
- from ddi_fw.datasets.core import TextDatasetMixin, generate_sim_matrices_new, generate_vectors
3
+ from ddi_fw.datasets.core import BaseDataset, TextDatasetMixin, generate_sim_matrices_new, generate_vectors
4
4
  from ddi_fw.datasets.db_utils import create_connection
5
5
  import numpy as np
6
6
  import pandas as pd
@@ -32,7 +32,7 @@ LIST_OF_NER_COLUMNS = ['tui', 'cui', 'entities']
32
32
  HERE = pathlib.Path(__file__).resolve().parent
33
33
 
34
34
 
35
- class DDIMDLDataset(TextDatasetMixin):
35
+ class DDIMDLDataset(BaseDataset,TextDatasetMixin):
36
36
  dataset_name: str = "DDIMDLDataset"
37
37
  index_path: str = Field(default_factory=lambda: str(
38
38
  pathlib.Path(__file__).resolve().parent.joinpath('indexes')))
@@ -62,6 +62,26 @@ class DDIMDLDataset(TextDatasetMixin):
62
62
  def __init__(self, **kwargs):
63
63
 
64
64
  super().__init__(**kwargs)
65
+
66
+ columns = kwargs['columns']
67
+ if columns:
68
+ chemical_property_columns = []
69
+ embedding_columns = []
70
+ ner_columns = []
71
+ for column in columns:
72
+ if column in LIST_OF_CHEMICAL_PROPERTY_COLUMNS:
73
+ chemical_property_columns.append(column)
74
+ elif column in LIST_OF_EMBEDDING_COLUMNS:
75
+ embedding_columns.append(column)
76
+ elif column in LIST_OF_NER_COLUMNS:
77
+ ner_columns.append(column)
78
+ else:
79
+ raise Exception(f"{column} is not related this dataset")
80
+
81
+ self.chemical_property_columns = chemical_property_columns
82
+ self.embedding_columns = embedding_columns
83
+ self.ner_columns = ner_columns
84
+
65
85
  self.class_column = 'event_category'
66
86
  _db_path = HERE.joinpath('data/event.db')
67
87
 
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: ddi_fw
3
- Version: 0.0.194
3
+ Version: 0.0.196
4
4
  Summary: Do not use :)
5
5
  Author-email: Kıvanç Bayraktar <bayraktarkivanc@gmail.com>
6
6
  Maintainer-email: Kıvanç Bayraktar <bayraktarkivanc@gmail.com>
File without changes
File without changes
File without changes