ddi-fw 0.0.36__py3-none-any.whl → 0.0.38__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- ddi_fw/datasets/core.py +10 -3
- ddi_fw/datasets/ddi_mdl/base.py +2 -2
- {ddi_fw-0.0.36.dist-info → ddi_fw-0.0.38.dist-info}/METADATA +1 -1
- {ddi_fw-0.0.36.dist-info → ddi_fw-0.0.38.dist-info}/RECORD +6 -6
- {ddi_fw-0.0.36.dist-info → ddi_fw-0.0.38.dist-info}/WHEEL +1 -1
- {ddi_fw-0.0.36.dist-info → ddi_fw-0.0.38.dist-info}/top_level.txt +0 -0
ddi_fw/datasets/core.py
CHANGED
@@ -21,8 +21,9 @@ def stack(df_column):
|
|
21
21
|
|
22
22
|
|
23
23
|
class BaseDataset(ABC):
|
24
|
-
def __init__(self,embedding_dict, ner_df, chemical_property_columns, embedding_columns, ner_columns,
|
24
|
+
def __init__(self,embedding_size,embedding_dict, ner_df, chemical_property_columns, embedding_columns, ner_columns,
|
25
25
|
**kwargs):
|
26
|
+
self.embedding_size = embedding_size
|
26
27
|
self.embedding_dict = embedding_dict
|
27
28
|
self.ner_df = ner_df
|
28
29
|
self.__similarity_related_columns__ = []
|
@@ -364,8 +365,14 @@ class BaseDataset(ABC):
|
|
364
365
|
# (value[row['id1']], value[row['id2']]), dtype=np.float16)
|
365
366
|
|
366
367
|
def x_fnc(row, embedding_column):
|
367
|
-
|
368
|
-
|
368
|
+
if row['id1'] in self.embedding_dict[embedding_column]:
|
369
|
+
v1 = self.embedding_dict[embedding_column][row['id1']]
|
370
|
+
else:
|
371
|
+
v1 = np.zeros(self.embedding_size)
|
372
|
+
if row['id2'] in self.embedding_dict[embedding_column]:
|
373
|
+
v2 = self.embedding_dict[embedding_column][row['id2']]
|
374
|
+
else:
|
375
|
+
v2 = np.zeros(self.embedding_size)
|
369
376
|
return np.float16(np.hstack(
|
370
377
|
(v1, v2)))
|
371
378
|
|
ddi_fw/datasets/ddi_mdl/base.py
CHANGED
@@ -8,7 +8,7 @@ HERE = pathlib.Path(__file__).resolve().parent
|
|
8
8
|
|
9
9
|
|
10
10
|
class DDIMDLDataset(BaseDataset):
|
11
|
-
def __init__(self, embedding_dict, ner_df, chemical_property_columns=['enzyme',
|
11
|
+
def __init__(self, embedding_size, embedding_dict, ner_df, chemical_property_columns=['enzyme',
|
12
12
|
'target',
|
13
13
|
'pathway',
|
14
14
|
'smile'],
|
@@ -16,7 +16,7 @@ class DDIMDLDataset(BaseDataset):
|
|
16
16
|
ner_columns=[],
|
17
17
|
**kwargs):
|
18
18
|
|
19
|
-
super().__init__(embedding_dict,ner_df, chemical_property_columns, embedding_columns,
|
19
|
+
super().__init__(embedding_size, embedding_dict,ner_df, chemical_property_columns, embedding_columns,
|
20
20
|
ner_columns, **kwargs)
|
21
21
|
|
22
22
|
# kwargs = {'index_path': str(HERE.joinpath('indexes'))}
|
@@ -1,12 +1,12 @@
|
|
1
1
|
ddi_fw/datasets/__init__.py,sha256=gkzHCU9-BL_bOU-RvvwdOIp_DhKRfXKU5SvgfQLVTds,505
|
2
|
-
ddi_fw/datasets/core.py,sha256=
|
2
|
+
ddi_fw/datasets/core.py,sha256=ukuiUkSMxJi4AQCXJvuAKnIq1Of4KXNzMNkCkD88lY4,18440
|
3
3
|
ddi_fw/datasets/db_utils.py,sha256=OTsa3d-Iic7z3HmzSQK9UigedRbHDxYChJk0s4GfLnw,6191
|
4
4
|
ddi_fw/datasets/embedding_generator.py,sha256=Jqrlv88RCu0Lg812KsA12X0cSaZuxbckJ4LNRKNy_qw,2173
|
5
5
|
ddi_fw/datasets/embedding_generator_new.py,sha256=GExjmBysPWkmFxTZQPs2yEmDdFllZ-qC9lhZeRQAfbQ,4320
|
6
6
|
ddi_fw/datasets/feature_vector_generation.py,sha256=dxTHvp6uTkao9PdThs116Q3bWw_WTo9T8WigVL4G01s,3245
|
7
7
|
ddi_fw/datasets/idf_helper.py,sha256=_Gd1dtDSLaw8o-o0JugzSKMt9FpeXewTh4wGEaUd4VQ,2571
|
8
8
|
ddi_fw/datasets/setup_._py,sha256=khYVJuW5PlOY_i_A16F3UbSZ6s6o_ljw33Byw3C-A8E,1047
|
9
|
-
ddi_fw/datasets/ddi_mdl/base.py,sha256=
|
9
|
+
ddi_fw/datasets/ddi_mdl/base.py,sha256=iBA-ZbpPswj0K2is3ptCGo-ylz2CZvtTxEnZLh19kp4,2505
|
10
10
|
ddi_fw/datasets/ddi_mdl/readme.md,sha256=WC6lpmsEKvIISnZqENY7TWtzCQr98HPpE3oRsBl8pIw,625
|
11
11
|
ddi_fw/datasets/ddi_mdl/data/event.db,sha256=cmlSsf9MYjRzqR-mw3cUDnTnfT6FkpOG2yCl2mMwwew,30580736
|
12
12
|
ddi_fw/datasets/ddi_mdl/indexes/test_indexes.txt,sha256=XVlDqYATckrQwNSXqMSKVBqyoN_Hg8SK6CL-XMdLADY,102176
|
@@ -80,7 +80,7 @@ ddi_fw/utils/enums.py,sha256=19eJ3fX5eRK_xPvkYcukmug144jXPH4X9zQqtsFBj5A,671
|
|
80
80
|
ddi_fw/utils/py7zr_helper.py,sha256=rWhz3Trj6bk6B24hMuff1fKdRbC0yuvaHFlL8-eaAhg,4450
|
81
81
|
ddi_fw/utils/utils.py,sha256=Na6Y8mY-CFbQjrgd9xC8agcrjVvTj_7KIXqFm1H_3qU,3549
|
82
82
|
ddi_fw/utils/zip_helper.py,sha256=YRZA4tKZVBJwGQM0_WK6L-y5MoqkKoC-nXuuHK6CU9I,5567
|
83
|
-
ddi_fw-0.0.
|
84
|
-
ddi_fw-0.0.
|
85
|
-
ddi_fw-0.0.
|
86
|
-
ddi_fw-0.0.
|
83
|
+
ddi_fw-0.0.38.dist-info/METADATA,sha256=_foC4ftO-wBt1Ixpge3FwYV0awsIhDHuc3I72HYY4v4,1563
|
84
|
+
ddi_fw-0.0.38.dist-info/WHEEL,sha256=GV9aMThwP_4oNCtvEC2ec3qUYutgWeAzklro_0m4WJQ,91
|
85
|
+
ddi_fw-0.0.38.dist-info/top_level.txt,sha256=PMwHICFZTZtcpzQNPV4UQnfNXYIeLR_Ste-Wfc1h810,7
|
86
|
+
ddi_fw-0.0.38.dist-info/RECORD,,
|
File without changes
|