ddi-fw 0.0.169__tar.gz → 0.0.171__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/PKG-INFO +2 -3
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/pyproject.toml +2 -4
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/core.py +35 -26
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw.egg-info/PKG-INFO +2 -3
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw.egg-info/requires.txt +1 -2
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/README.md +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/setup.cfg +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/__init__.py +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/dataset_splitter.py +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/db_utils.py +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl/base.py +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl/data/event.db +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl/debug.log +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl/indexes/test_indexes.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl/indexes/train_fold_0.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl/indexes/train_fold_1.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl/indexes/train_fold_2.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl/indexes/train_fold_3.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl/indexes/train_fold_4.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl/indexes/train_indexes.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl/indexes/validation_fold_0.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl/indexes/validation_fold_1.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl/indexes/validation_fold_2.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl/indexes/validation_fold_3.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl/indexes/validation_fold_4.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl/indexes_old/test_indexes.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl/indexes_old/train_fold_0.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl/indexes_old/train_fold_1.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl/indexes_old/train_fold_2.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl/indexes_old/train_fold_3.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl/indexes_old/train_fold_4.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl/indexes_old/train_indexes.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl/indexes_old/validation_fold_0.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl/indexes_old/validation_fold_1.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl/indexes_old/validation_fold_2.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl/indexes_old/validation_fold_3.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl/indexes_old/validation_fold_4.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl/readme.md +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl_text/base.py +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl_text/data/event.db +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl_text/indexes/test_indexes.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl_text/indexes/train_fold_0.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl_text/indexes/train_fold_1.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl_text/indexes/train_fold_2.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl_text/indexes/train_fold_3.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl_text/indexes/train_fold_4.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl_text/indexes/train_indexes.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl_text/indexes/validation_fold_0.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl_text/indexes/validation_fold_1.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl_text/indexes/validation_fold_2.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl_text/indexes/validation_fold_3.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl_text/indexes/validation_fold_4.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/mdf_sa_ddi/__init__.py +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/mdf_sa_ddi/base.py +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/mdf_sa_ddi/df_extraction_cleanxiaoyu50.csv +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/mdf_sa_ddi/drug_information_del_noDDIxiaoyu50.csv +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/mdf_sa_ddi/indexes/test_indexes.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/mdf_sa_ddi/indexes/train_fold_0.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/mdf_sa_ddi/indexes/train_fold_1.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/mdf_sa_ddi/indexes/train_fold_2.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/mdf_sa_ddi/indexes/train_fold_3.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/mdf_sa_ddi/indexes/train_fold_4.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/mdf_sa_ddi/indexes/train_indexes.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/mdf_sa_ddi/indexes/validation_fold_0.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/mdf_sa_ddi/indexes/validation_fold_1.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/mdf_sa_ddi/indexes/validation_fold_2.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/mdf_sa_ddi/indexes/validation_fold_3.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/mdf_sa_ddi/indexes/validation_fold_4.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/mdf_sa_ddi/mdf-sa-ddi.zip +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/setup_._py +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/drugbank/__init__.py +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/drugbank/drugbank.xsd +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/drugbank/drugbank_parser.py +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/drugbank/drugbank_processor.py +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/drugbank/drugbank_processor_org.py +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/drugbank/event_extractor.py +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/langchain/__init__.py +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/langchain/embeddings.py +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/langchain/sentence_splitter.py +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/langchain/storage.py +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/ml/__init__.py +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/ml/evaluation_helper.py +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/ml/ml_helper.py +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/ml/model_wrapper.py +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/ml/pytorch_wrapper.py +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/ml/tensorflow_wrapper.py +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/ner/__init__.py +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/ner/mmlrestclient.py +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/ner/ner.py +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/pipeline/__init__.py +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/pipeline/multi_modal_combination_strategy.py +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/pipeline/multi_pipeline.py +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/pipeline/ner_pipeline.py +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/pipeline/pipeline.py +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/utils/__init__.py +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/utils/enums.py +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/utils/json_helper.py +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/utils/kaggle.py +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/utils/package_helper.py +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/utils/py7zr_helper.py +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/utils/utils.py +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/utils/zip_helper.py +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/vectorization/__init__.py +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/vectorization/feature_vector_generation.py +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/vectorization/idf_helper.py +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw.egg-info/SOURCES.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw.egg-info/dependency_links.txt +0 -0
- {ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw.egg-info/top_level.txt +0 -0
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.4
|
2
2
|
Name: ddi_fw
|
3
|
-
Version: 0.0.169
|
3
|
+
Version: 0.0.171
|
4
4
|
Summary: Do not use :)
|
5
5
|
Author-email: Kıvanç Bayraktar <bayraktarkivanc@gmail.com>
|
6
6
|
Maintainer-email: Kıvanç Bayraktar <bayraktarkivanc@gmail.com>
|
@@ -40,9 +40,8 @@ Requires-Dist: nltk>=3.8.1; extra == "llm"
|
|
40
40
|
Provides-Extra: ml
|
41
41
|
Requires-Dist: scikit-learn<=1.6.1,>=1.5.2; extra == "ml"
|
42
42
|
Requires-Dist: tensorflow<=2.18.0,>=2.17.0; extra == "ml"
|
43
|
-
Requires-Dist: tf-keras>=2.17.0; extra == "ml"
|
43
|
+
Requires-Dist: tf-keras<=2.18.0,>=2.17.0; extra == "ml"
|
44
44
|
Requires-Dist: mlflow<=2.20.0,>=2.16.1; extra == "ml"
|
45
|
-
Requires-Dist: accelerate>=0.33.0; extra == "ml"
|
46
45
|
Requires-Dist: scipy<=1.14.1,>=1.13.1; extra == "ml"
|
47
46
|
Requires-Dist: plotly==5.24.1; extra == "ml"
|
48
47
|
Requires-Dist: matplotlib==3.10.0; extra == "ml"
|
@@ -6,7 +6,7 @@ build-backend = "setuptools.build_meta"
|
|
6
6
|
|
7
7
|
[project]
|
8
8
|
name = "ddi_fw"
|
9
|
-
version = "0.0.169"
|
9
|
+
version = "0.0.171"
|
10
10
|
description = "Do not use :)"
|
11
11
|
readme = "README.md"
|
12
12
|
authors = [
|
@@ -71,15 +71,13 @@ llm = [
|
|
71
71
|
ml = [
|
72
72
|
"scikit-learn>=1.5.2,<=1.6.1",
|
73
73
|
"tensorflow>=2.17.0,<=2.18.0",
|
74
|
-
"tf-keras>=2.17.0",
|
74
|
+
"tf-keras>=2.17.0,<=2.18.0",
|
75
75
|
"mlflow>=2.16.1,<=2.20.0",
|
76
|
-
"accelerate>=0.33.0",
|
77
76
|
"scipy>=1.13.1,<=1.14.1",
|
78
77
|
"plotly==5.24.1",
|
79
78
|
"matplotlib==3.10.0"
|
80
79
|
]
|
81
80
|
|
82
|
-
|
83
81
|
drugbank = [
|
84
82
|
"rdkit==2023.3.3",
|
85
83
|
"xmlschema==3.4.2"
|
@@ -1,4 +1,5 @@
|
|
1
1
|
import glob
|
2
|
+
import logging
|
2
3
|
from typing import Any, Dict, List, Optional, Type
|
3
4
|
import numpy as np
|
4
5
|
import pandas as pd
|
@@ -56,25 +57,20 @@ def generate_sim_matrices_new(df, generated_vectors, columns, key_column="id"):
|
|
56
57
|
|
57
58
|
class BaseDataset(BaseModel):
|
58
59
|
dataset_name: str
|
59
|
-
index_path: str
|
60
|
+
index_path: Optional[str] = None
|
60
61
|
dataset_splitter_type: Type[DatasetSplitter]
|
61
62
|
class_column: str = 'class'
|
62
63
|
dataframe: Optional[pd.DataFrame] = None
|
63
|
-
X_train:
|
64
|
-
X_test:
|
65
|
-
y_train:
|
66
|
-
y_test:
|
67
|
-
train_indexes:
|
68
|
-
test_indexes:
|
69
|
-
train_idx_arr:
|
70
|
-
val_idx_arr:
|
71
|
-
# train_idx_arr: Optional[List[np.ndarray]] = None
|
72
|
-
# val_idx_arr: Optional[List[np.ndarray]] = None
|
64
|
+
X_train: Optional[pd.DataFrame] = None
|
65
|
+
X_test: Optional[pd.DataFrame] = None
|
66
|
+
y_train: Optional[pd.Series] = None
|
67
|
+
y_test: Optional[pd.Series] = None
|
68
|
+
train_indexes: Optional[pd.Index] = None
|
69
|
+
test_indexes: Optional[pd.Index] = None
|
70
|
+
train_idx_arr: Optional[List[np.ndarray]] = None
|
71
|
+
val_idx_arr: Optional[List[np.ndarray]] = None
|
73
72
|
columns: List[str] = []
|
74
73
|
|
75
|
-
# feature_process: FeatureProcessor
|
76
|
-
# similarity_matrix_service: SimilarityMatrixService
|
77
|
-
|
78
74
|
class Config:
|
79
75
|
arbitrary_types_allowed = True
|
80
76
|
|
@@ -107,21 +103,28 @@ class BaseDataset(BaseModel):
|
|
107
103
|
pass
|
108
104
|
|
109
105
|
def load(self):
|
106
|
+
"""
|
107
|
+
Load the dataset. If X_train, y_train, X_test, and y_test are already provided,
|
108
|
+
skip deriving them. Otherwise, derive them from the dataframe and indices.
|
109
|
+
"""
|
110
|
+
if self.X_train is not None and self.y_train is not None and self.X_test is not None and self.y_test is not None:
|
111
|
+
# Data is already provided, no need to calculate
|
112
|
+
logging.info("X_train, y_train, X_test, and y_test are already provided. Skipping calculation.")
|
113
|
+
return self.X_train, self.X_test, self.y_train, self.y_test, self.train_indexes, self.test_indexes, self.train_idx_arr, self.val_idx_arr
|
114
|
+
|
110
115
|
if self.index_path is None:
|
111
|
-
raise Exception(
|
112
|
-
|
116
|
+
raise Exception("There is no index path. Please call split_dataset or provide indices.")
|
117
|
+
|
118
|
+
if self.dataframe is None:
|
119
|
+
raise Exception("There is no dataframe to derive data from.")
|
113
120
|
|
114
121
|
try:
|
115
|
-
train_idx_all, test_idx_all, train_idx_arr, val_idx_arr = self.__get_indexes__(
|
116
|
-
self.index_path)
|
122
|
+
train_idx_all, test_idx_all, train_idx_arr, val_idx_arr = self.__get_indexes__(self.index_path)
|
117
123
|
except FileNotFoundError as e:
|
118
124
|
raise FileNotFoundError(f"Index files not found: {e.filename}")
|
119
125
|
|
120
126
|
self.prep()
|
121
127
|
|
122
|
-
if self.dataframe is None:
|
123
|
-
raise Exception("There is no dataframe")
|
124
|
-
|
125
128
|
train = self.dataframe[self.dataframe.index.isin(train_idx_all)]
|
126
129
|
test = self.dataframe[self.dataframe.index.isin(test_idx_all)]
|
127
130
|
|
@@ -135,7 +138,7 @@ class BaseDataset(BaseModel):
|
|
135
138
|
self.train_idx_arr = train_idx_arr
|
136
139
|
self.val_idx_arr = val_idx_arr
|
137
140
|
|
138
|
-
return self.X_train, self.X_test, self.y_train, self.y_test, self.
|
141
|
+
return self.X_train, self.X_test, self.y_train, self.y_test, self.train_indexes, self.test_indexes, self.train_idx_arr, self.val_idx_arr
|
139
142
|
|
140
143
|
def __get_indexes__(self, path):
|
141
144
|
train_index_path = path+'/train_indexes.txt'
|
@@ -167,14 +170,20 @@ class BaseDataset(BaseModel):
|
|
167
170
|
f.write('\n'.join(str_indexes))
|
168
171
|
|
169
172
|
def split_dataset(self, save_indexes: bool = False):
|
170
|
-
|
173
|
+
"""
|
174
|
+
Split the dataset into training and testing sets. This method is only available
|
175
|
+
if a dataframe exists. If X_train, y_train, X_test, and y_test are already present,
|
176
|
+
raise an error.
|
177
|
+
"""
|
178
|
+
if self.X_train is not None or self.X_test is not None:
|
179
|
+
raise Exception("X_train and X_test are already present. Splitting is not allowed.")
|
180
|
+
|
181
|
+
if self.dataframe is None:
|
182
|
+
raise Exception("There is no dataframe to split.")
|
171
183
|
|
172
184
|
save_path = self.index_path
|
173
185
|
self.prep()
|
174
186
|
|
175
|
-
if self.dataframe is None:
|
176
|
-
raise Exception("There is no data")
|
177
|
-
|
178
187
|
X = self.dataframe.drop(self.class_column, axis=1)
|
179
188
|
y = self.dataframe[self.class_column]
|
180
189
|
|
@@ -1,6 +1,6 @@
|
|
1
1
|
Metadata-Version: 2.4
|
2
2
|
Name: ddi_fw
|
3
|
-
Version: 0.0.169
|
3
|
+
Version: 0.0.171
|
4
4
|
Summary: Do not use :)
|
5
5
|
Author-email: Kıvanç Bayraktar <bayraktarkivanc@gmail.com>
|
6
6
|
Maintainer-email: Kıvanç Bayraktar <bayraktarkivanc@gmail.com>
|
@@ -40,9 +40,8 @@ Requires-Dist: nltk>=3.8.1; extra == "llm"
|
|
40
40
|
Provides-Extra: ml
|
41
41
|
Requires-Dist: scikit-learn<=1.6.1,>=1.5.2; extra == "ml"
|
42
42
|
Requires-Dist: tensorflow<=2.18.0,>=2.17.0; extra == "ml"
|
43
|
-
Requires-Dist: tf-keras>=2.17.0; extra == "ml"
|
43
|
+
Requires-Dist: tf-keras<=2.18.0,>=2.17.0; extra == "ml"
|
44
44
|
Requires-Dist: mlflow<=2.20.0,>=2.16.1; extra == "ml"
|
45
|
-
Requires-Dist: accelerate>=0.33.0; extra == "ml"
|
46
45
|
Requires-Dist: scipy<=1.14.1,>=1.13.1; extra == "ml"
|
47
46
|
Requires-Dist: plotly==5.24.1; extra == "ml"
|
48
47
|
Requires-Dist: matplotlib==3.10.0; extra == "ml"
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl/indexes_old/validation_fold_0.txt
RENAMED
File without changes
|
{ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl/indexes_old/validation_fold_1.txt
RENAMED
File without changes
|
{ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl/indexes_old/validation_fold_2.txt
RENAMED
File without changes
|
{ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl/indexes_old/validation_fold_3.txt
RENAMED
File without changes
|
{ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl/indexes_old/validation_fold_4.txt
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl_text/indexes/train_indexes.txt
RENAMED
File without changes
|
{ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl_text/indexes/validation_fold_0.txt
RENAMED
File without changes
|
{ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl_text/indexes/validation_fold_1.txt
RENAMED
File without changes
|
{ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl_text/indexes/validation_fold_2.txt
RENAMED
File without changes
|
{ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl_text/indexes/validation_fold_3.txt
RENAMED
File without changes
|
{ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/ddi_mdl_text/indexes/validation_fold_4.txt
RENAMED
File without changes
|
File without changes
|
File without changes
|
{ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/mdf_sa_ddi/df_extraction_cleanxiaoyu50.csv
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
{ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/mdf_sa_ddi/indexes/validation_fold_0.txt
RENAMED
File without changes
|
{ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/mdf_sa_ddi/indexes/validation_fold_1.txt
RENAMED
File without changes
|
{ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/mdf_sa_ddi/indexes/validation_fold_2.txt
RENAMED
File without changes
|
{ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/mdf_sa_ddi/indexes/validation_fold_3.txt
RENAMED
File without changes
|
{ddi_fw-0.0.169 → ddi_fw-0.0.171}/src/ddi_fw/datasets/mdf_sa_ddi/indexes/validation_fold_4.txt
RENAMED
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|