copulas 0.10.0.dev0__tar.gz → 0.10.1.dev0__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of copulas might be problematic. Click here for more details.
- copulas-0.10.1.dev0/PKG-INFO +223 -0
- {copulas-0.10.0.dev0 → copulas-0.10.1.dev0}/copulas/__init__.py +1 -1
- {copulas-0.10.0.dev0 → copulas-0.10.1.dev0}/copulas/multivariate/gaussian.py +3 -1
- {copulas-0.10.0.dev0 → copulas-0.10.1.dev0}/copulas/univariate/truncated_gaussian.py +8 -4
- copulas-0.10.1.dev0/copulas.egg-info/PKG-INFO +223 -0
- copulas-0.10.1.dev0/copulas.egg-info/SOURCES.txt +37 -0
- {copulas-0.10.0.dev0 → copulas-0.10.1.dev0}/copulas.egg-info/requires.txt +5 -11
- copulas-0.10.1.dev0/pyproject.toml +190 -0
- copulas-0.10.1.dev0/setup.cfg +23 -0
- copulas-0.10.1.dev0/tests/test_tasks.py +36 -0
- copulas-0.10.0.dev0/AUTHORS.rst +0 -4
- copulas-0.10.0.dev0/CONTRIBUTING.rst +0 -193
- copulas-0.10.0.dev0/HISTORY.md +0 -261
- copulas-0.10.0.dev0/MANIFEST.in +0 -12
- copulas-0.10.0.dev0/PKG-INFO +0 -423
- copulas-0.10.0.dev0/RELEASE.md +0 -239
- copulas-0.10.0.dev0/copulas.egg-info/PKG-INFO +0 -423
- copulas-0.10.0.dev0/copulas.egg-info/SOURCES.txt +0 -178
- copulas-0.10.0.dev0/copulas.egg-info/not-zip-safe +0 -1
- copulas-0.10.0.dev0/docs/Makefile +0 -20
- copulas-0.10.0.dev0/docs/authors.rst +0 -1
- copulas-0.10.0.dev0/docs/conf.py +0 -198
- copulas-0.10.0.dev0/docs/contributing.rst +0 -1
- copulas-0.10.0.dev0/docs/history.rst +0 -1
- copulas-0.10.0.dev0/docs/images/copulas-200.png +0 -0
- copulas-0.10.0.dev0/docs/images/copulas.png +0 -0
- copulas-0.10.0.dev0/docs/images/copulas_sample_dataset.png +0 -0
- copulas-0.10.0.dev0/docs/images/dai-logo-white.png +0 -0
- copulas-0.10.0.dev0/docs/images/dice_cdf.png +0 -0
- copulas-0.10.0.dev0/docs/images/pdf_cdf.png +0 -0
- copulas-0.10.0.dev0/docs/images/pit.png +0 -0
- copulas-0.10.0.dev0/docs/images/quickstart.png +0 -0
- copulas-0.10.0.dev0/docs/index.rst +0 -40
- copulas-0.10.0.dev0/docs/install.rst +0 -1
- copulas-0.10.0.dev0/docs/make.bat +0 -36
- copulas-0.10.0.dev0/setup.cfg +0 -66
- copulas-0.10.0.dev0/setup.py +0 -140
- copulas-0.10.0.dev0/tests/__init__.py +0 -139
- copulas-0.10.0.dev0/tests/end-to-end/README.md +0 -35
- copulas-0.10.0.dev0/tests/end-to-end/__init__.py +0 -1
- copulas-0.10.0.dev0/tests/end-to-end/bivariate/__init__.py +0 -1
- copulas-0.10.0.dev0/tests/end-to-end/bivariate/test_base.py +0 -44
- copulas-0.10.0.dev0/tests/end-to-end/multivariate/__init__.py +0 -1
- copulas-0.10.0.dev0/tests/end-to-end/multivariate/test_base.py +0 -33
- copulas-0.10.0.dev0/tests/end-to-end/multivariate/test_gaussian.py +0 -217
- copulas-0.10.0.dev0/tests/end-to-end/multivariate/test_vine.py +0 -72
- copulas-0.10.0.dev0/tests/end-to-end/test___init__.py +0 -62
- copulas-0.10.0.dev0/tests/end-to-end/test_visualization.py +0 -8
- copulas-0.10.0.dev0/tests/end-to-end/univariate/__init__.py +0 -1
- copulas-0.10.0.dev0/tests/end-to-end/univariate/test_beta.py +0 -162
- copulas-0.10.0.dev0/tests/end-to-end/univariate/test_gamma.py +0 -159
- copulas-0.10.0.dev0/tests/end-to-end/univariate/test_gaussian.py +0 -157
- copulas-0.10.0.dev0/tests/end-to-end/univariate/test_gaussian_kde.py +0 -175
- copulas-0.10.0.dev0/tests/end-to-end/univariate/test_student_t.py +0 -161
- copulas-0.10.0.dev0/tests/end-to-end/univariate/test_truncated_gaussian.py +0 -161
- copulas-0.10.0.dev0/tests/large_scale_evaluation.py +0 -278
- copulas-0.10.0.dev0/tests/numerical/README.md +0 -92
- copulas-0.10.0.dev0/tests/numerical/__init__.py +0 -1
- copulas-0.10.0.dev0/tests/numerical/cdf/__init__.py +0 -1
- copulas-0.10.0.dev0/tests/numerical/cdf/input/bivariate_cdf_input.csv +0 -13
- copulas-0.10.0.dev0/tests/numerical/cdf/output/clayton_cdf_test_case_1_output_Matlab.csv +0 -13
- copulas-0.10.0.dev0/tests/numerical/cdf/output/clayton_cdf_test_case_1_output_R.csv +0 -13
- copulas-0.10.0.dev0/tests/numerical/cdf/output/clayton_cdf_test_case_2_output_Matlab.csv +0 -13
- copulas-0.10.0.dev0/tests/numerical/cdf/output/clayton_cdf_test_case_2_output_R.csv +0 -13
- copulas-0.10.0.dev0/tests/numerical/cdf/output/clayton_cdf_test_case_3_output_Matlab.csv +0 -13
- copulas-0.10.0.dev0/tests/numerical/cdf/output/clayton_cdf_test_case_3_output_R.csv +0 -13
- copulas-0.10.0.dev0/tests/numerical/cdf/output/frank_cdf_test_case_1_output_Matlab.csv +0 -13
- copulas-0.10.0.dev0/tests/numerical/cdf/output/frank_cdf_test_case_1_output_R.csv +0 -13
- copulas-0.10.0.dev0/tests/numerical/cdf/output/frank_cdf_test_case_2_output_Matlab.csv +0 -13
- copulas-0.10.0.dev0/tests/numerical/cdf/output/frank_cdf_test_case_2_output_R.csv +0 -13
- copulas-0.10.0.dev0/tests/numerical/cdf/output/frank_cdf_test_case_3_output_Matlab.csv +0 -13
- copulas-0.10.0.dev0/tests/numerical/cdf/output/frank_cdf_test_case_3_output_R.csv +0 -13
- copulas-0.10.0.dev0/tests/numerical/cdf/output/gumbel_cdf_test_case_1_output_Matlab.csv +0 -13
- copulas-0.10.0.dev0/tests/numerical/cdf/output/gumbel_cdf_test_case_1_output_R.csv +0 -13
- copulas-0.10.0.dev0/tests/numerical/cdf/output/gumbel_cdf_test_case_2_output_Matlab.csv +0 -13
- copulas-0.10.0.dev0/tests/numerical/cdf/output/gumbel_cdf_test_case_2_output_R.csv +0 -13
- copulas-0.10.0.dev0/tests/numerical/cdf/scripts/bivariate_cdf_input.py +0 -26
- copulas-0.10.0.dev0/tests/numerical/cdf/scripts/bivariate_cdf_output.R +0 -58
- copulas-0.10.0.dev0/tests/numerical/cdf/scripts/bivariate_cdf_output.m +0 -42
- copulas-0.10.0.dev0/tests/numerical/cdf/test_cases/clayton/clayton_cdf_test_case_1.json +0 -31
- copulas-0.10.0.dev0/tests/numerical/cdf/test_cases/clayton/clayton_cdf_test_case_2.json +0 -28
- copulas-0.10.0.dev0/tests/numerical/cdf/test_cases/clayton/clayton_cdf_test_case_3.json +0 -28
- copulas-0.10.0.dev0/tests/numerical/cdf/test_cases/frank/frank_cdf_test_case_1.json +0 -28
- copulas-0.10.0.dev0/tests/numerical/cdf/test_cases/frank/frank_cdf_test_case_2.json +0 -28
- copulas-0.10.0.dev0/tests/numerical/cdf/test_cases/frank/frank_cdf_test_case_3.json +0 -28
- copulas-0.10.0.dev0/tests/numerical/cdf/test_cases/gumbel/gumbel_cdf_test_case_1.json +0 -28
- copulas-0.10.0.dev0/tests/numerical/cdf/test_cases/gumbel/gumbel_cdf_test_case_2.json +0 -28
- copulas-0.10.0.dev0/tests/numerical/cdf/test_cdf.py +0 -39
- copulas-0.10.0.dev0/tests/numerical/fit/__init__.py +0 -1
- copulas-0.10.0.dev0/tests/numerical/fit/input/bivariate_fit_test_case_1_input.csv +0 -7
- copulas-0.10.0.dev0/tests/numerical/fit/input/bivariate_fit_test_case_2_input.csv +0 -8
- copulas-0.10.0.dev0/tests/numerical/fit/scripts/bivariate_fit_output.R +0 -40
- copulas-0.10.0.dev0/tests/numerical/fit/scripts/bivariate_fit_output.m +0 -25
- copulas-0.10.0.dev0/tests/numerical/fit/test_cases/clayton/clayton_fit_test_case_1.json +0 -33
- copulas-0.10.0.dev0/tests/numerical/fit/test_cases/clayton/clayton_fit_test_case_2.json +0 -33
- copulas-0.10.0.dev0/tests/numerical/fit/test_cases/frank/frank_fit_test_case_1.json +0 -33
- copulas-0.10.0.dev0/tests/numerical/fit/test_cases/frank/frank_fit_test_case_2.json +0 -33
- copulas-0.10.0.dev0/tests/numerical/fit/test_cases/gumbel/gumbel_fit_test_case_1.json +0 -33
- copulas-0.10.0.dev0/tests/numerical/fit/test_cases/gumbel/gumbel_fit_test_case_2.json +0 -33
- copulas-0.10.0.dev0/tests/numerical/fit/test_fit.py +0 -37
- copulas-0.10.0.dev0/tests/numerical/pdf/__init__.py +0 -1
- copulas-0.10.0.dev0/tests/numerical/pdf/input/bivariate_pdf_input.csv +0 -13
- copulas-0.10.0.dev0/tests/numerical/pdf/output/clayton_pdf_test_case_1_output_Matlab.csv +0 -13
- copulas-0.10.0.dev0/tests/numerical/pdf/output/clayton_pdf_test_case_1_output_R.csv +0 -13
- copulas-0.10.0.dev0/tests/numerical/pdf/output/clayton_pdf_test_case_2_output_Matlab.csv +0 -13
- copulas-0.10.0.dev0/tests/numerical/pdf/output/clayton_pdf_test_case_2_output_R.csv +0 -13
- copulas-0.10.0.dev0/tests/numerical/pdf/output/clayton_pdf_test_case_3_output_Matlab.csv +0 -13
- copulas-0.10.0.dev0/tests/numerical/pdf/output/clayton_pdf_test_case_3_output_R.csv +0 -13
- copulas-0.10.0.dev0/tests/numerical/pdf/output/frank_pdf_test_case_1_output_Matlab.csv +0 -13
- copulas-0.10.0.dev0/tests/numerical/pdf/output/frank_pdf_test_case_1_output_R.csv +0 -13
- copulas-0.10.0.dev0/tests/numerical/pdf/output/frank_pdf_test_case_2_output_Matlab.csv +0 -13
- copulas-0.10.0.dev0/tests/numerical/pdf/output/frank_pdf_test_case_2_output_R.csv +0 -13
- copulas-0.10.0.dev0/tests/numerical/pdf/output/frank_pdf_test_case_3_output_Matlab.csv +0 -13
- copulas-0.10.0.dev0/tests/numerical/pdf/output/frank_pdf_test_case_3_output_R.csv +0 -13
- copulas-0.10.0.dev0/tests/numerical/pdf/output/gumbel_pdf_test_case_1_output_Matlab.csv +0 -13
- copulas-0.10.0.dev0/tests/numerical/pdf/output/gumbel_pdf_test_case_1_output_R.csv +0 -13
- copulas-0.10.0.dev0/tests/numerical/pdf/output/gumbel_pdf_test_case_2_output_Matlab.csv +0 -13
- copulas-0.10.0.dev0/tests/numerical/pdf/output/gumbel_pdf_test_case_2_output_R.csv +0 -13
- copulas-0.10.0.dev0/tests/numerical/pdf/scripts/bivariate_pdf_input.py +0 -25
- copulas-0.10.0.dev0/tests/numerical/pdf/scripts/bivariate_pdf_output.R +0 -58
- copulas-0.10.0.dev0/tests/numerical/pdf/scripts/bivariate_pdf_output.m +0 -45
- copulas-0.10.0.dev0/tests/numerical/pdf/test_cases/clayton/clayton_pdf_test_case_1.json +0 -28
- copulas-0.10.0.dev0/tests/numerical/pdf/test_cases/clayton/clayton_pdf_test_case_2.json +0 -28
- copulas-0.10.0.dev0/tests/numerical/pdf/test_cases/clayton/clayton_pdf_test_case_3.json +0 -28
- copulas-0.10.0.dev0/tests/numerical/pdf/test_cases/frank/frank_pdf_test_case_1.json +0 -28
- copulas-0.10.0.dev0/tests/numerical/pdf/test_cases/frank/frank_pdf_test_case_2.json +0 -28
- copulas-0.10.0.dev0/tests/numerical/pdf/test_cases/frank/frank_pdf_test_case_3.json +0 -28
- copulas-0.10.0.dev0/tests/numerical/pdf/test_cases/gumbel/gumbel_pdf_test_case_1.json +0 -28
- copulas-0.10.0.dev0/tests/numerical/pdf/test_cases/gumbel/gumbel_pdf_test_case_2.json +0 -28
- copulas-0.10.0.dev0/tests/numerical/pdf/test_pdf.py +0 -38
- copulas-0.10.0.dev0/tests/unit/__init__.py +0 -1
- copulas-0.10.0.dev0/tests/unit/bivariate/__init__.py +0 -1
- copulas-0.10.0.dev0/tests/unit/bivariate/test___init__.py +0 -23
- copulas-0.10.0.dev0/tests/unit/bivariate/test_base.py +0 -133
- copulas-0.10.0.dev0/tests/unit/bivariate/test_clayton.py +0 -107
- copulas-0.10.0.dev0/tests/unit/bivariate/test_frank.py +0 -115
- copulas-0.10.0.dev0/tests/unit/bivariate/test_gumbel.py +0 -114
- copulas-0.10.0.dev0/tests/unit/bivariate/test_independence.py +0 -62
- copulas-0.10.0.dev0/tests/unit/multivariate/__init__.py +0 -1
- copulas-0.10.0.dev0/tests/unit/multivariate/test_base.py +0 -17
- copulas-0.10.0.dev0/tests/unit/multivariate/test_gaussian.py +0 -517
- copulas-0.10.0.dev0/tests/unit/multivariate/test_tree.py +0 -753
- copulas-0.10.0.dev0/tests/unit/multivariate/test_vine.py +0 -176
- copulas-0.10.0.dev0/tests/unit/optimize/__init__.py +0 -1
- copulas-0.10.0.dev0/tests/unit/optimize/test___init__.py +0 -29
- copulas-0.10.0.dev0/tests/unit/test___init__.py +0 -575
- copulas-0.10.0.dev0/tests/unit/univariate/__init__.py +0 -1
- copulas-0.10.0.dev0/tests/unit/univariate/test_base.py +0 -245
- copulas-0.10.0.dev0/tests/unit/univariate/test_beta.py +0 -95
- copulas-0.10.0.dev0/tests/unit/univariate/test_gamma.py +0 -60
- copulas-0.10.0.dev0/tests/unit/univariate/test_gaussian.py +0 -55
- copulas-0.10.0.dev0/tests/unit/univariate/test_gaussian_kde.py +0 -206
- copulas-0.10.0.dev0/tests/unit/univariate/test_log_laplace.py +0 -60
- copulas-0.10.0.dev0/tests/unit/univariate/test_selection.py +0 -91
- copulas-0.10.0.dev0/tests/unit/univariate/test_student_t.py +0 -49
- copulas-0.10.0.dev0/tests/unit/univariate/test_truncated_gaussian.py +0 -63
- copulas-0.10.0.dev0/tests/unit/univariate/test_uniform.py +0 -57
- {copulas-0.10.0.dev0 → copulas-0.10.1.dev0}/LICENSE +0 -0
- {copulas-0.10.0.dev0 → copulas-0.10.1.dev0}/README.md +0 -0
- {copulas-0.10.0.dev0 → copulas-0.10.1.dev0}/copulas/bivariate/__init__.py +0 -0
- {copulas-0.10.0.dev0 → copulas-0.10.1.dev0}/copulas/bivariate/base.py +0 -0
- {copulas-0.10.0.dev0 → copulas-0.10.1.dev0}/copulas/bivariate/clayton.py +0 -0
- {copulas-0.10.0.dev0 → copulas-0.10.1.dev0}/copulas/bivariate/frank.py +0 -0
- {copulas-0.10.0.dev0 → copulas-0.10.1.dev0}/copulas/bivariate/gumbel.py +0 -0
- {copulas-0.10.0.dev0 → copulas-0.10.1.dev0}/copulas/bivariate/independence.py +0 -0
- {copulas-0.10.0.dev0 → copulas-0.10.1.dev0}/copulas/bivariate/utils.py +0 -0
- {copulas-0.10.0.dev0 → copulas-0.10.1.dev0}/copulas/datasets.py +0 -0
- {copulas-0.10.0.dev0 → copulas-0.10.1.dev0}/copulas/multivariate/__init__.py +0 -0
- {copulas-0.10.0.dev0 → copulas-0.10.1.dev0}/copulas/multivariate/base.py +0 -0
- {copulas-0.10.0.dev0 → copulas-0.10.1.dev0}/copulas/multivariate/tree.py +0 -0
- {copulas-0.10.0.dev0 → copulas-0.10.1.dev0}/copulas/multivariate/vine.py +0 -0
- {copulas-0.10.0.dev0 → copulas-0.10.1.dev0}/copulas/optimize/__init__.py +0 -0
- {copulas-0.10.0.dev0 → copulas-0.10.1.dev0}/copulas/univariate/__init__.py +0 -0
- {copulas-0.10.0.dev0 → copulas-0.10.1.dev0}/copulas/univariate/base.py +0 -0
- {copulas-0.10.0.dev0 → copulas-0.10.1.dev0}/copulas/univariate/beta.py +0 -0
- {copulas-0.10.0.dev0 → copulas-0.10.1.dev0}/copulas/univariate/gamma.py +0 -0
- {copulas-0.10.0.dev0 → copulas-0.10.1.dev0}/copulas/univariate/gaussian.py +0 -0
- {copulas-0.10.0.dev0 → copulas-0.10.1.dev0}/copulas/univariate/gaussian_kde.py +0 -0
- {copulas-0.10.0.dev0 → copulas-0.10.1.dev0}/copulas/univariate/log_laplace.py +0 -0
- {copulas-0.10.0.dev0 → copulas-0.10.1.dev0}/copulas/univariate/selection.py +0 -0
- {copulas-0.10.0.dev0 → copulas-0.10.1.dev0}/copulas/univariate/student_t.py +0 -0
- {copulas-0.10.0.dev0 → copulas-0.10.1.dev0}/copulas/univariate/uniform.py +0 -0
- {copulas-0.10.0.dev0 → copulas-0.10.1.dev0}/copulas/visualization.py +0 -0
- {copulas-0.10.0.dev0 → copulas-0.10.1.dev0}/copulas.egg-info/dependency_links.txt +0 -0
- {copulas-0.10.0.dev0 → copulas-0.10.1.dev0}/copulas.egg-info/top_level.txt +0 -0
|
@@ -0,0 +1,223 @@
|
|
|
1
|
+
Metadata-Version: 2.1
|
|
2
|
+
Name: copulas
|
|
3
|
+
Version: 0.10.1.dev0
|
|
4
|
+
Summary: Create tabular synthetic data using copulas-based modeling.
|
|
5
|
+
Author-email: "DataCebo, Inc." <info@sdv.dev>
|
|
6
|
+
License: BSL-1.1
|
|
7
|
+
Project-URL: Source Code, https://github.com/sdv-dev/Copulas/
|
|
8
|
+
Project-URL: Issue Tracker, https://github.com/sdv-dev/Copulas/issues
|
|
9
|
+
Project-URL: Changes, https://github.com/sdv-dev/Copulas/blob/main/HISTORY.md
|
|
10
|
+
Project-URL: Twitter, https://twitter.com/sdv_dev
|
|
11
|
+
Project-URL: Chat, https://bit.ly/sdv-slack-invite
|
|
12
|
+
Keywords: copulas
|
|
13
|
+
Classifier: Development Status :: 2 - Pre-Alpha
|
|
14
|
+
Classifier: Intended Audience :: Developers
|
|
15
|
+
Classifier: License :: Free for non-commercial use
|
|
16
|
+
Classifier: Natural Language :: English
|
|
17
|
+
Classifier: Programming Language :: Python :: 3
|
|
18
|
+
Classifier: Programming Language :: Python :: 3.8
|
|
19
|
+
Classifier: Programming Language :: Python :: 3.9
|
|
20
|
+
Classifier: Programming Language :: Python :: 3.10
|
|
21
|
+
Classifier: Programming Language :: Python :: 3.11
|
|
22
|
+
Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
|
|
23
|
+
Requires-Python: <3.12,>=3.8
|
|
24
|
+
Description-Content-Type: text/markdown
|
|
25
|
+
License-File: LICENSE
|
|
26
|
+
Requires-Dist: numpy<2,>=1.20.0; python_version < "3.10"
|
|
27
|
+
Requires-Dist: numpy<2,>=1.23.3; python_version >= "3.10"
|
|
28
|
+
Requires-Dist: pandas>=1.1.3; python_version < "3.10"
|
|
29
|
+
Requires-Dist: pandas>=1.3.4; python_version >= "3.10" and python_version < "3.11"
|
|
30
|
+
Requires-Dist: pandas>=1.5.0; python_version >= "3.11"
|
|
31
|
+
Requires-Dist: plotly<6,>=5.10.0
|
|
32
|
+
Requires-Dist: scipy<2,>=1.5.4; python_version < "3.10"
|
|
33
|
+
Requires-Dist: scipy<2,>=1.9.2; python_version >= "3.10"
|
|
34
|
+
Provides-Extra: tutorials
|
|
35
|
+
Requires-Dist: markupsafe<=2.0.1; extra == "tutorials"
|
|
36
|
+
Requires-Dist: scikit-learn<1.2,>=0.24; extra == "tutorials"
|
|
37
|
+
Requires-Dist: jupyter<2,>=1.0.0; extra == "tutorials"
|
|
38
|
+
Provides-Extra: test
|
|
39
|
+
Requires-Dist: copulas[tutorials]; extra == "test"
|
|
40
|
+
Requires-Dist: pytest<7,>=6.2.5; extra == "test"
|
|
41
|
+
Requires-Dist: pytest-cov<3,>=2.6.0; extra == "test"
|
|
42
|
+
Requires-Dist: pytest-rerunfailures<10,>=9.0.0; extra == "test"
|
|
43
|
+
Requires-Dist: rundoc<0.5,>=0.4.3; extra == "test"
|
|
44
|
+
Requires-Dist: tomli<3,>=2.0.0; extra == "test"
|
|
45
|
+
Provides-Extra: dev
|
|
46
|
+
Requires-Dist: copulas[test,tutorials]; extra == "dev"
|
|
47
|
+
Requires-Dist: pip>=9.0.1; extra == "dev"
|
|
48
|
+
Requires-Dist: build<2,>=1.0.0; extra == "dev"
|
|
49
|
+
Requires-Dist: bump-my-version<1,>=0.18.3; extra == "dev"
|
|
50
|
+
Requires-Dist: watchdog<0.11,>=0.8.3; extra == "dev"
|
|
51
|
+
Requires-Dist: m2r<0.3,>=0.2.0; extra == "dev"
|
|
52
|
+
Requires-Dist: nbsphinx<0.7,>=0.5.0; extra == "dev"
|
|
53
|
+
Requires-Dist: Sphinx<3,>=1.7.1; extra == "dev"
|
|
54
|
+
Requires-Dist: sphinx_rtd_theme<0.5,>=0.2.4; extra == "dev"
|
|
55
|
+
Requires-Dist: Jinja2<3,>=2; extra == "dev"
|
|
56
|
+
Requires-Dist: flake8<4,>=3.7.7; extra == "dev"
|
|
57
|
+
Requires-Dist: isort<5,>=4.3.4; extra == "dev"
|
|
58
|
+
Requires-Dist: flake8-debugger<4.1,>=4.0.0; extra == "dev"
|
|
59
|
+
Requires-Dist: flake8-mock<0.4,>=0.3; extra == "dev"
|
|
60
|
+
Requires-Dist: flake8-mutable<1.3,>=1.2.0; extra == "dev"
|
|
61
|
+
Requires-Dist: flake8-fixme<1.2,>=1.1.1; extra == "dev"
|
|
62
|
+
Requires-Dist: pep8-naming<0.13,>=0.12.1; extra == "dev"
|
|
63
|
+
Requires-Dist: dlint<0.12,>=0.11.0; extra == "dev"
|
|
64
|
+
Requires-Dist: flake8-docstrings<2,>=1.5.0; extra == "dev"
|
|
65
|
+
Requires-Dist: pydocstyle<6.2,>=6.1.1; extra == "dev"
|
|
66
|
+
Requires-Dist: flake8-pytest-style<2,>=1.5.0; extra == "dev"
|
|
67
|
+
Requires-Dist: flake8-comprehensions<3.7,>=3.6.1; extra == "dev"
|
|
68
|
+
Requires-Dist: flake8-print<4.1,>=4.0.0; extra == "dev"
|
|
69
|
+
Requires-Dist: flake8-expression-complexity<0.1,>=0.0.9; extra == "dev"
|
|
70
|
+
Requires-Dist: flake8-multiline-containers<0.1,>=0.0.18; extra == "dev"
|
|
71
|
+
Requires-Dist: pandas-vet<0.3,>=0.2.2; extra == "dev"
|
|
72
|
+
Requires-Dist: flake8-builtins<1.6,>=1.5.3; extra == "dev"
|
|
73
|
+
Requires-Dist: flake8-eradicate<1.2,>=1.1.0; extra == "dev"
|
|
74
|
+
Requires-Dist: flake8-quotes<4,>=3.3.0; extra == "dev"
|
|
75
|
+
Requires-Dist: flake8-variables-names<0.1,>=0.0.4; extra == "dev"
|
|
76
|
+
Requires-Dist: flake8-sfs<0.1,>=0.0.3; extra == "dev"
|
|
77
|
+
Requires-Dist: flake8-absolute-import<2,>=1.0; extra == "dev"
|
|
78
|
+
Requires-Dist: autoflake<2,>=1.1; extra == "dev"
|
|
79
|
+
Requires-Dist: autopep8<1.6,>=1.4.3; extra == "dev"
|
|
80
|
+
Requires-Dist: twine<4,>=1.10.0; extra == "dev"
|
|
81
|
+
Requires-Dist: wheel>=0.30.0; extra == "dev"
|
|
82
|
+
Requires-Dist: coverage<6,>=4.5.1; extra == "dev"
|
|
83
|
+
Requires-Dist: tox<4,>=2.9.1; extra == "dev"
|
|
84
|
+
Requires-Dist: invoke; extra == "dev"
|
|
85
|
+
Requires-Dist: doc8<0.9,>=0.8.0; extra == "dev"
|
|
86
|
+
Requires-Dist: urllib3<1.26,>=1.20; extra == "dev"
|
|
87
|
+
Requires-Dist: tabulate<0.9,>=0.8.3; extra == "dev"
|
|
88
|
+
Requires-Dist: boto3<1.10,>=1.7.47; extra == "dev"
|
|
89
|
+
Requires-Dist: docutils<0.15,>=0.10; extra == "dev"
|
|
90
|
+
|
|
91
|
+
<p style="text-align:center">
|
|
92
|
+
<i>This repository is part of <a href="https://sdv.dev">The Synthetic Data Vault Project</a>, a project from <a href="https://datacebo.com">DataCebo</a>.</i>
|
|
93
|
+
</p>
|
|
94
|
+
|
|
95
|
+
[](https://pypi.org/search/?c=Development+Status+%3A%3A+2+-+Pre-Alpha)
|
|
96
|
+
[](https://pypi.python.org/pypi/copulas)
|
|
97
|
+
[](https://pepy.tech/project/copulas)
|
|
98
|
+
[](https://github.com/sdv-dev/Copulas/actions/workflows/unit.yml)
|
|
99
|
+
[](https://codecov.io/gh/sdv-dev/Copulas)
|
|
100
|
+
[](https://bit.ly/sdv-slack-invite)
|
|
101
|
+
|
|
102
|
+
<br/>
|
|
103
|
+
<p align="center" style="text-align:center">
|
|
104
|
+
<a href="https://github.com/sdv-dev/Copulas">
|
|
105
|
+
<img width=40% src="https://github.com/sdv-dev/SDV/blob/stable/docs/images/Copulas-DataCebo.png?raw=true"></img>
|
|
106
|
+
</a>
|
|
107
|
+
</p>
|
|
108
|
+
|
|
109
|
+
# Overview
|
|
110
|
+
|
|
111
|
+
**Copulas** is a Python library for modeling multivariate distributions and sampling from them
|
|
112
|
+
using copula functions.
|
|
113
|
+
Given a table of numerical data, use Copulas to learn the distribution and
|
|
114
|
+
generate new synthetic data following the same statistical properties.
|
|
115
|
+
|
|
116
|
+
**Key Features:**
|
|
117
|
+
|
|
118
|
+
* **Model multivariate data.** Choose from a variety of univariate
|
|
119
|
+
distributions and copulas – including Archimedean Copulas, Gaussian Copulas and Vine Copulas.
|
|
120
|
+
|
|
121
|
+
* **Compare real and synthetic data visually** after building your model. Visualizations
|
|
122
|
+
are available as 1D histograms, 2D scatterplots and 3D scatterplots.
|
|
123
|
+
|
|
124
|
+
* **Access & manipulate learned parameters.** With complete access to the internals
|
|
125
|
+
of the model, set or tune parameters to your choosing.
|
|
126
|
+
|
|
127
|
+
# Install
|
|
128
|
+
|
|
129
|
+
Install the Copulas library using pip or conda.
|
|
130
|
+
|
|
131
|
+
```bash
|
|
132
|
+
pip install copulas
|
|
133
|
+
```
|
|
134
|
+
|
|
135
|
+
```bash
|
|
136
|
+
conda install -c conda-forge copulas
|
|
137
|
+
```
|
|
138
|
+
|
|
139
|
+
# Usage
|
|
140
|
+
|
|
141
|
+
Get started using a demo dataset. This dataset contains 3 numerical columns.
|
|
142
|
+
|
|
143
|
+
```python
|
|
144
|
+
from copulas.datasets import sample_trivariate_xyz
|
|
145
|
+
|
|
146
|
+
real_data = sample_trivariate_xyz()
|
|
147
|
+
real_data.head()
|
|
148
|
+
```
|
|
149
|
+
|
|
150
|
+
<img src="docs/images/copulas_sample_dataset.png" width="300">
|
|
151
|
+
|
|
152
|
+
Model the data using a copula and use it to create synthetic data.
|
|
153
|
+
The Copulas library offers many options including Gaussian Copula,
|
|
154
|
+
Vine Copulas and Archimedean Copulas.
|
|
155
|
+
|
|
156
|
+
```python
|
|
157
|
+
from copulas.multivariate import GaussianMultivariate
|
|
158
|
+
|
|
159
|
+
copula = GaussianMultivariate()
|
|
160
|
+
copula.fit(real_data)
|
|
161
|
+
|
|
162
|
+
synthetic_data = copula.sample(len(real_data))
|
|
163
|
+
```
|
|
164
|
+
|
|
165
|
+
Visualize the real and synthetic data side-by-side. Let's do this in 3D to see our full dataset.
|
|
166
|
+
|
|
167
|
+
```python
|
|
168
|
+
from copulas.visualization import compare_3d
|
|
169
|
+
|
|
170
|
+
compare_3d(real_data, synthetic_data)
|
|
171
|
+
```
|
|
172
|
+
|
|
173
|
+

|
|
174
|
+
|
|
175
|
+
# Tutorials
|
|
176
|
+
Click below to run the code yourself on a Colab Notebook and discover new features.
|
|
177
|
+
|
|
178
|
+
[](https://bit.ly/copulas-demo)
|
|
179
|
+
|
|
180
|
+
# Community & Support
|
|
181
|
+
|
|
182
|
+
Learn more about the Copulas library from our [documentation](https://sdv.dev/Copulas/) site.
|
|
183
|
+
|
|
184
|
+
**Questions or issues?** Join our [Slack channel](https://bit.ly/sdv-slack-invite)
|
|
185
|
+
to discuss more about Copulas and synthetic data.
|
|
186
|
+
If you find a bug or have a feature request, you can also
|
|
187
|
+
[open an issue](https://github.com/sdv-dev/Copulas/issues/new/choose) on our GitHub.
|
|
188
|
+
|
|
189
|
+
**Interested in contributing to Copulas?** Read our
|
|
190
|
+
[Contribution Guide](https://sdv.dev/Copulas/contributing.html) to get started.
|
|
191
|
+
|
|
192
|
+
# Credits
|
|
193
|
+
|
|
194
|
+
The Copulas open source project first started at the Data to AI Lab at MIT in 2018.
|
|
195
|
+
Thank you to our team of contributors who have built and maintained the library over the years!
|
|
196
|
+
|
|
197
|
+
[View Contributors](https://github.com/sdv-dev/Copulas/graphs/contributors)
|
|
198
|
+
|
|
199
|
+
---
|
|
200
|
+
|
|
201
|
+
|
|
202
|
+
<div align="center">
|
|
203
|
+
<a href="https://datacebo.com"><img align="center" width=40% src="https://github.com/sdv-dev/SDV/blob/stable/docs/images/DataCebo.png"></img></a>
|
|
204
|
+
</div>
|
|
205
|
+
<br/>
|
|
206
|
+
<br/>
|
|
207
|
+
|
|
208
|
+
[The Synthetic Data Vault Project](https://sdv.dev) was first created at MIT's [Data to AI Lab](
|
|
209
|
+
https://dai.lids.mit.edu/) in 2016. After 4 years of research and traction with enterprise, we
|
|
210
|
+
created [DataCebo](https://datacebo.com) in 2020 with the goal of growing the project.
|
|
211
|
+
Today, DataCebo is the proud developer of SDV, the largest ecosystem for
|
|
212
|
+
synthetic data generation & evaluation. It is home to multiple libraries that support synthetic
|
|
213
|
+
data, including:
|
|
214
|
+
|
|
215
|
+
* 🔄 Data discovery & transformation. Reverse the transforms to reproduce realistic data.
|
|
216
|
+
* 🧠 Multiple machine learning models -- ranging from Copulas to Deep Learning -- to create tabular,
|
|
217
|
+
multi table and time series data.
|
|
218
|
+
* 📊 Measuring quality and privacy of synthetic data, and comparing different synthetic data
|
|
219
|
+
generation models.
|
|
220
|
+
|
|
221
|
+
[Get started using the SDV package](https://sdv.dev/SDV/getting_started/install.html) -- a fully
|
|
222
|
+
integrated solution and your one-stop shop for synthetic data. Or, use the standalone libraries
|
|
223
|
+
for specific needs.
|
|
@@ -148,7 +148,9 @@ class GaussianMultivariate(Multivariate):
|
|
|
148
148
|
"""
|
|
149
149
|
self.check_fit()
|
|
150
150
|
transformed = self._transform_to_normal(X)
|
|
151
|
-
|
|
151
|
+
|
|
152
|
+
return stats.multivariate_normal.pdf(
|
|
153
|
+
transformed, cov=self.correlation, allow_singular=True)
|
|
152
154
|
|
|
153
155
|
def cumulative_distribution(self, X):
|
|
154
156
|
"""Compute the cumulative distribution value for each point in X.
|
|
@@ -1,5 +1,7 @@
|
|
|
1
1
|
"""TruncatedGaussian module."""
|
|
2
2
|
|
|
3
|
+
import warnings
|
|
4
|
+
|
|
3
5
|
import numpy as np
|
|
4
6
|
from scipy.optimize import fmin_slsqp
|
|
5
7
|
from scipy.stats import truncnorm
|
|
@@ -47,10 +49,12 @@ class TruncatedGaussian(ScipyModel):
|
|
|
47
49
|
return truncnorm.nnlf((a, b, loc, scale), X)
|
|
48
50
|
|
|
49
51
|
initial_params = X.mean(), X.std()
|
|
50
|
-
|
|
51
|
-
(
|
|
52
|
-
(
|
|
53
|
-
|
|
52
|
+
with warnings.catch_warnings():
|
|
53
|
+
warnings.simplefilter('ignore', category=RuntimeWarning)
|
|
54
|
+
optimal = fmin_slsqp(nnlf, initial_params, iprint=False, bounds=[
|
|
55
|
+
(self.min, self.max),
|
|
56
|
+
(0.0, (self.max - self.min)**2)
|
|
57
|
+
])
|
|
54
58
|
|
|
55
59
|
loc, scale = optimal
|
|
56
60
|
a = (self.min - loc) / scale
|
|
@@ -0,0 +1,223 @@
|
|
|
1
|
+
Metadata-Version: 2.1
|
|
2
|
+
Name: copulas
|
|
3
|
+
Version: 0.10.1.dev0
|
|
4
|
+
Summary: Create tabular synthetic data using copulas-based modeling.
|
|
5
|
+
Author-email: "DataCebo, Inc." <info@sdv.dev>
|
|
6
|
+
License: BSL-1.1
|
|
7
|
+
Project-URL: Source Code, https://github.com/sdv-dev/Copulas/
|
|
8
|
+
Project-URL: Issue Tracker, https://github.com/sdv-dev/Copulas/issues
|
|
9
|
+
Project-URL: Changes, https://github.com/sdv-dev/Copulas/blob/main/HISTORY.md
|
|
10
|
+
Project-URL: Twitter, https://twitter.com/sdv_dev
|
|
11
|
+
Project-URL: Chat, https://bit.ly/sdv-slack-invite
|
|
12
|
+
Keywords: copulas
|
|
13
|
+
Classifier: Development Status :: 2 - Pre-Alpha
|
|
14
|
+
Classifier: Intended Audience :: Developers
|
|
15
|
+
Classifier: License :: Free for non-commercial use
|
|
16
|
+
Classifier: Natural Language :: English
|
|
17
|
+
Classifier: Programming Language :: Python :: 3
|
|
18
|
+
Classifier: Programming Language :: Python :: 3.8
|
|
19
|
+
Classifier: Programming Language :: Python :: 3.9
|
|
20
|
+
Classifier: Programming Language :: Python :: 3.10
|
|
21
|
+
Classifier: Programming Language :: Python :: 3.11
|
|
22
|
+
Classifier: Topic :: Scientific/Engineering :: Artificial Intelligence
|
|
23
|
+
Requires-Python: <3.12,>=3.8
|
|
24
|
+
Description-Content-Type: text/markdown
|
|
25
|
+
License-File: LICENSE
|
|
26
|
+
Requires-Dist: numpy<2,>=1.20.0; python_version < "3.10"
|
|
27
|
+
Requires-Dist: numpy<2,>=1.23.3; python_version >= "3.10"
|
|
28
|
+
Requires-Dist: pandas>=1.1.3; python_version < "3.10"
|
|
29
|
+
Requires-Dist: pandas>=1.3.4; python_version >= "3.10" and python_version < "3.11"
|
|
30
|
+
Requires-Dist: pandas>=1.5.0; python_version >= "3.11"
|
|
31
|
+
Requires-Dist: plotly<6,>=5.10.0
|
|
32
|
+
Requires-Dist: scipy<2,>=1.5.4; python_version < "3.10"
|
|
33
|
+
Requires-Dist: scipy<2,>=1.9.2; python_version >= "3.10"
|
|
34
|
+
Provides-Extra: tutorials
|
|
35
|
+
Requires-Dist: markupsafe<=2.0.1; extra == "tutorials"
|
|
36
|
+
Requires-Dist: scikit-learn<1.2,>=0.24; extra == "tutorials"
|
|
37
|
+
Requires-Dist: jupyter<2,>=1.0.0; extra == "tutorials"
|
|
38
|
+
Provides-Extra: test
|
|
39
|
+
Requires-Dist: copulas[tutorials]; extra == "test"
|
|
40
|
+
Requires-Dist: pytest<7,>=6.2.5; extra == "test"
|
|
41
|
+
Requires-Dist: pytest-cov<3,>=2.6.0; extra == "test"
|
|
42
|
+
Requires-Dist: pytest-rerunfailures<10,>=9.0.0; extra == "test"
|
|
43
|
+
Requires-Dist: rundoc<0.5,>=0.4.3; extra == "test"
|
|
44
|
+
Requires-Dist: tomli<3,>=2.0.0; extra == "test"
|
|
45
|
+
Provides-Extra: dev
|
|
46
|
+
Requires-Dist: copulas[test,tutorials]; extra == "dev"
|
|
47
|
+
Requires-Dist: pip>=9.0.1; extra == "dev"
|
|
48
|
+
Requires-Dist: build<2,>=1.0.0; extra == "dev"
|
|
49
|
+
Requires-Dist: bump-my-version<1,>=0.18.3; extra == "dev"
|
|
50
|
+
Requires-Dist: watchdog<0.11,>=0.8.3; extra == "dev"
|
|
51
|
+
Requires-Dist: m2r<0.3,>=0.2.0; extra == "dev"
|
|
52
|
+
Requires-Dist: nbsphinx<0.7,>=0.5.0; extra == "dev"
|
|
53
|
+
Requires-Dist: Sphinx<3,>=1.7.1; extra == "dev"
|
|
54
|
+
Requires-Dist: sphinx_rtd_theme<0.5,>=0.2.4; extra == "dev"
|
|
55
|
+
Requires-Dist: Jinja2<3,>=2; extra == "dev"
|
|
56
|
+
Requires-Dist: flake8<4,>=3.7.7; extra == "dev"
|
|
57
|
+
Requires-Dist: isort<5,>=4.3.4; extra == "dev"
|
|
58
|
+
Requires-Dist: flake8-debugger<4.1,>=4.0.0; extra == "dev"
|
|
59
|
+
Requires-Dist: flake8-mock<0.4,>=0.3; extra == "dev"
|
|
60
|
+
Requires-Dist: flake8-mutable<1.3,>=1.2.0; extra == "dev"
|
|
61
|
+
Requires-Dist: flake8-fixme<1.2,>=1.1.1; extra == "dev"
|
|
62
|
+
Requires-Dist: pep8-naming<0.13,>=0.12.1; extra == "dev"
|
|
63
|
+
Requires-Dist: dlint<0.12,>=0.11.0; extra == "dev"
|
|
64
|
+
Requires-Dist: flake8-docstrings<2,>=1.5.0; extra == "dev"
|
|
65
|
+
Requires-Dist: pydocstyle<6.2,>=6.1.1; extra == "dev"
|
|
66
|
+
Requires-Dist: flake8-pytest-style<2,>=1.5.0; extra == "dev"
|
|
67
|
+
Requires-Dist: flake8-comprehensions<3.7,>=3.6.1; extra == "dev"
|
|
68
|
+
Requires-Dist: flake8-print<4.1,>=4.0.0; extra == "dev"
|
|
69
|
+
Requires-Dist: flake8-expression-complexity<0.1,>=0.0.9; extra == "dev"
|
|
70
|
+
Requires-Dist: flake8-multiline-containers<0.1,>=0.0.18; extra == "dev"
|
|
71
|
+
Requires-Dist: pandas-vet<0.3,>=0.2.2; extra == "dev"
|
|
72
|
+
Requires-Dist: flake8-builtins<1.6,>=1.5.3; extra == "dev"
|
|
73
|
+
Requires-Dist: flake8-eradicate<1.2,>=1.1.0; extra == "dev"
|
|
74
|
+
Requires-Dist: flake8-quotes<4,>=3.3.0; extra == "dev"
|
|
75
|
+
Requires-Dist: flake8-variables-names<0.1,>=0.0.4; extra == "dev"
|
|
76
|
+
Requires-Dist: flake8-sfs<0.1,>=0.0.3; extra == "dev"
|
|
77
|
+
Requires-Dist: flake8-absolute-import<2,>=1.0; extra == "dev"
|
|
78
|
+
Requires-Dist: autoflake<2,>=1.1; extra == "dev"
|
|
79
|
+
Requires-Dist: autopep8<1.6,>=1.4.3; extra == "dev"
|
|
80
|
+
Requires-Dist: twine<4,>=1.10.0; extra == "dev"
|
|
81
|
+
Requires-Dist: wheel>=0.30.0; extra == "dev"
|
|
82
|
+
Requires-Dist: coverage<6,>=4.5.1; extra == "dev"
|
|
83
|
+
Requires-Dist: tox<4,>=2.9.1; extra == "dev"
|
|
84
|
+
Requires-Dist: invoke; extra == "dev"
|
|
85
|
+
Requires-Dist: doc8<0.9,>=0.8.0; extra == "dev"
|
|
86
|
+
Requires-Dist: urllib3<1.26,>=1.20; extra == "dev"
|
|
87
|
+
Requires-Dist: tabulate<0.9,>=0.8.3; extra == "dev"
|
|
88
|
+
Requires-Dist: boto3<1.10,>=1.7.47; extra == "dev"
|
|
89
|
+
Requires-Dist: docutils<0.15,>=0.10; extra == "dev"
|
|
90
|
+
|
|
91
|
+
<p style="text-align:center">
|
|
92
|
+
<i>This repository is part of <a href="https://sdv.dev">The Synthetic Data Vault Project</a>, a project from <a href="https://datacebo.com">DataCebo</a>.</i>
|
|
93
|
+
</p>
|
|
94
|
+
|
|
95
|
+
[](https://pypi.org/search/?c=Development+Status+%3A%3A+2+-+Pre-Alpha)
|
|
96
|
+
[](https://pypi.python.org/pypi/copulas)
|
|
97
|
+
[](https://pepy.tech/project/copulas)
|
|
98
|
+
[](https://github.com/sdv-dev/Copulas/actions/workflows/unit.yml)
|
|
99
|
+
[](https://codecov.io/gh/sdv-dev/Copulas)
|
|
100
|
+
[](https://bit.ly/sdv-slack-invite)
|
|
101
|
+
|
|
102
|
+
<br/>
|
|
103
|
+
<p align="center" style="text-align:center">
|
|
104
|
+
<a href="https://github.com/sdv-dev/Copulas">
|
|
105
|
+
<img width=40% src="https://github.com/sdv-dev/SDV/blob/stable/docs/images/Copulas-DataCebo.png?raw=true"></img>
|
|
106
|
+
</a>
|
|
107
|
+
</p>
|
|
108
|
+
|
|
109
|
+
# Overview
|
|
110
|
+
|
|
111
|
+
**Copulas** is a Python library for modeling multivariate distributions and sampling from them
|
|
112
|
+
using copula functions.
|
|
113
|
+
Given a table of numerical data, use Copulas to learn the distribution and
|
|
114
|
+
generate new synthetic data following the same statistical properties.
|
|
115
|
+
|
|
116
|
+
**Key Features:**
|
|
117
|
+
|
|
118
|
+
* **Model multivariate data.** Choose from a variety of univariate
|
|
119
|
+
distributions and copulas – including Archimedean Copulas, Gaussian Copulas and Vine Copulas.
|
|
120
|
+
|
|
121
|
+
* **Compare real and synthetic data visually** after building your model. Visualizations
|
|
122
|
+
are available as 1D histograms, 2D scatterplots and 3D scatterplots.
|
|
123
|
+
|
|
124
|
+
* **Access & manipulate learned parameters.** With complete access to the internals
|
|
125
|
+
of the model, set or tune parameters to your choosing.
|
|
126
|
+
|
|
127
|
+
# Install
|
|
128
|
+
|
|
129
|
+
Install the Copulas library using pip or conda.
|
|
130
|
+
|
|
131
|
+
```bash
|
|
132
|
+
pip install copulas
|
|
133
|
+
```
|
|
134
|
+
|
|
135
|
+
```bash
|
|
136
|
+
conda install -c conda-forge copulas
|
|
137
|
+
```
|
|
138
|
+
|
|
139
|
+
# Usage
|
|
140
|
+
|
|
141
|
+
Get started using a demo dataset. This dataset contains 3 numerical columns.
|
|
142
|
+
|
|
143
|
+
```python
|
|
144
|
+
from copulas.datasets import sample_trivariate_xyz
|
|
145
|
+
|
|
146
|
+
real_data = sample_trivariate_xyz()
|
|
147
|
+
real_data.head()
|
|
148
|
+
```
|
|
149
|
+
|
|
150
|
+
<img src="docs/images/copulas_sample_dataset.png" width="300">
|
|
151
|
+
|
|
152
|
+
Model the data using a copula and use it to create synthetic data.
|
|
153
|
+
The Copulas library offers many options including Gaussian Copula,
|
|
154
|
+
Vine Copulas and Archimedean Copulas.
|
|
155
|
+
|
|
156
|
+
```python
|
|
157
|
+
from copulas.multivariate import GaussianMultivariate
|
|
158
|
+
|
|
159
|
+
copula = GaussianMultivariate()
|
|
160
|
+
copula.fit(real_data)
|
|
161
|
+
|
|
162
|
+
synthetic_data = copula.sample(len(real_data))
|
|
163
|
+
```
|
|
164
|
+
|
|
165
|
+
Visualize the real and synthetic data side-by-side. Let's do this in 3D to see our full dataset.
|
|
166
|
+
|
|
167
|
+
```python
|
|
168
|
+
from copulas.visualization import compare_3d
|
|
169
|
+
|
|
170
|
+
compare_3d(real_data, synthetic_data)
|
|
171
|
+
```
|
|
172
|
+
|
|
173
|
+

|
|
174
|
+
|
|
175
|
+
# Tutorials
|
|
176
|
+
Click below to run the code yourself on a Colab Notebook and discover new features.
|
|
177
|
+
|
|
178
|
+
[](https://bit.ly/copulas-demo)
|
|
179
|
+
|
|
180
|
+
# Community & Support
|
|
181
|
+
|
|
182
|
+
Learn more about the Copulas library from our [documentation](https://sdv.dev/Copulas/) site.
|
|
183
|
+
|
|
184
|
+
**Questions or issues?** Join our [Slack channel](https://bit.ly/sdv-slack-invite)
|
|
185
|
+
to discuss more about Copulas and synthetic data.
|
|
186
|
+
If you find a bug or have a feature request, you can also
|
|
187
|
+
[open an issue](https://github.com/sdv-dev/Copulas/issues/new/choose) on our GitHub.
|
|
188
|
+
|
|
189
|
+
**Interested in contributing to Copulas?** Read our
|
|
190
|
+
[Contribution Guide](https://sdv.dev/Copulas/contributing.html) to get started.
|
|
191
|
+
|
|
192
|
+
# Credits
|
|
193
|
+
|
|
194
|
+
The Copulas open source project first started at the Data to AI Lab at MIT in 2018.
|
|
195
|
+
Thank you to our team of contributors who have built and maintained the library over the years!
|
|
196
|
+
|
|
197
|
+
[View Contributors](https://github.com/sdv-dev/Copulas/graphs/contributors)
|
|
198
|
+
|
|
199
|
+
---
|
|
200
|
+
|
|
201
|
+
|
|
202
|
+
<div align="center">
|
|
203
|
+
<a href="https://datacebo.com"><img align="center" width=40% src="https://github.com/sdv-dev/SDV/blob/stable/docs/images/DataCebo.png?raw=true"></img></a>
|
|
204
|
+
</div>
|
|
205
|
+
<br/>
|
|
206
|
+
<br/>
|
|
207
|
+
|
|
208
|
+
[The Synthetic Data Vault Project](https://sdv.dev) was first created at MIT's [Data to AI Lab](
|
|
209
|
+
https://dai.lids.mit.edu/) in 2016. After 4 years of research and traction with enterprise, we
|
|
210
|
+
created [DataCebo](https://datacebo.com) in 2020 with the goal of growing the project.
|
|
211
|
+
Today, DataCebo is the proud developer of SDV, the largest ecosystem for
|
|
212
|
+
synthetic data generation & evaluation. It is home to multiple libraries that support synthetic
|
|
213
|
+
data, including:
|
|
214
|
+
|
|
215
|
+
* 🔄 Data discovery & transformation. Reverse the transforms to reproduce realistic data.
|
|
216
|
+
* 🧠 Multiple machine learning models -- ranging from Copulas to Deep Learning -- to create tabular,
|
|
217
|
+
multi table and time series data.
|
|
218
|
+
* 📊 Measuring quality and privacy of synthetic data, and comparing different synthetic data
|
|
219
|
+
generation models.
|
|
220
|
+
|
|
221
|
+
[Get started using the SDV package](https://sdv.dev/SDV/getting_started/install.html) -- a fully
|
|
222
|
+
integrated solution and your one-stop shop for synthetic data. Or, use the standalone libraries
|
|
223
|
+
for specific needs.
|
|
@@ -0,0 +1,37 @@
|
|
|
1
|
+
LICENSE
|
|
2
|
+
README.md
|
|
3
|
+
pyproject.toml
|
|
4
|
+
setup.cfg
|
|
5
|
+
copulas/__init__.py
|
|
6
|
+
copulas/datasets.py
|
|
7
|
+
copulas/visualization.py
|
|
8
|
+
copulas.egg-info/PKG-INFO
|
|
9
|
+
copulas.egg-info/SOURCES.txt
|
|
10
|
+
copulas.egg-info/dependency_links.txt
|
|
11
|
+
copulas.egg-info/requires.txt
|
|
12
|
+
copulas.egg-info/top_level.txt
|
|
13
|
+
copulas/bivariate/__init__.py
|
|
14
|
+
copulas/bivariate/base.py
|
|
15
|
+
copulas/bivariate/clayton.py
|
|
16
|
+
copulas/bivariate/frank.py
|
|
17
|
+
copulas/bivariate/gumbel.py
|
|
18
|
+
copulas/bivariate/independence.py
|
|
19
|
+
copulas/bivariate/utils.py
|
|
20
|
+
copulas/multivariate/__init__.py
|
|
21
|
+
copulas/multivariate/base.py
|
|
22
|
+
copulas/multivariate/gaussian.py
|
|
23
|
+
copulas/multivariate/tree.py
|
|
24
|
+
copulas/multivariate/vine.py
|
|
25
|
+
copulas/optimize/__init__.py
|
|
26
|
+
copulas/univariate/__init__.py
|
|
27
|
+
copulas/univariate/base.py
|
|
28
|
+
copulas/univariate/beta.py
|
|
29
|
+
copulas/univariate/gamma.py
|
|
30
|
+
copulas/univariate/gaussian.py
|
|
31
|
+
copulas/univariate/gaussian_kde.py
|
|
32
|
+
copulas/univariate/log_laplace.py
|
|
33
|
+
copulas/univariate/selection.py
|
|
34
|
+
copulas/univariate/student_t.py
|
|
35
|
+
copulas/univariate/truncated_gaussian.py
|
|
36
|
+
copulas/univariate/uniform.py
|
|
37
|
+
tests/test_tasks.py
|
|
@@ -16,12 +16,10 @@ pandas>=1.3.4
|
|
|
16
16
|
pandas>=1.5.0
|
|
17
17
|
|
|
18
18
|
[dev]
|
|
19
|
-
|
|
20
|
-
pytest-cov<3,>=2.6.0
|
|
21
|
-
pytest-rerunfailures<10,>=9.0.0
|
|
22
|
-
rundoc<0.5,>=0.4.3
|
|
19
|
+
copulas[test,tutorials]
|
|
23
20
|
pip>=9.0.1
|
|
24
|
-
|
|
21
|
+
build<2,>=1.0.0
|
|
22
|
+
bump-my-version<1,>=0.18.3
|
|
25
23
|
watchdog<0.11,>=0.8.3
|
|
26
24
|
m2r<0.3,>=0.2.0
|
|
27
25
|
nbsphinx<0.7,>=0.5.0
|
|
@@ -62,18 +60,14 @@ urllib3<1.26,>=1.20
|
|
|
62
60
|
tabulate<0.9,>=0.8.3
|
|
63
61
|
boto3<1.10,>=1.7.47
|
|
64
62
|
docutils<0.15,>=0.10
|
|
65
|
-
markupsafe<=2.0.1
|
|
66
|
-
scikit-learn<1.2,>=0.24
|
|
67
|
-
jupyter<2,>=1.0.0
|
|
68
63
|
|
|
69
64
|
[test]
|
|
65
|
+
copulas[tutorials]
|
|
70
66
|
pytest<7,>=6.2.5
|
|
71
67
|
pytest-cov<3,>=2.6.0
|
|
72
68
|
pytest-rerunfailures<10,>=9.0.0
|
|
73
69
|
rundoc<0.5,>=0.4.3
|
|
74
|
-
|
|
75
|
-
scikit-learn<1.2,>=0.24
|
|
76
|
-
jupyter<2,>=1.0.0
|
|
70
|
+
tomli<3,>=2.0.0
|
|
77
71
|
|
|
78
72
|
[tutorials]
|
|
79
73
|
markupsafe<=2.0.1
|