PyPI - skxperiments - Versions diffs - 0.1.0.dev0__py3-none-any.whl - Mend

skxperiments 0.1.0.dev0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (36) hide show

skxperiments/__init__.py +5 -0
skxperiments/core/__init__.py +42 -0
skxperiments/core/assignment.py +589 -0
skxperiments/core/base.py +512 -0
skxperiments/core/exceptions.py +145 -0
skxperiments/core/potential_outcomes.py +168 -0
skxperiments/core/results.py +624 -0
skxperiments/design/__init__.py +22 -0
skxperiments/design/balance.py +182 -0
skxperiments/design/blocked_crd.py +157 -0
skxperiments/design/crd.py +162 -0
skxperiments/design/factorial.py +174 -0
skxperiments/design/power.py +233 -0
skxperiments/design/rerandomized_crd.py +319 -0
skxperiments/diagnostics/__init__.py +21 -0
skxperiments/diagnostics/aa_test.py +277 -0
skxperiments/diagnostics/balance_report.py +224 -0
skxperiments/diagnostics/srm.py +327 -0
skxperiments/estimators/__init__.py +23 -0
skxperiments/estimators/blocked_difference_in_means.py +197 -0
skxperiments/estimators/cuped.py +280 -0
skxperiments/estimators/difference_in_means.py +161 -0
skxperiments/estimators/factorial_estimator.py +213 -0
skxperiments/estimators/lin_estimator.py +298 -0
skxperiments/inference/__init__.py +17 -0
skxperiments/inference/bootstrap.py +450 -0
skxperiments/inference/multiple.py +365 -0
skxperiments/inference/neyman.py +386 -0
skxperiments/inference/randomization_test.py +319 -0
skxperiments/pipeline.py +366 -0
skxperiments/reporting/__init__.py +30 -0
skxperiments/reporting/plots.py +411 -0
skxperiments/reporting/summary.py +185 -0
skxperiments-0.1.0.dev0.dist-info/METADATA +272 -0
skxperiments-0.1.0.dev0.dist-info/RECORD +36 -0
skxperiments-0.1.0.dev0.dist-info/WHEEL +4 -0

skxperiments-0.1.0.dev0.dist-info/METADATA ADDED Viewed

@@ -0,0 +1,272 @@
+Metadata-Version: 2.4
+Name: skxperiments
+Version: 0.1.0.dev0
+Summary: Randomization-based experimental design and causal inference, sklearn-style.
+Project-URL: Homepage, https://github.com/gusbruschi13/skxperiments
+Project-URL: Repository, https://github.com/gusbruschi13/skxperiments
+Project-URL: Issues, https://github.com/gusbruschi13/skxperiments/issues
+Author-email: Gustavo Bruschi <gustavo.bruschi@riachuelo.com.br>
+License-Expression: MIT
+Keywords: ab-testing,causal-inference,design-of-experiments,experiments,potential-outcomes,randomization
+Classifier: Development Status :: 3 - Alpha
+Classifier: Intended Audience :: Science/Research
+Classifier: Operating System :: OS Independent
+Classifier: Programming Language :: Python :: 3
+Classifier: Programming Language :: Python :: 3.10
+Classifier: Programming Language :: Python :: 3.11
+Classifier: Programming Language :: Python :: 3.12
+Classifier: Topic :: Scientific/Engineering
+Requires-Python: >=3.10
+Requires-Dist: numpy
+Requires-Dist: pandas
+Requires-Dist: scipy
+Provides-Extra: dev
+Requires-Dist: black; extra == 'dev'
+Requires-Dist: hypothesis; extra == 'dev'
+Requires-Dist: ipykernel; extra == 'dev'
+Requires-Dist: matplotlib; extra == 'dev'
+Requires-Dist: mypy; extra == 'dev'
+Requires-Dist: nbmake; extra == 'dev'
+Requires-Dist: pre-commit; extra == 'dev'
+Requires-Dist: pytest; extra == 'dev'
+Requires-Dist: pytest-cov; extra == 'dev'
+Requires-Dist: ruff; extra == 'dev'
+Provides-Extra: viz
+Requires-Dist: matplotlib; extra == 'viz'
+Description-Content-Type: text/markdown
+# skxperiments
+> Randomization-based experimental design and causal inference, sklearn-style.
+![CI](https://github.com/gusbruschi13/skxperiments/actions/workflows/ci.yml/badge.svg)
+![Python](https://img.shields.io/badge/python-3.10%2B-blue)
+![Status](https://img.shields.io/badge/status-alpha-orange)
+A Python library for designing randomized experiments and estimating causal effects under the
+potential outcomes framework (Rubin Causal Model). Treatment assignment is the starting point;
+statistical models come second.
+## Status
+The v1 feature set is complete: Phases 0–7 are done (sequential testing is
+deferred to v2). See [Project status](#project-status) below for details.
+## Installation
+```bash
+pip install skxperiments
+```
+Requires Python 3.10+. Dependencies: `numpy`, `pandas`, `scipy`.
+## Quick start
+```python
+import numpy as np
+import pandas as pd
+from skxperiments.design.crd import CRD
+from skxperiments.estimators.difference_in_means import DifferenceInMeans
+from skxperiments.inference import RandomizationTest
+# 1. Generate a synthetic dataset
+rng = np.random.default_rng(42)
+df = pd.DataFrame({
+    "x": rng.normal(0.0, 1.0, 200),
+    "y": rng.normal(0.0, 1.0, 200),
+})
+# 2. Design: completely randomized assignment, 50/50 split
+design = CRD(p=0.5, seed=42)
+assignment = design.randomize(df)
+# 3. Point estimate of the ATE
+estimator = DifferenceInMeans(outcome_col="y")
+result = estimator.fit(assignment).estimate()
+print(result.ate)
+# 4. Randomization-based p-value (Fisher's sharp null)
+rt = RandomizationTest(estimator=estimator, n_permutations=10_000, seed=0)
+result = rt.fit(assignment).estimate()
+print(result.ate, result.p_value)
+```
+For variance reduction with covariates, use `LinEstimator` (Lin 2013) or `CUPED` (Deng et al.
+2013). For blocked or factorial designs, use `BlockedCRD` + `BlockedDifferenceInMeans` or
+`FactorialDesign` + `FactorialEstimator`. For rerandomization on Mahalanobis distance,
+use `ReRandomizedCRD` (Morgan & Rubin 2012). `RandomizationTest` works with all of these
+except factorial designs (`FactorialAssignment` is not supported in v1). To control the family-wise error rate or false
+discovery rate when reporting multiple effects, wrap the result in
+`MultipleTestingCorrection`.
+## Documentation and tutorials
+Learning-path notebooks (bilingual, Portuguese and English) live in
+[`examples/for_starters/`](examples/for_starters/); conceptual docs (a glossary
+and a "how to choose" guide) are in [`docs/`](docs/README.md).
+## Design philosophy
+1. **The assignment mechanism is primary**, not the statistical model.
+2. **API in scikit-learn style**: parameters in `__init__`, data in `fit()`, learned attributes
+   end with `_`.
+3. **`Assignment` is the contract** between designs and estimators — estimators receive
+   `Assignment` objects, not loose DataFrames.
+4. **Randomization-based inference is the default**; classical t-tests are not.
+5. **Finite-population and superpopulation inference are distinguished explicitly.**
+6. **Fail fast** with clear messages when designs and estimators are incompatible.
+7. **No side effects**: `fit()` and `randomize()` never mutate input DataFrames.
+## Project status
+| Phase | Module | Status |
+|---|---|---|
+| 0 | Scaffold, exceptions, CI | ✓ Complete |
+| 1 | Core (`Assignment`, `Results`, base classes) | ✓ Complete |
+| 2 | Designs (CRD, BlockedCRD, ReRandomizedCRD, FactorialDesign, balance, power) | ✓ Complete |
+| 3 | Estimators (DIM, BlockedDIM, Factorial, Lin, CUPED) | ✓ Complete |
+| 4 | Inference (RandomizationTest, MultipleTestingCorrection, NeymanCI, BootstrapCI) | ✓ Complete (4.1–4.4; sequential → v2) |
+| 5 | Diagnostics (SRMTest, AATest, BalanceReport) | ✓ Complete |
+| 6 | Pipeline (ExperimentPipeline, ExperimentComparison) | ✓ Complete |
+| 7 | Visualization and reporting (plots, ExperimentReport) | ✓ Complete |
+Test suite: 720 tests, all passing on CI.
+See [`ROADMAP.md`](ROADMAP.md) for deferred features and v2 plans, and `CHANGELOG.md` for the
+full history of changes.
+## What's implemented
+### Designs (`skxperiments.design`)
+- **`CRD`** — Completely randomized design.
+- **`BlockedCRD`** — Independent randomization within blocks.
+- **`ReRandomizedCRD`** — Mahalanobis acceptance criterion with cached covariance matrix; loop with `max_attempts`.
+- **`FactorialDesign`** — 2^K factorial design with equal cell sizes; little-endian cell encoding.
+- **`check_balance(assignment, covariates)`** — Standardized mean differences (SMD), pooled std with `ddof=1`.
+- **`power_analysis(...)`** — Sample size, MDE, or power for two-sample mean comparisons.
+### Estimators (`skxperiments.estimators`)
+- **`DifferenceInMeans`** — Simple ATE for `CRDAssignment`.
+- **`BlockedDifferenceInMeans`** — Size-weighted ATE for `BlockedAssignment`.
+- **`FactorialEstimator`** — All 2^K − 1 effects (main effects and interactions of all orders) for `FactorialAssignment`. Returns `Results` in multi-effect mode.
+- **`LinEstimator`** — Covariate-adjusted ATE via OLS with treatment-covariate interaction (Lin 2013).
+- **`CUPED`** — Variance reduction with a pre-experiment covariate (Deng et al. 2013).
+All estimators return `Results` with point estimates only; standard errors and confidence
+intervals come from inference classes in `skxperiments.inference`.
+### Inference (`skxperiments.inference`)
+- **`RandomizationTest`** — Fisher's sharp null hypothesis test via Monte Carlo permutations.
+  Uses `Assignment.draw()` to respect the original randomization mechanism (including
+  the Mahalanobis rerandomization criterion and within-block proportions). P-value via the
+  Phipson & Smyth (2010) continuity correction. Three alternatives: `"two-sided"`,
+  `"greater"`, `"less"`. Works with `DifferenceInMeans`, `BlockedDifferenceInMeans`,
+  `LinEstimator`, and `CUPED`.
+- **`MultipleTestingCorrection`** — Bonferroni, Holm (FWER) and Benjamini-Hochberg (FDR)
+  correction over a family of p-values. Accepts a multi-effect `Results` (typical from
+  `FactorialEstimator` after inference) or a list of scalar `Results` (for comparing
+  independent experiments). Clips corrected p-values to `[0, 1]`; preserves originals
+  in `Results.extra["original_p_values"]`. Default method is Holm.
+- **`NeymanCI`** — Neyman variance-based two-sided Wald confidence interval and p-value
+  for finite-population inference. Conservative variance for `CRDAssignment` (including
+  rerandomized) and stratified variance for `BlockedAssignment`, consistent with the
+  size-weighted ATE of `BlockedDifferenceInMeans`. Wraps `DifferenceInMeans` or
+  `BlockedDifferenceInMeans`; rejects superpopulation mode (use `BootstrapCI`).
+- **`BootstrapCI`** — Bootstrap confidence interval (percentile or BCa) for
+  superpopulation inference. Resamples units within each arm (within each
+  block-by-arm stratum for blocked designs) and refits the estimator, so it
+  works with any scalar estimator (`DifferenceInMeans`, `BlockedDifferenceInMeans`,
+  `LinEstimator`, `CUPED`).
+### Diagnostics (`skxperiments.diagnostics`)
+- **`SRMTest`** — Sample Ratio Mismatch via chi-squared: observed vs. intended arm/cell
+  allocation, flagged below a threshold (default 0.001). Two-arm and factorial.
+- **`BalanceReport`** — Standardized mean differences (SMD) per covariate, flagging
+  `|SMD| > 0.1`. Consumes `check_balance`; `to_dataframe()` feeds the Phase 7 Love plot.
+- **`AATest`** — A/A calibration: re-randomizes a design on fixed data, runs a wrapped
+  inference, and checks the false-positive rate (exact binomial test) and p-value
+  uniformity (KS).
+Each returns a dedicated result with `to_diagnostics_report()` for pipeline aggregation.
+### Pipeline (`skxperiments.pipeline`)
+- **`ExperimentPipeline`** — Composes an inference (with its estimator) and diagnostics,
+  runs them on an `Assignment`, and bundles the result. Runs `SRMTest` automatically;
+  diagnostics are best-effort and flags are surfaced without halting (opt-in
+  `raise_on_flag`).
+- **`ExperimentComparison`** — Compares independent experiments, applying
+  `MultipleTestingCorrection` across the family. Returns a comparison table ready for the
+  forest plot. Subgroup comparison is deferred to v2.
+### Reporting (`skxperiments.reporting`)
+Requires the optional `viz` extra (`pip install "skxperiments[viz]"`).
+- **Plots** — diagnostic (`plot_balance`, `plot_srm`, `plot_null_distribution`) and result
+  (`plot_effect`, `plot_forest`, `plot_interaction`, `plot_power_curve`). Each returns a
+  matplotlib `Axes` and accepts an optional `ax`.
+- **`ExperimentReport`** — Renders a `PipelineResult` as a self-contained static HTML page
+  (results table, diagnostics, embedded plots). `include_plots=False` skips the optional
+  dependency.
+## What's next (v2)
+The v1 feature set is complete. Deferred items live in [`ROADMAP.md`](ROADMAP.md):
+`SequentialTest` (mSPRT/always-valid), Benjamini-Yekutieli correction, covariate-adjusted
+variance in `NeymanCI`, studentized and block-resampling bootstrap, subgroup comparison,
+a plotly backend, and interactive dashboards.
+## Contributing
+Contributions are welcome. Please open an issue to discuss substantial changes before submitting
+a pull request. The architecture has documented design decisions that should be respected — see
+[`ROADMAP.md`](ROADMAP.md), the project notes in `CHANGELOG.md`, and the docstrings of base
+classes (`BaseAssignment`, `BaseEstimator`, `Results`) for the contracts new code must follow.
+Run the test suite with:
+```bash
+pytest tests/ -v
+```
+Skip slow statistical tests:
+```bash
+pytest tests/ -v -m "not slow"
+```
+## License
+MIT.
+## References
+The implementations follow standard textbook formulations:
+- Imbens, G. W., & Rubin, D. B. (2015). *Causal inference for statistics, social, and biomedical
+  sciences: An introduction.* Cambridge University Press.
+- Lin, W. (2013). Agnostic notes on regression adjustments to experimental data: Reexamining
+  Freedman's critique. *Annals of Applied Statistics*, 7(1), 295–318.
+- Morgan, K. L., & Rubin, D. B. (2012). Rerandomization to improve covariate balance in
+  experiments. *Annals of Statistics*, 40(2), 1263–1282.
+- Deng, A., Xu, Y., Kohavi, R., & Walker, T. (2013). Improving the sensitivity of online
+  controlled experiments by utilizing pre-experiment data. *WSDM 2013*.
+- Box, G. E. P., Hunter, J. S., & Hunter, W. G. (2005). *Statistics for experimenters: Design,
+  innovation, and discovery* (2nd ed.). Wiley.
+- Cohen, J. (1988). *Statistical power analysis for the behavioral sciences* (2nd ed.). Routledge.
+- Austin, P. C. (2009). Balance diagnostics for comparing the distribution of baseline covariates
+  between treatment groups in propensity-score matched samples. *Statistics in Medicine*,
+  28(25), 3083–3107.
+- Phipson, B., & Smyth, G. K. (2010). Permutation P-values should never be zero: calculating
+  exact P-values when permutations are randomly drawn. *Statistical Applications in Genetics
+  and Molecular Biology*, 9(1).
+- Fisher, R. A. (1935). *The Design of Experiments*. Oliver and Boyd.
+- Holm, S. (1979). A simple sequentially rejective multiple test procedure. *Scandinavian
+  Journal of Statistics*, 6(2), 65–70.
+- Benjamini, Y., & Hochberg, Y. (1995). Controlling the false discovery rate: a practical and
+  powerful approach to multiple testing. *Journal of the Royal Statistical Society: Series B*,
+  57(1), 289–300.

skxperiments-0.1.0.dev0.dist-info/RECORD ADDED Viewed

@@ -0,0 +1,36 @@
+skxperiments/__init__.py,sha256=zQDBS0g4SM9rsIDgYxaKbWzQqatRFQpWpkEg9j9esgs,139
+skxperiments/pipeline.py,sha256=2njPU2qxu0vdeQFi2i0RLBm81zc6xDFn8v2HXMNp6k8,13343
+skxperiments/core/__init__.py,sha256=V53NjlelwN8lSwHq_f0UhgVIneL2Q2dNSYxSyz-B-5w,1270
+skxperiments/core/assignment.py,sha256=gq96xZD9_b7jDSizAdRyX4jOymzGZj2UwJkaoz1dHj8,20559
+skxperiments/core/base.py,sha256=jQ3yc2wzmvm1wKXtbdolw3Li60KY4l1COcIXZPwhAUw,15829
+skxperiments/core/exceptions.py,sha256=6WpfdCNDER9w5NQgHu-2LQNM2JdDuB2Bb03L2SMzY9A,4135
+skxperiments/core/potential_outcomes.py,sha256=yvcZYT_mjLoX_ijuZHGSmrj3wqcTVFMcht_QcsYSBjs,4794
+skxperiments/core/results.py,sha256=ECQsJ4nIO8PFuO-Ac9si474E-1xB4hZYm0Lm4mScDmE,24173
+skxperiments/design/__init__.py,sha256=So_cHRb285y3UzGebwnw6zRswKOcxpNyiZHgE2CeCc0,692
+skxperiments/design/balance.py,sha256=B6BKhkJfenwKjc_0bLNrbXRB-Gcqp3R4n2tBtLmZZis,6102
+skxperiments/design/blocked_crd.py,sha256=5letYzEMkOF_F7XRMkj0cpF5fFmQry_lUaCBr_NCh3w,5491
+skxperiments/design/crd.py,sha256=hfYAhWRo13z5SEkx_raYlg-UyzrHTTqxYAS8H1atMq0,5452
+skxperiments/design/factorial.py,sha256=MZ9CLbHl4eDyirIQt6detjaRwhYn7NLTov_EJvz50FQ,5968
+skxperiments/design/power.py,sha256=hbbr9d7lvptKyvb33vLFj369izQ6kr7P-B1T0Hr1lcI,7619
+skxperiments/design/rerandomized_crd.py,sha256=d7hwIXVpDRqoQag8dmZIul6KAPff9TyJ16kWEtjSezM,11768
+skxperiments/diagnostics/__init__.py,sha256=IMqNGzyNDErXECJDAe614wyDCthtXUENF4026AGw9nE,548
+skxperiments/diagnostics/aa_test.py,sha256=ny7jyYEro2Q7qgwN_v5hdkzdUIBIJexe3PefGeLuA_I,10876
+skxperiments/diagnostics/balance_report.py,sha256=5RxraXUSPxNOGcXi1Hbqm7qzG8-hxh4CbGRiYZFvQZI,7938
+skxperiments/diagnostics/srm.py,sha256=lVU3M0VU0SX5_uCg2ATeNZ1NcYzVR1sTa1A5szS_jgE,12287
+skxperiments/estimators/__init__.py,sha256=q8ONWo11PPkuUwkDFG-wbTbJaTbQppNknPle4rJvhO4,752
+skxperiments/estimators/blocked_difference_in_means.py,sha256=9Wve756AlOziJVGjkObTxnEfcjDYSZZ31Gd4hkKOiGk,7538
+skxperiments/estimators/cuped.py,sha256=5qHSutrQxtdLfyj4KtLjTL4ENYmsnVuZJ7K3sQ-T4XM,10642
+skxperiments/estimators/difference_in_means.py,sha256=ZE-cP42hImaBMSidxwo-7cSw9l_VUubIndAJwSDBJM0,5662
+skxperiments/estimators/factorial_estimator.py,sha256=tPxRI2g1i3BZdQX-Am68MDDA3bOJV0vWZ5AWdl7rap8,7754
+skxperiments/estimators/lin_estimator.py,sha256=D6hiSmwd2Uyx5PJl7k0hCHOC2lNDl1u0wayMgKheNbk,11001
+skxperiments/inference/__init__.py,sha256=rs_MMI7O3zhrWYoqGABy7JO9qKbL7dbReRkMQJJGrjY,545
+skxperiments/inference/bootstrap.py,sha256=PPFvOjBSt5C6l0iMVtOQXnFBbH7LEj9aauitsh3kQlo,17893
+skxperiments/inference/multiple.py,sha256=y9KiW693iYIdqK58K1sBv-42Y3Iw39X9KSL3s21m4GA,13573
+skxperiments/inference/neyman.py,sha256=wTNZmnpLNEevd0apOU-GUWqF4kGM_wVlPNriMkxazzw,14903
+skxperiments/inference/randomization_test.py,sha256=M4uvNQDaweinNx5Jg2hvFFdO6UYQy8ltaGzcc9WvitA,13123
+skxperiments/reporting/__init__.py,sha256=njiThCyqBGT0JUaWa0MCDvOY8K07L3Bw8Wwc2XoHX_g,844
+skxperiments/reporting/plots.py,sha256=JPzLmoZu46Vv0gpeyDnEWiMX4AMuZBp4rzEx8w9fVnI,12731
+skxperiments/reporting/summary.py,sha256=XcEUVPN8MxVHXdQR25PBc9DIGtIZM7LhDw0_oVnvM2Y,6759
+skxperiments-0.1.0.dev0.dist-info/METADATA,sha256=mV0bukgv6p_FOnRnf0dyzpihzxepoihAcacKF0_ZV5o,12924
+skxperiments-0.1.0.dev0.dist-info/WHEEL,sha256=mffPy8wBnZQn2VnJUU5jE99KsxaSfiyMHV9Yt0aLVxs,87
+skxperiments-0.1.0.dev0.dist-info/RECORD,,

skxperiments-0.1.0.dev0.dist-info/WHEEL ADDED Viewed

@@ -0,0 +1,4 @@
+Wheel-Version: 1.0
+Generator: hatchling 1.30.1
+Root-Is-Purelib: true
+Tag: py3-none-any