PyPI - statslibx - Versions diffs - 0.1.8__py3-none-any.whl → 0.2.0__py3-none-any.whl - Mend

statslibx 0.1.8__py3-none-any.whl → 0.2.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (18) hide show

statslibx/__init__.py +5 -5
statslibx/computacional.py +126 -2
statslibx/datasets/__init__.py +27 -11
statslibx/datasets/course_completion.csv +100001 -0
statslibx/datasets/iris.csv +151 -0
statslibx/datasets/penguins.csv +345 -0
statslibx/datasets/sp500_companies.csv +504 -0
statslibx/datasets/titanic.csv +419 -0
statslibx/descriptive.py +74 -8
statslibx/inferential.py +67 -6
statslibx/utils.py +71 -13
{statslibx-0.1.8.dist-info → statslibx-0.2.0.dist-info}/METADATA +5 -5
statslibx-0.2.0.dist-info/RECORD +19 -0
{statslibx-0.1.8.dist-info → statslibx-0.2.0.dist-info}/WHEEL +1 -1
statslibx/probability.py +0 -2
statslibx-0.1.8.dist-info/RECORD +0 -15
{statslibx-0.1.8.dist-info → statslibx-0.2.0.dist-info}/entry_points.txt +0 -0
{statslibx-0.1.8.dist-info → statslibx-0.2.0.dist-info}/top_level.txt +0 -0

statslibx/utils.py CHANGED Viewed

@@ -11,23 +11,81 @@ from pathlib import Path
 class UtilsStats:
     """
-    Clase utilitaria para operaciones estadísticas comunes y visualización
+    UtilsStats
+    A utility class for common statistical operations and visualization.
+    This class provides methods for data validation, basic statistical analysis,
+    and visualization of results. It also supports loading data directly from files.
+    >>> # Load data from a file
+    >>> data = utils.load_data("data.csv")
+    >>> utils.check_normality(data, column='age')
+    >>> # Analyze data from an array
+    Methods:
+    --------
+    _setup_plotting_style():
+        Configures default plotting styles for matplotlib.
-    Esta clase proporciona métodos para validación de datos, análisis estadísticos
-    básicos y visualización de resultados. Ahora con soporte para leer archivos directamente.
+    set_plot_backend(backend: Literal['matplotlib', 'seaborn', 'plotly']):
+        Sets the default visualization backend.
-    Examples:
-    ---------
-    >>> utils = UtilsStats()
-    >>> # Desde archivo
-    >>> data = utils.load_data("datos.csv")
-    >>> utils.check_normality(data, column='edad')
-    >>> # Desde array
-    >>> data = np.random.normal(0, 1, 100)
-    >>> utils.check_normality(data)
-    >>> utils.plot_distribution(data)
+    set_default_figsize(figsize: Tuple[int, int]):
+        Sets the default figure size for plots.
+    set_save_fig_options(save_fig: Optional[bool] = False, fig_format: str = 'png',
+                         fig_dpi: int = 300, figures_dir: str = 'figures'):
+        Configures options for saving figures.
+    load_data(path: Union[str, Path], **kwargs) -> pd.DataFrame:
+        Loads data from a file in various formats (CSV, Excel, JSON, etc.).
+    validate_dataframe(data: Union[pd.DataFrame, np.ndarray, list, str, Path]) -> pd.DataFrame:
+        Validates and converts data to a DataFrame. Also accepts file paths.
+    format_number(num: float, decimals: int = 6, scientific: bool = False) -> str:
+        Formats a number with specified decimal places.
+    check_normality(data: Union[pd.Series, np.ndarray, pd.DataFrame, str, Path],
+                    column: Optional[str] = None, alpha: float = 0.05) -> dict:
+        Checks if the data follows a normal distribution using the Shapiro-Wilk test.
+    calculate_confidence_intervals(data: Union[pd.Series, np.ndarray, pd.DataFrame, str, Path],
+                                    column: Optional[str] = None, confidence_level: float = 0.95,
+        Calculates confidence intervals for the mean using parametric or bootstrap methods.
+    detect_outliers(data: Union[pd.Series, np.ndarray, pd.DataFrame, str, Path],
+                    column: Optional[str] = None, method: Literal['iqr', 'zscore', 'isolation_forest'] = 'iqr',
+        Detects outliers using different methods: 'iqr', 'zscore', or 'isolation_forest'.
+    calculate_effect_size(data: Union[pd.Series, np.ndarray, pd.DataFrame, str, Path] = None,
+        Calculates the effect size between two groups using Cohen's d or Hedges' g.
+    plot_distribution(data: Union[pd.DataFrame, pd.Series, np.ndarray, str, Path],
+                      column: Optional[str] = None, plot_type: Literal['hist', 'kde', 'box', 'violin', 'all'] = 'hist',
+                      bins: int = 30, figsize: Optional[Tuple[int, int]] = None,
+                      save_fig: Optional[bool] = False, filename: Optional[str] = None, **kwargs):
+        Plots the distribution of a variable using various plot types and backends.
+    plot_correlation_matrix(data: Union[pd.DataFrame, str, Path],
+                            filename: Optional[str] = None, **kwargs):
+        Visualizes the correlation matrix using a heatmap.
+    plot_scatter_matrix(data: Union[pd.DataFrame, str, Path],
+                        filename: Optional[str] = None, **kwargs):
+        Creates a scatter matrix (pairplot) for visualizing relationships between variables.
+    plot_distribution_with_ci(data: Union[pd.DataFrame, pd.Series, np.ndarray, str, Path],
+                              column: Optional[str] = None, confidence_level: float = 0.95,
+                              ci_method: str = 'parametric', bins: int = 30,
+                              filename: Optional[str] = None, **kwargs) -> plt.Figure:
+        Plots the distribution of a variable with confidence intervals.
+    get_descriptive_stats(data, column=None) -> dict:
+        Returns a dictionary of descriptive statistics for the given data.
+    help():
+        Displays a complete help guide for the UtilsStats class.
     """
     def __init__(self):
         """Inicializar la clase utilitaria"""
         self._plot_backend = 'seaborn'

{statslibx-0.1.8.dist-info → statslibx-0.2.0.dist-info}/METADATA RENAMED Viewed

@@ -1,7 +1,7 @@
 Metadata-Version: 2.4
 Name: statslibx
-Version: 0.1.8
-Summary: StatsLibx - Librería de estadística descriptiva e inferencial
+Version: 0.2.0
+Summary: StatsLibx - Librería de estadística descriptiva, inferencial y computacional
 Author-email: Emmanuel Ascendra Perez <ascendraemmanuel@gmail.com>
 License: MIT
 Classifier: Development Status :: 3 - Alpha
@@ -28,9 +28,9 @@ Requires-Dist: statsmodels>=0.13; extra == "advanced"
 StatsLibX es un paquete de Python diseñado para proporcionar una solución sencilla, eficiente y flexible para manejar volumenes de datos.
-Este proyecto surge con la idea de ofrecer una alternativa moderna, intuitiva y ligera que permita a desarrolladores y entusiastas integrar la **estadistica descriptiva e inferencial** sin complicaciones, con multiples funcionalidades y utilidades pensadas para el futuro.
+Este proyecto surge con la idea de ofrecer una alternativa moderna, intuitiva y ligera que permita a desarrolladores y entusiastas integrar la **estadistica descriptiva, inferencial y computacional (En desarrollo)** sin complicaciones, con multiples funcionalidades y utilidades pensadas para el futuro.
-GitHub del Proyecto: [text](https://github.com/GhostAnalyst30/StatsLibX)
+GitHub del Proyecto: [https://github.com/GhostAnalyst30/StatsLibX](https://github.com/GhostAnalyst30/StatsLibX)
 ## ✨ Características principales
@@ -55,7 +55,7 @@ stats = DescriptiveStats(data) # InferentialStats(data), UtilsStats()
 stats.summary()
 ```
-Para ver mas funciones: [text](https://github.com/GhostAnalyst30/StatsLibX/blob/main/how_use_statslibx.ipynb)
+Para ver mas funciones: [https://github.com/GhostAnalyst30/StatsLibX/blob/main/how_use_statslibx.ipynb](https://github.com/GhostAnalyst30/StatsLibX/blob/main/how_use_statslibx.ipynb)
 ##  📦 Instalación
 ```bash

statslibx-0.2.0.dist-info/RECORD ADDED Viewed

@@ -0,0 +1,19 @@
+statslibx/__init__.py,sha256=YUKUQhO1vUYvcUQmlz1ZtvU6MWNZERdAG55-trf25ZY,1500
+statslibx/cli.py,sha256=DqXaoP85n9xgLDlFnEkeqj-HJG0_IKX0uSqxRcHbzII,1122
+statslibx/computacional.py,sha256=z46bRUiH9a3ajxVTYE2sGO-pg20L87MdOKM3Y_Tcq44,4062
+statslibx/descriptive.py,sha256=GrUR4QfstUeLTXdxKSZsmKaOJkDso-QH51hlwTUaubA,63513
+statslibx/inferential.py,sha256=xiJCppezhWK4TrAARdOufuxjZcoGKsfHtRujKfuXbgg,83068
+statslibx/io.py,sha256=v7pxpmlEMeKyfXftl3WbkUtC9FOh1pymz7MmKPPNw98,493
+statslibx/utils.py,sha256=gWXduW8LMN1q4ZwNggmodRsT9Rcsot-S82NsQiqrjUo,69992
+statslibx/datasets/__init__.py,sha256=wiSp4qGwpILCiaN5vVuwWgKnbdELpbi5pxnNB9Wg2nI,7282
+statslibx/datasets/course_completion.csv,sha256=jaqyxAh4YCsYuH5OFsjvGV7KUyM_7vQt6LgnqnNAFsI,22422135
+statslibx/datasets/iris.csv,sha256=xSdC5QMVqZ-Vajg_rt91dVUmdfZAnvD5pHB23QhHmTA,3858
+statslibx/datasets/penguins.csv,sha256=4HY2vYr3QmAJnqL4Z44uq7813vV5lAzHb2cGHuFsBsE,13478
+statslibx/datasets/sp500_companies.csv,sha256=WKS72YOGnAbyLR6kD95fOpIYZt5oXGjPryyFVqLRF_k,803820
+statslibx/datasets/titanic.csv,sha256=5seOS8ybyBMBCCWhgKZrsbu06m_OWyKtD9l0YXOImXU,29474
+statslibx/preprocessing/__init__.py,sha256=ZwdwjBodxeOry-umJ__6yUSeubpRlZg41yve366ArkY,7395
+statslibx-0.2.0.dist-info/METADATA,sha256=w7f-3RgizY3PHUSxoBl6YuHImHz2qFyillhZk82WUfE,2993
+statslibx-0.2.0.dist-info/WHEEL,sha256=wUyA8OaulRlbfwMtmQsvNngGrxQHAvkKcvRmdizlJi0,92
+statslibx-0.2.0.dist-info/entry_points.txt,sha256=bkCY7JDWNCZFE3I4sjgJ2oGrUgoBBbCbYmWkBAymT70,49
+statslibx-0.2.0.dist-info/top_level.txt,sha256=eeYZXyFm0hIjuI0ba3wF6XW938Mv9tv7Nk9qgjYfCtU,10
+statslibx-0.2.0.dist-info/RECORD,,

{statslibx-0.1.8.dist-info → statslibx-0.2.0.dist-info}/WHEEL RENAMED Viewed

@@ -1,5 +1,5 @@
 Wheel-Version: 1.0
-Generator: setuptools (80.9.0)
+Generator: setuptools (80.10.2)
 Root-Is-Purelib: true
 Tag: py3-none-any

statslibx/probability.py DELETED Viewed

@@ -1,2 +0,0 @@
-class ProbabilityStats:
-    pass

statslibx-0.1.8.dist-info/RECORD DELETED Viewed

@@ -1,15 +0,0 @@
-statslibx/__init__.py,sha256=KeEoEZVPUR_PZACWoCpS_2l6luPbEee7VRlcrLgbKQQ,1490
-statslibx/cli.py,sha256=DqXaoP85n9xgLDlFnEkeqj-HJG0_IKX0uSqxRcHbzII,1122
-statslibx/computacional.py,sha256=Nv8wk67RUuuv15oBRu2XPp0_k7O4ZgmT51vThH2OuFk,35
-statslibx/descriptive.py,sha256=r5D4reP1Cdzsu1tSLmf2OEaFAkGvHSd3FIYfUclEaRU,60178
-statslibx/inferential.py,sha256=H0R6g3dJFk-53m1bKldrXObgk0SSmpcdqQg_tIgRKBI,79169
-statslibx/io.py,sha256=v7pxpmlEMeKyfXftl3WbkUtC9FOh1pymz7MmKPPNw98,493
-statslibx/probability.py,sha256=MUME4eXWzbdU93F-QdKwmmyd9IgZK1flFUYQHitp10o,33
-statslibx/utils.py,sha256=iJzt0jDacaoUfjtp4dU2PFuIBEheMP9Qrq-HnLTW_Qw,66515
-statslibx/datasets/__init__.py,sha256=GuUl_7-d6YanuDFht1dwB1bFrqjShvKh1m-iRYAbYZE,6875
-statslibx/preprocessing/__init__.py,sha256=ZwdwjBodxeOry-umJ__6yUSeubpRlZg41yve366ArkY,7395
-statslibx-0.1.8.dist-info/METADATA,sha256=uyhAd0xghADIfVee7WzDp76nLA2snjqQcNayio_UrIc,2835
-statslibx-0.1.8.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
-statslibx-0.1.8.dist-info/entry_points.txt,sha256=bkCY7JDWNCZFE3I4sjgJ2oGrUgoBBbCbYmWkBAymT70,49
-statslibx-0.1.8.dist-info/top_level.txt,sha256=eeYZXyFm0hIjuI0ba3wF6XW938Mv9tv7Nk9qgjYfCtU,10
-statslibx-0.1.8.dist-info/RECORD,,

{statslibx-0.1.8.dist-info → statslibx-0.2.0.dist-info}/entry_points.txt RENAMED Viewed

File without changes

{statslibx-0.1.8.dist-info → statslibx-0.2.0.dist-info}/top_level.txt RENAMED Viewed

File without changes

statslibx 0.1.8__py3-none-any.whl → 0.2.0__py3-none-any.whl

statslibx 0.1.8__py3-none-any.whl → 0.2.0__py3-none-any.whl