statslibx 0.2.0__tar.gz → 0.2.1__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (26)
  1. {statslibx-0.2.0/statslibx.egg-info → statslibx-0.2.1}/PKG-INFO +1 -2
  2. {statslibx-0.2.0 → statslibx-0.2.1}/pyproject.toml +2 -3
  3. {statslibx-0.2.0 → statslibx-0.2.1}/statslibx/__init__.py +2 -2
  4. {statslibx-0.2.0 → statslibx-0.2.1}/statslibx/datasets/__init__.py +4 -3
  5. {statslibx-0.2.0 → statslibx-0.2.1}/statslibx/descriptive.py +10 -63
  6. {statslibx-0.2.0 → statslibx-0.2.1}/statslibx/inferential.py +7 -49
  7. {statslibx-0.2.0 → statslibx-0.2.1/statslibx.egg-info}/PKG-INFO +1 -2
  8. {statslibx-0.2.0 → statslibx-0.2.1}/statslibx.egg-info/SOURCES.txt +2 -1
  9. {statslibx-0.2.0 → statslibx-0.2.1}/statslibx.egg-info/requires.txt +0 -1
  10. {statslibx-0.2.0 → statslibx-0.2.1}/statslibx.egg-info/top_level.txt +1 -0
  11. statslibx-0.2.1/tests/test1.py +14 -0
  12. {statslibx-0.2.0 → statslibx-0.2.1}/MANIFEST.in +0 -0
  13. {statslibx-0.2.0 → statslibx-0.2.1}/README.md +0 -0
  14. {statslibx-0.2.0 → statslibx-0.2.1}/setup.cfg +0 -0
  15. {statslibx-0.2.0 → statslibx-0.2.1}/statslibx/cli.py +0 -0
  16. {statslibx-0.2.0 → statslibx-0.2.1}/statslibx/computacional.py +0 -0
  17. {statslibx-0.2.0 → statslibx-0.2.1}/statslibx/datasets/course_completion.csv +0 -0
  18. {statslibx-0.2.0 → statslibx-0.2.1}/statslibx/datasets/iris.csv +0 -0
  19. {statslibx-0.2.0 → statslibx-0.2.1}/statslibx/datasets/penguins.csv +0 -0
  20. {statslibx-0.2.0 → statslibx-0.2.1}/statslibx/datasets/sp500_companies.csv +0 -0
  21. {statslibx-0.2.0 → statslibx-0.2.1}/statslibx/datasets/titanic.csv +0 -0
  22. {statslibx-0.2.0 → statslibx-0.2.1}/statslibx/io.py +0 -0
  23. {statslibx-0.2.0 → statslibx-0.2.1}/statslibx/preprocessing/__init__.py +0 -0
  24. {statslibx-0.2.0 → statslibx-0.2.1}/statslibx/utils.py +0 -0
  25. {statslibx-0.2.0 → statslibx-0.2.1}/statslibx.egg-info/dependency_links.txt +0 -0
  26. {statslibx-0.2.0 → statslibx-0.2.1}/statslibx.egg-info/entry_points.txt +0 -0
{statslibx-0.2.0/statslibx.egg-info → statslibx-0.2.1}/PKG-INFO
@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: statslibx
-Version: 0.2.0
+Version: 0.2.1
 Summary: StatsLibx - Librería de estadística descriptiva, inferencial y computacional
 Author-email: Emmanuel Ascendra Perez <ascendraemmanuel@gmail.com>
 License: MIT
@@ -16,7 +16,6 @@ Classifier: Programming Language :: Python :: 3.12
 Requires-Python: >=3.8
 Description-Content-Type: text/markdown
 Requires-Dist: pandas>=1.5
-Requires-Dist: polars>=0.20
 Provides-Extra: viz
 Requires-Dist: seaborn>=0.11; extra == "viz"
 Requires-Dist: plotly>=5.0; extra == "viz"
{statslibx-0.2.0 → statslibx-0.2.1}/pyproject.toml
@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
 
 [project]
 name = "statslibx"
-version = "0.2.0"
+version = "0.2.1"
 description = "StatsLibx - Librería de estadística descriptiva, inferencial y computacional"
 readme = "README.md"
 requires-python = ">=3.8"
@@ -27,8 +27,7 @@ classifiers = [
 ]
 
 dependencies = [
-    "pandas>=1.5",
-    "polars>=0.20"
+    "pandas>=1.5"
 ]
 
 [project.optional-dependencies]
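Note that polars>=0.20 is dropped from the required dependencies here, while descriptive.py further down still imports polars at module level and load_dataset still exposes backend="polars". So importing statslibx 0.2.1 in an environment without polars will likely fail at import time, and users who relied on the implicit dependency now have to install polars themselves. A minimal caller-side pre-flight check, offered as a sketch rather than anything the package itself provides:

# Hypothetical pre-flight check: polars is no longer installed automatically with
# statslibx 0.2.1, but the library's modules still import it, so verify it is present.
try:
    import polars  # noqa: F401  (only checking availability)
except ImportError as exc:
    raise SystemExit(
        "polars is not pulled in by `pip install statslibx` anymore; install it manually"
    ) from exc

import statslibx
print(statslibx.__version__)  # expected: "0.2.1"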
{statslibx-0.2.0 → statslibx-0.2.1}/statslibx/__init__.py
@@ -1,10 +1,10 @@
 """
 StatsLibx - Librería de Estadística para Python
 Autor: Emmanuel Ascendra
-Versión: 0.2.0
+Versión: 0.2.1
 """
 
-__version__ = "0.2.0"
+__version__ = "0.2.1"
 __author__ = "Emmanuel Ascendra"
 
 # Importar las clases principales
{statslibx-0.2.0 → statslibx-0.2.1}/statslibx/datasets/__init__.py
@@ -61,8 +61,9 @@ def load_dataset(
     name: str,
     backend: Literal["pandas", "polars"] = "pandas",
     return_X_y: Optional[Tuple[List[str], str]] = None,
+    sep: str = ",",
     save: Optional[bool] = False,
-    filename: Optional[str] = None
+    filename: Optional[str] = None,
 ) -> Union[pd.DataFrame, pl.DataFrame, Tuple[NDArray, NDArray]]:
     """
     Carga un dataset interno del paquete.
@@ -101,7 +102,7 @@ def load_dataset(
     data_bytes = pkgutil.get_data("statslibx.datasets", name)
     if data_bytes is not None:
         df = (
-            pd.read_csv(io.BytesIO(data_bytes))
+            pd.read_csv(io.BytesIO(data_bytes), sep=sep)
             if backend == "pandas"
             else pl.read_csv(io.BytesIO(data_bytes))
         )
@@ -112,7 +113,7 @@ def load_dataset(
     if df is None:
         try:
             df = (
-                pd.read_csv(name)
+                pd.read_csv(name, sep=sep)
                 if backend == "pandas"
                 else pl.read_csv(name)
            )
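The new sep argument shown above is forwarded to pd.read_csv both for bundled datasets and for the file-path fallback (the polars branch does not receive it in this diff). A short usage sketch, assuming default arguments return the loaded DataFrame; iris.csv ships with the package, while the semicolon-delimited path is made up for illustration:

from statslibx import load_dataset

# Bundled dataset: the default sep="," is passed through to pd.read_csv.
iris = load_dataset("iris.csv")

# File-path fallback: a local, semicolon-delimited CSV (hypothetical path).
bank = load_dataset("data/bank.csv", sep=";")
print(bank.head())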
{statslibx-0.2.0 → statslibx-0.2.1}/statslibx/descriptive.py
@@ -3,7 +3,6 @@ import pandas as pd
 import polars as pl
 from typing import Optional, Union, Literal, List
 from datetime import datetime
-import flet as ft
 import os
 import matplotlib.pyplot as plt
 import seaborn as sns
@@ -81,10 +80,6 @@ class DescriptiveStats:
     """
 
     def __init__(self, data: Union[pd.DataFrame, np.ndarray],
-                 sep: str = None,
-                 decimal: str = None,
-                 thousand: str = None,
-                 backend: Literal['pandas', 'polars'] = 'pandas',
                  lang: Literal['es-ES', 'en-US'] = 'es-ES'):
        """
        # Initialize DataFrame
@@ -92,9 +87,6 @@ class DescriptiveStats:
        ## **Parameters:**
 
        - **data** : Data to analyze
-        - **sep** : Column separator
-        - **decimal** : Decimal separator
-        - **thousand** : Thousand separator
        - **backend** : 'pandas' or 'polars' for processing
          (Proximamente estara habilitado polars para big data)
 
@@ -104,72 +96,26 @@ class DescriptiveStats:
        stats = DescriptiveStats(data)
        ``
        """
-
-        if isinstance(data, str) and os.path.exists(data):
-            data = DescriptiveStats.from_file(data).data
-
-        if isinstance(data, pl.DataFrame):
+        if isinstance(data, pd.DataFrame):
+            self.data = data
+        elif isinstance(data, np.ndarray):
+            self.data = pd.DataFrame(data)
+        else:
            raise TypeError(
-                "Polars aún no soportado. Use pandas.DataFrame."
+                "Data must be a pandas.DataFrame or numpy.ndarray."
            )
 
-
        if isinstance(data, np.ndarray):
            if data.ndim == 1:
                data = pd.DataFrame({'var': data})
            else:
-                data = pd.DataFrame(data, columns=[f'var_{i}' for i in range(data.shape[1])]) \
+                data = pd.DataFrame(data, columns=[f'var_{i}' for i in range(data.shape[1])],
+                                    sep=self.sep) \
                    if isinstance(data, pd.DataFrame) else pl.DataFrame(data, )
-
-        self.data = data
-        self.backend = backend
+
        self._numeric_cols = data.select_dtypes(include=[np.number]).columns.tolist()
-        self.sep = sep
-        self.decimal = decimal
-        self.thousand = thousand
        self.lang = lang
-
-    @classmethod
-    def from_file(self, path: str):
-        """
-        Carga automática de archivos y devuelve instancia de Intelligence.
-        Soporta CSV, Excel, TXT, JSON, Parquet, Feather, TSV.
-        Automatic file upload and returns Intelligence instance.
-        Supports CSV, Excel, TXT, JSON, Parquet, Feather, TSV.
-
-        Parametros / Parameters:
-        ------------------------
-        path : str
-            Ruta del archivo
-            File path
-        """
-        if not os.path.exists(path):
-            raise FileNotFoundError(f"Archivo no encontrado / File not found: {path}")
-
-        ext = os.path.splitext(path)[1].lower()
-
-        if ext == ".csv":
-            df = pd.read_csv(path, sep=self.sep, decimal=self.decimal, thousand=self.thousand)
-
-        elif ext in [".xlsx", ".xls"]:
-            df = pd.read_excel(path, decimal=self.decimal, thousand=self.thousand)
-
-        elif ext in [".txt", ".tsv"]:
-            df = pd.read_table(path, sep=self.sep, decimal=self.decimal, thousand=self.thousand)
-
-        elif ext == ".json":
-            df = pd.read_json(path)
 
-        elif ext == ".parquet":
-            df = pd.read_parquet(path)
-
-        elif ext == ".feather":
-            df = pd.read_feather(path)
-
-        else:
-            raise ValueError(f"Formato no soportado / Unsupported format: {ext}")
-
-        return DescriptiveStats(df)
 
    # ============= MÉTODOS UNIVARIADOS =============
 
@@ -1262,3 +1208,4 @@ class LinearRegressionResult:
        plt.ylabel("Residuos")
        plt.title("Residuos vs Predicciones")
        plt.show()
+
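With from_file and the backend/sep/decimal/thousand parameters removed, DescriptiveStats now expects a pandas DataFrame or a NumPy array and raises TypeError for anything else, including file paths. A minimal sketch of that 0.2.1 constructor contract, with made-up column values:

import numpy as np
import pandas as pd
from statslibx import DescriptiveStats

df = pd.DataFrame({"age": [23, 31, 27], "income": [1200.0, 1540.5, 980.0]})
stats = DescriptiveStats(df)                       # DataFrame is stored as-is
print(stats.data.shape)

vec = DescriptiveStats(np.array([1.0, 2.0, 3.0]))  # 1-D array is wrapped in a DataFrame
print(vec.data.shape)

try:
    DescriptiveStats("data.csv")                   # paths are no longer accepted
except TypeError as exc:
    print(exc)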
{statslibx-0.2.0 → statslibx-0.2.1}/statslibx/inferential.py
@@ -69,8 +69,6 @@ class InferentialStats:
     """
 
     def __init__(self, data: Union[pd.DataFrame, np.ndarray],
-                 backend: Literal['pandas', 'polars'] = 'pandas',
-                 sep: str = None, decimal: str = None, thousand: str = None,
                  lang: Literal['es-ES', 'en-US'] = 'es-ES'):
        """
        Initialize DataFrame
@@ -79,17 +77,16 @@ class InferentialStats:
        -----------
        data : DataFrame o ndarray
            Data to analyze
-        backend : str
-            'pandas' or 'polars' for processing
        """
 
-        if isinstance(data, str) and os.path.exists(data):
-            data = InferentialStats.from_file(data).data
-
-        if isinstance(data, pl.DataFrame):
+        if isinstance(data, pd.DataFrame):
+            self.data = data
+        elif isinstance(data, np.ndarray):
+            self.data = pd.DataFrame(data)
+        else:
            raise TypeError(
-                "Polars aún no soportado. Use pandas.DataFrame."
-            )
+                "Data must be a pandas.DataFrame or numpy.ndarray."
+            )
 
        if isinstance(data, np.ndarray):
            if data.ndim == 1:
@@ -98,48 +95,9 @@ class InferentialStats:
                data = pd.DataFrame(data, columns=[f'var_{i}' for i in range(data.shape[1])])
 
        self.data = data
-        self.backend = backend
        self._numeric_cols = data.select_dtypes(include=[np.number]).columns.tolist()
-        self.sep = sep
-        self.decimal = decimal
-        self.thousand = thousand
        self.lang = lang
 
-    @classmethod
-    def from_file(path: str):
-        """
-        Carga automática de archivos y devuelve instancia de Intelligence.
-        Soporta CSV, Excel, TXT, JSON, Parquet, Feather, TSV.
-        """
-
-        if not os.path.exists(path):
-            raise FileNotFoundError(f"Archivo no encontrado / File not found: {path}")
-
-        ext = os.path.splitext(path)[1].lower()
-
-        if ext == ".csv":
-            df = pd.read_csv(path, sep=self.sep, decimal=self.decimal, thousand=self.thousand)
-
-        elif ext in [".xlsx", ".xls"]:
-            df = pd.read_excel(path, decimal=self.decimal, thousand=self.thousand)
-
-        elif ext in [".txt", ".tsv"]:
-            df = pd.read_table(path, sep=self.sep, decimal=self.decimal, thousand=self.thousand)
-
-        elif ext == ".json":
-            df = pd.read_json(path)
-
-        elif ext == ".parquet":
-            df = pd.read_parquet(path)
-
-        elif ext == ".feather":
-            df = pd.read_feather(path)
-
-        else:
-            raise ValueError(f"Formato no soportado: {ext}")
-
-        return InferentialStats(df)
-
    # ============= INTERVALOS DE CONFIANZA =============
 
    def confidence_interval(self, column: str, confidence: float = 0.95,
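InferentialStats gets the same simplification: the constructor now takes only the data and lang, and its from_file helper is gone. A short sketch with synthetic data; confidence_interval is taken from the signature visible in the context above, and its exact return value is not shown in this diff, so it is simply printed:

import numpy as np
import pandas as pd
from statslibx import InferentialStats

rng = np.random.default_rng(0)
df = pd.DataFrame({"height": rng.normal(170, 8, size=100)})

infer = InferentialStats(df, lang="en-US")
print(infer.data.describe())

# confidence_interval(column, confidence=...) appears in the unchanged context above.
print(infer.confidence_interval("height", confidence=0.95))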
{statslibx-0.2.0 → statslibx-0.2.1/statslibx.egg-info}/PKG-INFO
@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: statslibx
-Version: 0.2.0
+Version: 0.2.1
 Summary: StatsLibx - Librería de estadística descriptiva, inferencial y computacional
 Author-email: Emmanuel Ascendra Perez <ascendraemmanuel@gmail.com>
 License: MIT
@@ -16,7 +16,6 @@ Classifier: Programming Language :: Python :: 3.12
 Requires-Python: >=3.8
 Description-Content-Type: text/markdown
 Requires-Dist: pandas>=1.5
-Requires-Dist: polars>=0.20
 Provides-Extra: viz
 Requires-Dist: seaborn>=0.11; extra == "viz"
 Requires-Dist: plotly>=5.0; extra == "viz"
{statslibx-0.2.0 → statslibx-0.2.1}/statslibx.egg-info/SOURCES.txt
@@ -20,4 +20,5 @@ statslibx/datasets/iris.csv
 statslibx/datasets/penguins.csv
 statslibx/datasets/sp500_companies.csv
 statslibx/datasets/titanic.csv
-statslibx/preprocessing/__init__.py
+statslibx/preprocessing/__init__.py
+tests/test1.py
{statslibx-0.2.0 → statslibx-0.2.1}/statslibx.egg-info/requires.txt
@@ -1,5 +1,4 @@
 pandas>=1.5
-polars>=0.20
 
 [advanced]
 scikit-learn>=1.0
{statslibx-0.2.0 → statslibx-0.2.1}/statslibx.egg-info/top_level.txt
@@ -1,3 +1,4 @@
 dist
 figures
 statslibx
+tests
statslibx-0.2.1/tests/test1.py
@@ -0,0 +1,14 @@
+from statslibx import load_dataset, DescriptiveStats, InferentialStats
+import pandas as pd
+# df = pd.read_csv(r"tests\bank (1).csv", sep=";")
+
+df = load_dataset(r"tests\bank (1).csv", sep=";")
+stats = DescriptiveStats(df)
+print(stats.data)
+
+infer = InferentialStats(df)
+print(infer.data)
+
+
+
+
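The new tests/test1.py reads a local tests\bank (1).csv that is not part of the sdist, so it only runs where that file exists. A pytest-style counterpart against a bundled dataset could look like the sketch below; it is not part of the package and assumes load_dataset accepts the bundled file name "iris.csv" as-is and returns a DataFrame with default arguments:

# Hypothetical pytest variant of tests/test1.py using a dataset shipped with the package.
import pandas as pd
from statslibx import load_dataset, DescriptiveStats, InferentialStats


def test_load_and_wrap_bundled_dataset():
    df = load_dataset("iris.csv")          # bundled, comma-separated CSV
    assert isinstance(df, pd.DataFrame)
    assert not df.empty

    stats = DescriptiveStats(df)
    infer = InferentialStats(df)
    assert stats.data.shape == df.shape
    assert infer.data.shape == df.shape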