PyPI - qdesc - Versions diffs - 0.1.2__tar.gz → 0.1.3__tar.gz - Mend

qdesc 0.1.2.tar.gz → 0.1.3.tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of qdesc might be problematic. Click here for more details.

Files changed (11) hide show

{qdesc-0.1.2 → qdesc-0.1.3}/PKG-INFO +1 -1
qdesc-0.1.3/qdesc/__init__.py +52 -0
{qdesc-0.1.2 → qdesc-0.1.3}/qdesc.egg-info/PKG-INFO +1 -1
{qdesc-0.1.2 → qdesc-0.1.3}/qdesc.egg-info/SOURCES.txt +1 -0
qdesc-0.1.3/qdesc.egg-info/top_level.txt +1 -0
{qdesc-0.1.2 → qdesc-0.1.3}/setup.py +1 -1
qdesc-0.1.2/qdesc.egg-info/top_level.txt +0 -1
{qdesc-0.1.2 → qdesc-0.1.3}/LICENCE.txt +0 -0
{qdesc-0.1.2 → qdesc-0.1.3}/README.txt +0 -0
{qdesc-0.1.2 → qdesc-0.1.3}/qdesc.egg-info/dependency_links.txt +0 -0
{qdesc-0.1.2 → qdesc-0.1.3}/setup.cfg +0 -0

{qdesc-0.1.2 → qdesc-0.1.3}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: qdesc
-Version: 0.1.2
+Version: 0.1.3
 Summary: Quick and Easy way to do descriptive analysis.
 Author: Paolo Hilado
 Author-email: datasciencepgh@proton.me

qdesc-0.1.3/qdesc/__init__.py ADDED Viewed

@@ -0,0 +1,52 @@
+def desc(df):
+    """Build a rounded descriptive-statistics table for the columns of ``df``.
+
+    Combines a subset of ``df.describe()`` with a manually computed median
+    absolute deviation (MAD) and the Anderson-Darling test results for every
+    numeric column, concatenated column-wise and rounded to two decimals.
+
+    Args:
+        df: A pandas DataFrame. Only columns matched by
+            ``select_dtypes(include=[np.number])`` receive MAD and
+            Anderson-Darling values.
+
+    Returns:
+        A DataFrame indexed by variable name. Presumably the columns are
+        count, mean, std, median, MAD, min, max, AD_stat, '5% crit_value'
+        and '1% crit_value' when ``describe()`` yields its default numeric
+        layout -- TODO confirm for frames without numeric columns.
+    """
+    # Dependencies are imported at call time rather than at module import.
+    import pandas as pd
+    import numpy as np
+    from scipy.stats import anderson
+    # One row per described variable, rounded to two decimals.
+    x = np.round(df.describe().T,2)
+    # Positional selection; assumes the default describe() column order
+    # (count, mean, std, min, 25%, 50%, 75%, max), giving
+    # count, mean, std, 50%, min, max -- TODO confirm.
+    x = x.iloc[:, [0,1,2,5,3,7]]
+    # NOTE(review): in-place rename on the result of iloc may trigger pandas'
+    # SettingWithCopyWarning -- confirm.
+    x.rename(columns={'50%': 'median'}, inplace=True)
+    mad_values = {}
+    # computes the manual mad which is more robust to outliers and non-normal distributions
+    # NOTE(review): np.median is applied to the raw column, so missing values
+    # presumably propagate as NaN here -- confirm.
+    for column in df.select_dtypes(include=[np.number]):
+        median = np.median(df[column])
+        abs_deviation = np.abs(df[column] - median)
+        mad = np.median(abs_deviation)
+        mad_values[column] = mad
+    # Re-shape the {column: mad} mapping into a one-column frame indexed by
+    # variable name so it can be concatenated with the describe() output.
+    mad_df = pd.DataFrame(list(mad_values.items()), columns=['Variable', 'MAD'])
+    mad_df.set_index('Variable', inplace=True)
+    results = {}
+    # Loop through each column to test only continuous variables (numeric columns)
+    for column in df.select_dtypes(include=[np.number]):  # Only continuous variables
+        # No `dist` argument is passed, so SciPy's default distribution is tested.
+        result = anderson(df[column])
+        statistic = result.statistic
+        critical_values = result.critical_values
+        # Only select the 5% and 1% significance levels
+        selected_critical_values = {
+            '5% crit_value': critical_values[2],  # 5% critical value
+            '1% crit_value': critical_values[4]   # 1% critical value
+        }
+        # Store the results in a dictionary
+        results[column] = {
+            'AD_stat': statistic,
+            **selected_critical_values  # Add critical values for 5% and 1% levels
+        }
+    # Convert the results dictionary into a DataFrame
+    anderson_df = pd.DataFrame.from_dict(results, orient='index')
+    # Split the describe() subset after its fourth column so that MAD is
+    # inserted between the two halves in the final table.
+    xl = x.iloc[:, :4]
+    xr = x.iloc[:, 4:]
+    x_df = np.round(pd.concat([xl, mad_df, xr, anderson_df], axis=1),2)
+    return x_df
+def freqdist(df, column_name):
+    """Return a frequency distribution table for one categorical column.
+
+    Args:
+        df: A pandas DataFrame.
+        column_name: Name of the column to tabulate; its dtype must match
+            'object' or 'category'.
+
+    Returns:
+        A DataFrame with three columns: ``column_name`` (the distinct
+        values), 'Count', and 'Percentage' (count divided by ``len(df)``,
+        times 100).
+
+    Raises:
+        ValueError: If ``column_name`` is not a column of ``df``, or if the
+            column's dtype is neither 'object' nor 'category'.
+    """
+    import pandas as pd
+    if column_name not in df.columns:
+        raise ValueError(f"Column '{column_name}' not found in DataFrame.")
+    if df[column_name].dtype not in ['object', 'category']:
+        raise ValueError(f"Column '{column_name}' is not a categorical column.")
+    # value_counts() yields one row per distinct value; reset_index() turns the
+    # values into a regular column so both columns can be renamed below.
+    freq_dist = df[column_name].value_counts().reset_index()
+    freq_dist.columns = [column_name, 'Count']
+    # NOTE(review): the denominator is the full row count of df; if
+    # value_counts() skips missing values the percentages presumably will not
+    # sum to 100 -- confirm.
+    freq_dist['Percentage'] = (freq_dist['Count'] / len(df)) * 100
+    return freq_dist

{qdesc-0.1.2 → qdesc-0.1.3}/qdesc.egg-info/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: qdesc
-Version: 0.1.2
+Version: 0.1.3
 Summary: Quick and Easy way to do descriptive analysis.
 Author: Paolo Hilado
 Author-email: datasciencepgh@proton.me

{qdesc-0.1.2 → qdesc-0.1.3}/qdesc.egg-info/SOURCES.txt RENAMED Viewed

@@ -1,6 +1,7 @@
 LICENCE.txt
 README.txt
 setup.py
+qdesc/__init__.py
 qdesc.egg-info/PKG-INFO
 qdesc.egg-info/SOURCES.txt
 qdesc.egg-info/dependency_links.txt

qdesc-0.1.3/qdesc.egg-info/top_level.txt ADDED Viewed

@@ -0,0 +1 @@
+qdesc

{qdesc-0.1.2 → qdesc-0.1.3}/setup.py RENAMED Viewed

@@ -7,7 +7,7 @@ long_description = (this_directory / "README.md").read_text()
 setup(
     name='qdesc',
-    version='0.1.2',
+    version='0.1.3',
     packages=find_packages(),
     install_requires=[
         # List your dependencies here, e.g., pandas if your function requires it

qdesc-0.1.2/qdesc.egg-info/top_level.txt DELETED Viewed

@@ -1 +0,0 @@
-

{qdesc-0.1.2 → qdesc-0.1.3}/LICENCE.txt RENAMED Viewed

File without changes

{qdesc-0.1.2 → qdesc-0.1.3}/README.txt RENAMED Viewed

File without changes

{qdesc-0.1.2 → qdesc-0.1.3}/qdesc.egg-info/dependency_links.txt RENAMED Viewed

File without changes

{qdesc-0.1.2 → qdesc-0.1.3}/setup.cfg RENAMED Viewed

File without changes

qdesc 0.1.2__tar.gz → 0.1.3__tar.gz

Potentially problematic release.

qdesc 0.1.2.tar.gz → 0.1.3.tar.gz