PyPI - qdesc - Versions diffs - 0.1.7.1__py3-none-any.whl → 0.1.8.1__py3-none-any.whl - Mend

qdesc 0.1.7.1__py3-none-any.whl → 0.1.8.1__py3-none-any.whl

This diff compares the contents of two publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between the package versions as they appear in their respective public registries.

Potentially problematic release.

This version of qdesc might be problematic. Click here for more details.

Files changed (7) hide show

qdesc/__init__.py CHANGED Viewed

@@ -106,3 +106,51 @@ def freqdist_to_excel(df, output_path, sort_by='Percentage', ascending=False, to
             used_names.add(sheet_name.lower())
             distribution.to_excel(writer, sheet_name=sheet_name, index=False)
     print(f"Frequency distributions written to {output_path}")
+def normcheck_dashboard(df, significance_level=0.05, figsize=(18, 5)):
+    import pandas as pd
+    import numpy as np
+    import matplotlib.pyplot as plt
+    import seaborn as sns
+    import statsmodels.api as sm
+    from scipy.stats import anderson
+    import math
+    numeric_cols = df.select_dtypes(include=[np.number]).columns
+    if len(numeric_cols) == 0:
+        print("No numeric columns to analyze.")
+        return
+    for col in numeric_cols:
+        data = df[col].dropna()
+        print(f"\n--- Variable: {col} ---")
+        if len(data) < 8:
+            print("Not enough data to perform Anderson-Darling test or meaningful plots.")
+            continue
+        # Anderson-Darling Test
+        test_result = anderson(data, dist='norm')
+        stat = test_result.statistic
+        sig_levels = test_result.significance_level
+        crit_values = test_result.critical_values
+        level_diff = [abs(sl - (significance_level * 100)) for sl in sig_levels]
+        closest_index = level_diff.index(min(level_diff))
+        used_sig = sig_levels[closest_index]
+        crit_val = crit_values[closest_index]
+        decision = "Fail to Reject Null" if stat <= crit_val else "Reject Null"
+        # Print Summary
+        print(f"  Anderson-Darling Statistic : {stat:.4f}")
+        print(f"  Critical Value (@ {used_sig}%) : {crit_val:.4f}")
+        print(f"  Decision : {decision}")
+        # Plots (QQ, Histogram, Boxplot)
+        fig, axes = plt.subplots(1, 3, figsize=figsize)
+        # QQ Plot
+        sm.qqplot(data, line='s', ax=axes[0])
+        axes[0].set_title(f"QQ Plot - {col}")
+        # Histogram (No KDE)
+        sns.histplot(data, bins=30, kde=False, color='gray', alpha=0.3, ax=axes[1])
+        axes[1].set_title(f"Histogram - {col}")
+        # Boxplot
+        sns.boxplot(x=data, ax=axes[2], color='lightblue')
+        axes[2].set_title(f"Boxplot - {col}")
+        axes[2].set_xlabel(col)
+        plt.suptitle(f"Normality Assessment - {col}", fontsize=14, y=1.05)
+        plt.tight_layout()
+        plt.show()

{qdesc-0.1.7.1.dist-info → qdesc-0.1.8.1.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: qdesc
-Version: 0.1.7.1
+Version: 0.1.8.1
 Summary: Quick and Easy way to do descriptive analysis.
 Author: Paolo Hilado
 Author-email: datasciencepgh@proton.me
@@ -53,15 +53,36 @@ Run the function qd.freqdist_to_excel(df, "Name of file.xlsx", ascending = FALSE
 * Counts - the number of observations
 * Percentage - percentage of observations from total.
+## qd.normcheck_dashboard Function
+Run the function qd.normcheck_dashboard(df) to efficiently check each numeric variable for normality of its distribution. It will compute the Anderson-Darling statistic and
+create visualizations (i.e., qq-plot, histogram, and boxplots) for checking whether the distribution is approximately normal.
 Later versions will include data visualizations handy for exploring the distribution of the data set.
 ## Installation
 pip install qdesc
-## Usage - doing descriptive analysis using qdesc
-### import qdesc as qd
-### qd.desc(df)
+## Sample use of qdesc functions
+# Creating a sample dataframe
+import pandas as pd
+import numpy as np
+# Set seed for reproducibility
+np.random.seed(21)
+# Create two continuous variables
+var1 = np.random.normal(loc=0, scale=1, size=1000)     # Normal distribution
+var2 = np.random.uniform(low=10, high=50, size=1000)   # Uniform distribution
+# Create DataFrame
+df = pd.DataFrame({
+    'Normal_Variable': var1,
+    'Uniform_Variable': var2
+})
+# Using the qdesc function
+import qdesc as qd
+qd.desc(df)
 ## License
 This project is licensed under the GPL-3 License. See the LICENSE file for more details.

qdesc-0.1.8.1.dist-info/RECORD ADDED Viewed

@@ -0,0 +1,6 @@
+qdesc/__init__.py,sha256=YtYahB-neaYOG3DvVXweSuFExqVZFNR0lAivaPp9_SA,6599
+qdesc-0.1.8.1.dist-info/LICENCE.txt,sha256=xdFo-Rt6I7EP7C_qrVeIBIcH_7mRGUh8sciJs2R8VmY,9684
+qdesc-0.1.8.1.dist-info/METADATA,sha256=qXseXkIM1Ynrx9kralmBs9B1jtpnwb8-kHUKVMLjk9Y,4552
+qdesc-0.1.8.1.dist-info/WHEEL,sha256=2wepM1nk4DS4eFpYrW1TTqPcoGNfHhhO_i5m4cOimbo,92
+qdesc-0.1.8.1.dist-info/top_level.txt,sha256=JuSs1wWRGN77DVuq-SX-5P7m_mIZF0ikEVgPTBOrHb0,6
+qdesc-0.1.8.1.dist-info/RECORD,,

qdesc-0.1.7.1.dist-info/RECORD DELETED Viewed

@@ -1,6 +0,0 @@
-qdesc/__init__.py,sha256=eT5JOnELIhQy3K453z3r22_xmf47uW1AOlUiWlSWgSM,4513
-qdesc-0.1.7.1.dist-info/LICENCE.txt,sha256=xdFo-Rt6I7EP7C_qrVeIBIcH_7mRGUh8sciJs2R8VmY,9684
-qdesc-0.1.7.1.dist-info/METADATA,sha256=OScoZdD8due5ilEz-waSAdaHcYqeLHDOQquLGRzMfAs,3782
-qdesc-0.1.7.1.dist-info/WHEEL,sha256=2wepM1nk4DS4eFpYrW1TTqPcoGNfHhhO_i5m4cOimbo,92
-qdesc-0.1.7.1.dist-info/top_level.txt,sha256=JuSs1wWRGN77DVuq-SX-5P7m_mIZF0ikEVgPTBOrHb0,6
-qdesc-0.1.7.1.dist-info/RECORD,,

{qdesc-0.1.7.1.dist-info → qdesc-0.1.8.1.dist-info}/LICENCE.txt RENAMED Viewed

File without changes

{qdesc-0.1.7.1.dist-info → qdesc-0.1.8.1.dist-info}/WHEEL RENAMED Viewed

File without changes

{qdesc-0.1.7.1.dist-info → qdesc-0.1.8.1.dist-info}/top_level.txt RENAMED Viewed

File without changes

qdesc 0.1.7.1__py3-none-any.whl → 0.1.8.1__py3-none-any.whl

Potentially problematic release.

qdesc 0.1.7.1__py3-none-any.whl → 0.1.8.1__py3-none-any.whl