PyPI - pidatametrics1 - Versions diffs - 0.3.6__py2.py3-none-any.whl → 0.3.7__py2.py3-none-any.whl - Mend

pidatametrics1 0.3.6__py2.py3-none-any.whl → 0.3.7__py2.py3-none-any.whl

This diff shows the differences between the contents of two publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those versions as they appear in their respective public registries.

Files changed (4)

pidatametrics/exporter.py CHANGED Viewed

@@ -1,12 +1,15 @@
 import csv
-import json
+import re
+import math
 from google.cloud import bigquery
-# Optional imports with error handling
+# Optional imports
 try:
     import pandas as pd
+    from openpyxl.cell.cell import ILLEGAL_CHARACTERS_RE
 except ImportError:
     pd = None
+    ILLEGAL_CHARACTERS_RE = None
 try:
     import gspread
@@ -15,6 +18,17 @@ except ImportError:
     gspread = None
 class PiExporter:
+    @staticmethod
+    def _clean_for_excel(text):
+        """Removes characters that cause Excel to crash/corrupt."""
+        if not isinstance(text, str):
+            return text
+        # Remove illegal control characters (null bytes, etc.)
+        if ILLEGAL_CHARACTERS_RE:
+            return ILLEGAL_CHARACTERS_RE.sub('', text)
+        return text
     @staticmethod
     def to_csv(data, filename):
         if not data:
@@ -33,9 +47,11 @@ class PiExporter:
     @staticmethod
     def to_excel(data, filename):
-        """Exports data to Excel. Requires pandas and openpyxl."""
+        """
+        Exports to Excel with sanitization to prevent 'Corrupted File' errors.
+        """
         if pd is None:
-            print("Error: Pandas not installed. Run: pip install pandas openpyxl")
+            print("Error: Pandas/Openpyxl not installed.")
             return
         if not data:
             print("No data to export.")
@@ -44,58 +60,87 @@ class PiExporter:
         if not filename.endswith('.xlsx'):
             filename += '.xlsx'
+        print(f"Preparing Excel file: {filename} ({len(data)} rows)...")
         try:
+            # 1. Create DataFrame
             df = pd.DataFrame(data)
-            df.to_excel(filename, index=False)
+            # 2. Sanitize Data (Fixes "Excel found a problem with content")
+            # Apply cleaning to all string columns
+            for col in df.select_dtypes(include=['object']).columns:
+                df[col] = df[col].apply(PiExporter._clean_for_excel)
+            # 3. Export
+            df.to_excel(filename, index=False, engine='openpyxl')
             print(f"Successfully saved {len(data)} rows to {filename}")
         except Exception as e:
             print(f"Excel Export Failed: {e}")
     @staticmethod
     def to_google_sheet(data, spreadsheet_name, tab_name="Sheet1"):
-        """
-        Exports to Google Sheet using the Filename (not ID).
-        Uses the active Colab authentication.
-        """
         if gspread is None:
-            print("Error: gspread not installed. Run: pip install gspread google-auth")
+            print("Error: gspread not installed.")
             return
         if not data:
             print("No data to upload.")
             return
-        print(f"Connecting to Google Sheet: '{spreadsheet_name}'...")
+        row_count = len(data)
+        print(f"Preparing Google Sheet upload: {row_count} rows...")
+        # --- WARNING FOR LARGE DATASETS ---
+        if row_count > 50000:
+            print(f"⚠️  WARNING: You are uploading {row_count} rows.")
+            print("   Google Sheets may become slow. Uploading in chunks...")
         try:
-            # 1. Get Default Credentials (works with Colab auth.authenticate_user)
+            # 1. Auth
             creds, _ = google.auth.default()
             client = gspread.authorize(creds)
-            # 2. Open by Name (Title)
+            # 2. Open Sheet
             try:
                 sh = client.open(spreadsheet_name)
             except gspread.SpreadsheetNotFound:
                 print(f"Sheet '{spreadsheet_name}' not found. Creating it...")
                 sh = client.create(spreadsheet_name)
-            # 3. Select or Create Worksheet (Tab)
+            # 3. Setup Tab
             try:
                 worksheet = sh.worksheet(tab_name)
-                worksheet.clear() # Clear old data
+                worksheet.clear()
             except gspread.WorksheetNotFound:
-                worksheet = sh.add_worksheet(title=tab_name, rows=len(data)+100, cols=20)
+                worksheet = sh.add_worksheet(title=tab_name, rows=row_count+100, cols=20)
             # 4. Prepare Data
             headers = list(data[0].keys())
             rows = [[row.get(col, '') for col in headers] for row in data]
-            all_values = [headers] + rows
+            # 5. Upload Headers first
+            worksheet.update([headers], 'A1')
+            # 6. CHUNKED UPLOAD (To prevent timeouts on large data)
+            chunk_size = 5000  # Safe limit for gspread
+            total_chunks = math.ceil(len(rows) / chunk_size)
+            print(f"Starting upload in {total_chunks} chunks...")
+            for i in range(total_chunks):
+                start = i * chunk_size
+                end = start + chunk_size
+                chunk = rows[start:end]
+                # Append rows is safer for large datasets than update range
+                worksheet.append_rows(chunk, value_input_option='RAW')
+                print(f"   - Uploaded chunk {i+1}/{total_chunks} ({len(chunk)} rows)")
-            # 5. Update
-            worksheet.update(all_values)
-            print(f"Successfully uploaded {len(data)} rows to '{spreadsheet_name}' (Tab: {tab_name})")
+            print(f"✅ Successfully uploaded {row_count} rows to '{spreadsheet_name}' (Tab: {tab_name})")
         except Exception as e:
-            print(f"Google Sheet Upload Failed: {e}")
+            print(f"❌ Google Sheet Upload Failed: {e}")
     @staticmethod
     def to_bigquery(data, project_id, dataset_id, table_id):

{pidatametrics1-0.3.6.dist-info → pidatametrics1-0.3.7.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: pidatametrics1
-Version: 0.3.6
+Version: 0.3.7
 Summary: A test wrapper for Pi Datametrics API with CSV and BigQuery support.
 Requires-Dist: google-auth
 Requires-Dist: google-cloud-bigquery

{pidatametrics1-0.3.6.dist-info → pidatametrics1-0.3.7.dist-info}/RECORD RENAMED Viewed

@@ -1,8 +1,8 @@
 pidatametrics/__init__.py,sha256=cmNSHvjvMsYO1tMv0Nf-7LGjIJ8AFXmUIwiv8jQ34BI,137
 pidatametrics/client.py,sha256=tHH0GV0rk2SizVqRdKepjdDQevkfdWlHOJHwsPR2PCk,4399
-pidatametrics/exporter.py,sha256=CcsdVhxI6rXi0zlQaYzFEGX0GL3ZaNV94Pj5r_WrZc4,4226
+pidatametrics/exporter.py,sha256=yLN40kqwibHWs45gXKe_I1j9td9lJt-8LLFSS-Pk9-U,5813
 pidatametrics/manager.py,sha256=tUeeJ-wKAlhpWsaZEAjxtZCtA2EbQcTBB1JkXPEVV50,9101
 pidatametrics/parsers.py,sha256=fiLx3080wNubT1VqSIeDvlrKT85KdqlKhY6FaB2XuC8,5989
-pidatametrics1-0.3.6.dist-info/METADATA,sha256=DOlktdH-uHRwem6nbXWDIn3NLXmw67iENpiiX4f7--o,293
-pidatametrics1-0.3.6.dist-info/WHEEL,sha256=aha0VrrYvgDJ3Xxl3db_g_MDIW-ZexDdrc_m-Hk8YY4,105
-pidatametrics1-0.3.6.dist-info/RECORD,,
+pidatametrics1-0.3.7.dist-info/METADATA,sha256=3rqys7d0-SNpsghd25f3eS99WSl-1QYzTY0HjbAYNak,293
+pidatametrics1-0.3.7.dist-info/WHEEL,sha256=aha0VrrYvgDJ3Xxl3db_g_MDIW-ZexDdrc_m-Hk8YY4,105
+pidatametrics1-0.3.7.dist-info/RECORD,,

{pidatametrics1-0.3.6.dist-info → pidatametrics1-0.3.7.dist-info}/WHEEL RENAMED Viewed

File without changes

pidatametrics1 0.3.6__py2.py3-none-any.whl → 0.3.7__py2.py3-none-any.whl

pidatametrics1 0.3.6__py2.py3-none-any.whl → 0.3.7__py2.py3-none-any.whl