ml-dash 0.0.17__py3-none-any.whl → 0.4.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (56)
  1. ml_dash/ARCHITECTURE.md +382 -0
  2. ml_dash/__init__.py +14 -1
  3. ml_dash/autolog.py +32 -0
  4. ml_dash/backends/__init__.py +11 -0
  5. ml_dash/backends/base.py +124 -0
  6. ml_dash/backends/dash_backend.py +571 -0
  7. ml_dash/backends/local_backend.py +90 -0
  8. ml_dash/components/__init__.py +13 -0
  9. ml_dash/components/files.py +246 -0
  10. ml_dash/components/logs.py +104 -0
  11. ml_dash/components/metrics.py +169 -0
  12. ml_dash/components/parameters.py +144 -0
  13. ml_dash/job_logger.py +42 -0
  14. ml_dash/ml_logger.py +234 -0
  15. ml_dash/run.py +331 -0
  16. ml_dash-0.4.0.dist-info/METADATA +1424 -0
  17. ml_dash-0.4.0.dist-info/RECORD +19 -0
  18. ml_dash-0.4.0.dist-info/WHEEL +4 -0
  19. ml_dash-0.4.0.dist-info/entry_points.txt +3 -0
  20. app-build/asset-manifest.json +0 -15
  21. app-build/favicon.ico +0 -0
  22. app-build/github-markdown.css +0 -957
  23. app-build/index.html +0 -1
  24. app-build/manifest.json +0 -15
  25. app-build/monaco-editor-worker-loader-proxy.js +0 -6
  26. app-build/precache-manifest.ffc09f8a591c529a1bd5c6f21f49815f.js +0 -26
  27. app-build/service-worker.js +0 -34
  28. ml_dash/app.py +0 -60
  29. ml_dash/config.py +0 -16
  30. ml_dash/example.py +0 -0
  31. ml_dash/file_events.py +0 -71
  32. ml_dash/file_handlers.py +0 -141
  33. ml_dash/file_utils.py +0 -5
  34. ml_dash/file_watcher.py +0 -30
  35. ml_dash/main.py +0 -60
  36. ml_dash/mime_types.py +0 -20
  37. ml_dash/schema/__init__.py +0 -110
  38. ml_dash/schema/archive.py +0 -165
  39. ml_dash/schema/directories.py +0 -59
  40. ml_dash/schema/experiments.py +0 -65
  41. ml_dash/schema/files/__init__.py +0 -204
  42. ml_dash/schema/files/file_helpers.py +0 -79
  43. ml_dash/schema/files/images.py +0 -27
  44. ml_dash/schema/files/metrics.py +0 -64
  45. ml_dash/schema/files/parameters.py +0 -50
  46. ml_dash/schema/files/series.py +0 -235
  47. ml_dash/schema/files/videos.py +0 -27
  48. ml_dash/schema/helpers.py +0 -66
  49. ml_dash/schema/projects.py +0 -65
  50. ml_dash/schema/schema_helpers.py +0 -19
  51. ml_dash/schema/users.py +0 -33
  52. ml_dash/sse.py +0 -18
  53. ml_dash-0.0.17.dist-info/METADATA +0 -67
  54. ml_dash-0.0.17.dist-info/RECORD +0 -38
  55. ml_dash-0.0.17.dist-info/WHEEL +0 -5
  56. ml_dash-0.0.17.dist-info/top_level.txt +0 -2
ml_dash/ARCHITECTURE.md ADDED
@@ -0,0 +1,382 @@
+ # ML-Logger Architecture
+
+ ## Class Hierarchy and Composition
+
+ <details open>
+ <summary><strong>🏗️ System Overview</strong></summary>
+
+ ```
+ ML-Logger System
+
+ ├── Storage Backends (existing implementations removed pending redesign;
+ │   local, s3, gcp, and ml_dash added as empty files, plus an empty base class)
+ ├── Logger Components (file and data types)
+ ├── ML_Logger (Main Interface)
+ └── Supporting and Utility Classes
+ ```
+
+ </details>
+
+ <details>
+ <summary><strong>💾 Storage Backends</strong> (Where to store)</summary>
+
+ ```
+ Storage Backends
+
+ ├── StorageBackend (Abstract Base)
+ │   ├── exists()
+ │   ├── write_bytes()
+ │   ├── read_bytes()
+ │   ├── write_text()
+ │   ├── read_text()
+ │   ├── append_text()
+ │   ├── list_dir()
+ │   └── get_url()
+
+ ├── LocalBackend(StorageBackend)
+ │   └── Implements file system operations
+
+ ├── S3Backend(StorageBackend)
+ │   └── Implements AWS S3 operations
+
+ └── GCPBackend(StorageBackend)
+     └── Implements Google Cloud Storage operations
+ ```
+
+ </details>
+
+ <details>
+ <summary><strong>📝 Logger Components</strong> (What to log)</summary>
+
+ ```
+ Experiment
+
+ ├── logs: TextLogger
+ │   ├── log(level, message)
+ │   ├── error(message)
+ │   ├── warning(message)
+ │   ├── info(message)
+ │   └── debug(message)
+
+ ├── metrics: ScalarLogger (accessed via experiment.metrics)
+ │   ├── log(step, **metrics) - Log metrics immediately
+ │   ├── collect(step, **metrics) - Collect for later aggregation
+ │   ├── flush(_aggregation, step) - Aggregate and log collected metrics
+ │   ├── get_summary(name, frequency)
+ │   ├── __call__(namespace) - Return namespaced logger
+ │   └── Uses: ScalarCache, Series
+
+ ├── files: ArtifactLogger (accessed via experiment.files)
+ │   ├── save(data, filename) - Save generic data
+ │   ├── save_pkl(data, filename) - Save pickle data
+ │   ├── save_image(name, image) - Save image
+ │   ├── save_video(name, video, fps) - Save video
+ │   ├── save_audio(name, audio) - Save audio
+ │   ├── savefig(fig, filename) - Save matplotlib figure
+ │   ├── load_torch(filename) - Load PyTorch data
+ │   ├── make_video(pattern, output, fps, codec, quality, sort) - Create video from frames
+ │   ├── __call__(namespace) - Return namespaced logger
+ │   └── File management and artifact storage
+
+ ├── params: ParameterIndex
+ │   ├── set(params) - Set/overwrite parameters
+ │   ├── extend(params) - Merge with existing parameters
+ │   ├── update(key, value) - Update single parameter
+ │   ├── read() - Read all parameters
+ │   └── Manages experiment configuration
+
+ └── charts: ChartBuilder  # PLANNING PHASE, subject to change
+     ├── line_chart(query)
+     ├── scatter_plot(query)
+     ├── bar_chart(query)
+     └── video/images(query)
+ ```
+
+ </details>
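+
+ A minimal sketch of how the `ParameterIndex` methods above compose, assuming the
+ signatures listed in the tree (the values are illustrative):
+
+ ```python
+ experiment.params.set(lr=0.001, batch_size=32)   # overwrite all parameters
+ experiment.params.extend({"optimizer": "adam"})  # merge into existing parameters
+ experiment.params.update("lr", 0.0005)           # update a single key
+ config = experiment.params.read()                # read everything back
+ ```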
+
+ <details>
+ <summary><strong>🎯 Composite Logger</strong> (Main Interface)</summary>
+
+ ```
+ MLLogger
+ ├── __init__(backend: StorageBackend)
+ ├── params: ParameterIndex - Parameter management
+ ├── metrics: ScalarLogger - Metrics logging
+ ├── readme: MarkdownLogger - Rich text logging (PLANNING PHASE)
+ ├── files: ArtifactLogger - File and artifact management
+ ├── logs: TextLogger - Text logging
+
+ ├── Convenience Methods (could simply live under logs):
+ │   ├── error() -> logs.error()
+ │   ├── warning() -> logs.warning()
+ │   ├── info() -> logs.info()
+ │   └── debug() -> logs.debug()
+
+ └── Context Managers:
+     ├── experiment(name)
+     └── run(id)
+ ```
+
+ </details>
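+
+ A minimal sketch of how the composite logger is wired together, assuming the
+ `__init__(backend)` signature and the context managers shown above (the
+ `LocalBackend` constructor argument is an assumption):
+
+ ```python
+ from ml_dash import ML_Logger
+ from ml_dash.backends import LocalBackend
+
+ logger = ML_Logger(backend=LocalBackend("./runs"))  # backend path is illustrative
+
+ with logger.experiment("mnist"):       # experiment(name) context manager
+     with logger.run("baseline-001"):   # run(id) context manager
+         logger.params.set(lr=0.001)
+         logger.metrics.log(step=0, loss=0.9)
+         logger.info("run started")     # convenience method -> logs.info()
+ ```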
+
+ <details>
+ <summary><strong>⚙️ Supporting Classes</strong></summary>
+
+ ```
+ Supporting Classes
+
+ └── Serialization (serdes/) (NOT USED)
+     ├── serialize()
+     ├── deserialize()
+     └── Type registry with $t, $s keys
+ ```
+
+ </details>
+
+ ## Usage Examples
+
+ <details>
+ <summary><strong>📊 Logging Different Data Types</strong></summary>
+
+ ```python
+ # Text logging (errors, warnings, info)
+ experiment.logs.error("Training failed")
+ experiment.logs.warning("Low GPU memory")
+ experiment.logs.info("Starting epoch 1")
+
+ # Parameter logging
+ experiment.params.set(learning_rate=0.001, batch_size=32)
+
+ # Metrics logging
+ experiment.metrics.log(step=100, loss=0.523, accuracy=0.95)
+
+ # Collect metrics for aggregation
+ experiment.metrics.collect(step=101, loss=0.521)
+ experiment.metrics.flush(_aggregation="mean", step=100)
+
+ # Namespaced metrics
+ experiment.metrics("train").log(step=100, loss=0.5)
+ experiment.metrics("val").log(step=100, accuracy=0.95)
+
+ # File operations
+ experiment.files.save_image("confusion_matrix", image_array)
+ experiment.files.save(model_state, "checkpoint.pt")
+ experiment.files("checkpoints").save(model_state, "model_epoch_10.pt")
+ ```
+
+ </details>
+
+ <details>
+ <summary><strong>🎛️ Direct Component Access</strong></summary>
+
+ ```python
+ # Access components directly for advanced usage
+ experiment.logs.error("Direct text logging")
+ experiment.metrics.log(step=50, lr=0.001)
+ experiment.files.save_video("training_progress", video_array, fps=30)
+
+ # Namespaced file operations
+ experiment.files("videos").save_video("training_progress", video_array, fps=30)
+ experiment.files("checkpoints").save(model_state, "model.pt")
+
+ # Get statistics
+ stats = experiment.metrics.get_stats("loss")
+ percentile_95 = experiment.metrics.get_percentile("loss", 95)
+ ```
+
+ </details>
+
+ ## File Organization
+
+ <details>
+ <summary><strong>📁 Project Structure</strong></summary>
+
+ ```
+ ml-logger/
+ ├── src/ml_logger/
+ │   ├── __init__.py
+ │   ├── experiment.py        # Main MLLogger class
+ │   │
+ │   ├── backends/
+ │   │   ├── __init__.py
+ │   │   ├── base.py          # StorageBackend ABC
+ │   │   ├── local.py         # LocalBackend
+ │   │   ├── s3.py            # S3Backend
+ │   │   └── gcp.py           # GCPBackend
+ │   │
+ │   ├── loggers/
+ │   │   ├── __init__.py
+ │   │   ├── text.py          # TextLogger
+ │   │   ├── scalar.py        # ScalarLogger
+ │   │   └── artifact.py      # ArtifactLogger
+ │   │
+ │   ├── scalar_cache.py      # ScalarCache, Series, RollingStats
+ │   │
+ │   └── serdes/
+ │       ├── __init__.py
+ │       └── ndjson.py        # Serialization with $t, $s
+
+ └── tests/
+     ├── test_backends.py
+     ├── test_loggers.py
+     ├── test_scalar_cache.py
+     └── test_integration.py
+ ```
+
+ </details>
+
+ ## Advanced Features
+
+ <details>
+ <summary><strong>📈 Statistical Features</strong></summary>
+
+ ### Rolling Statistics
+ - **Window-based metrics**: Configurable window size for recent data
+ - **Automatic calculation**: Mean, variance, std, min, max
+ - **Percentiles**: p0, p1, p5, p10, p20, p25, p40, p50, p60, p75, p80, p90, p95, p99, p100
+
+ ### Summary Frequencies
+ Automatic summaries at: 1, 5, 10, 15, 20, 25, 30, 40, 50, 75, 80, 100, 120, 150, 200, 250, 300, 400, 500, 600, 1000, 1200, 1500, 2000, 2500, ...
+
+ ```python
+ # Access statistics
+ stats = experiment.metrics.get_stats("loss")
+ print(f"Mean: {stats.mean}, Std: {stats.std}")
+
+ # Get percentiles
+ p95 = experiment.metrics.get_percentile("accuracy", 95)
+
+ # Get summaries at specific frequencies
+ summaries = experiment.metrics.get_summary("loss", frequency=100)
+ ```
+
+ </details>
+
+ <details>
+ <summary><strong>🔄 Serialization System</strong></summary>
+
+ ### Type-Annotated Serialization
+ - Uses `$t` for type keys
+ - Uses `$s` for shape keys (arrays)
+ - Recursive serialization for nested structures
+ - Supports: primitives, datetime, numpy, Path, bytes, collections
+
+ ```python
+ from datetime import datetime
+ from pathlib import Path
+
+ import numpy as np
+
+ from ml_dash.serdes import serialize, deserialize
+
+ # Serialize complex objects
+ data = {
+     "array": np.array([[1, 2], [3, 4]]),
+     "date": datetime.now(),
+     "path": Path("/tmp/file.txt")
+ }
+ serialized = serialize(data)
+
+ # Deserialize back
+ original = deserialize(serialized)
+ ```
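+
+ The exact on-disk layout is defined in `serdes/`; purely as an illustration of the
+ `$t`/`$s` convention described above, the serialized form of `data` might look
+ something like this (field names other than `$t` and `$s` are hypothetical):
+
+ ```python
+ {
+     "array": {"$t": "ndarray", "$s": [2, 2], "data": [1, 2, 3, 4], "dtype": "int64"},
+     "date": {"$t": "datetime", "value": "2025-01-01T12:00:00"},
+     "path": {"$t": "Path", "value": "/tmp/file.txt"},
+ }
+ ```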
+
+ </details>
+
+ ## Examples
+
+ <details>
+ <summary><strong>🤖 ML Training Example</strong></summary>
+
+ ```python
+ # train.py - Define your training function
+ from ml_dash import get_logger
+
+ experiment = get_logger("s3://experiments/mnist")
+
+
+ @experiment.run
+ def train(config):
+     """Training function that will be wrapped by the experiment."""
+     model = create_model(config.model_type)
+     optimizer = torch.optim.Adam(model.parameters(), lr=config.lr)
+
+     best_acc = 0
+     for epoch in range(config.epochs):
+         # Training loop
+         for batch_idx, (data, target) in enumerate(train_loader):
+             loss = train_step(model, data, target, optimizer)
+
+             step = epoch * len(train_loader) + batch_idx
+             with experiment.step(step):
+                 # Log metrics
+                 experiment.log_metric("train/loss", loss.item())
+
+                 # Log histograms periodically
+                 if step % 100 == 0:
+                     experiment.log_histogram("gradients", get_gradients(model))
+
+                 # Save visualizations
+                 if step % 500 == 0:
+                     fig = plot_predictions(model, data)
+                     experiment.log_image("predictions", fig)
+
+         # Validation
+         val_loss, val_acc = validate(model, val_loader)
+         experiment.log_metrics({
+             "val/loss": val_loss,
+             "val/accuracy": val_acc
+         }, step=epoch)
+
+         # Save checkpoint
+         if val_acc > best_acc:
+             experiment.log_model("best_model", model.state_dict())
+             best_acc = val_acc
+
+     # Final summary
+     experiment.info(f"Training completed. Best accuracy: {best_acc}")
+     return {"best_accuracy": best_acc}
+ ```
+
+ **experiment.py** - Launch experiments with different configs:
+
+ ```python
+ from ml_dash import get_logger
+ from train import train
+
+ # Initialize logger
+ experiment = get_logger("s3://experiments/mnist")
+
+ # Define experiment configurations
+ configs = [
+     {"model_type": "CNN", "lr": 0.001, "batch_size": 32, "epochs": 100},
+     {"model_type": "CNN", "lr": 0.01, "batch_size": 64, "epochs": 100},
+     {"model_type": "ResNet", "lr": 0.001, "batch_size": 32, "epochs": 150},
+ ]
+
+ # Run experiment with multiple configurations
+ with experiment.experiment("model_comparison"):
+     for i, config in enumerate(configs):
+         # Each config gets its own run
+         run_name = f"{config['model_type']}_lr{config['lr']}"
+
+         # The decorator handles run creation and lifecycle
+         result = train(
+             config=config,
+             _run_name=run_name,
+             _hyperparams=config,
+             _tags=["baseline", config["model_type"].lower()]
+         )
+
+         print(f"Run {run_name} completed with accuracy: {result['best_accuracy']}")
+ ```
+
+ </details>
+
+ <details>
+ <summary><strong>🔍 Debugging Example</strong></summary>
+
+ ```python
+ from ml_dash import get_logger, LogLevel
+
+ # Setup logger with debug level
+ experiment = get_logger("./debug_logs")
+ experiment.logs.set_level(LogLevel.DEBUG)
+
+ try:
+     # Your code here
+     result = risky_operation()
+     experiment.debug(f"Operation result: {result}")
+
+ except Exception as e:
+     # Log exception with full traceback
+     experiment.exception("Operation failed", exc_info=True)
+
+     # Log additional context
+     experiment.error("Failed at step", step=current_step,
+                      input_shape=data.shape)
+
+     # Save problematic data for debugging
+     experiment.log_file("failed_input", "debug_data.pkl")
+
+ finally:
+     # Get recent logs
+     errors = experiment.get_logs(level="ERROR", limit=50)
+     print(f"Found {len(errors)} errors")
+ ```
+
+ </details>
ml_dash/__init__.py CHANGED
@@ -1 +1,14 @@
- from .main import app
+ """ML-Logger: A minimal, local-first experiment tracking library."""
+
+ from .run import Experiment
+ from .ml_logger import ML_Logger, LogLevel
+ from .job_logger import JobLogger
+
+ __version__ = "0.4.0"
+
+ __all__ = [
+     "Experiment",
+     "ML_Logger",
+     "LogLevel",
+     "JobLogger",
+ ]
ml_dash/autolog.py ADDED
@@ -0,0 +1,32 @@
+ """Auto-configured experiment for ML-Logger.
+
+ This module provides a pre-configured global `experiment` instance that can be
+ imported and used immediately without manual setup.
+
+ Example:
+     from ml_dash.autolog import experiment
+
+     # No setup needed!
+     experiment.params.set(learning_rate=0.001)
+     experiment.metrics.log(step=0, loss=0.5)
+     experiment.files.save(model.state_dict(), "checkpoint.pt")
+
+ Configuration:
+     The auto-experiment is configured from environment variables:
+     - ML_LOGGER_NAMESPACE: User/team namespace (default: "default")
+     - ML_LOGGER_WORKSPACE: Project workspace (default: "experiments")
+     - ML_LOGGER_PREFIX: Experiment prefix (default: auto-generated timestamp+uuid)
+     - ML_LOGGER_REMOTE: Remote server URL (optional)
+
+     Or from ~/.ml-logger/config.yaml:
+         namespace: alice
+         workspace: my-project
+         remote: http://localhost:3001
+ """
+
+ from .run import Experiment
+
+ # Auto-configured global experiment instance
+ experiment = Experiment._auto_configure()
+
+ __all__ = ["experiment"]
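As the docstring notes, the global instance is configured when the module is imported, so environment variables must be set beforehand. A minimal sketch (the variable names come from the docstring above; the values are examples only):

```python
import os

# Set before the first import, since Experiment._auto_configure() runs at import time.
os.environ["ML_LOGGER_NAMESPACE"] = "alice"       # example value
os.environ["ML_LOGGER_WORKSPACE"] = "my-project"  # example value

from ml_dash.autolog import experiment

experiment.params.set(learning_rate=0.001)
experiment.metrics.log(step=0, loss=0.5)
```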
ml_dash/backends/__init__.py ADDED
@@ -0,0 +1,11 @@
+ """Storage backends for ML-Logger."""
+
+ from .base import StorageBackend
+ from .local_backend import LocalBackend
+ from .dash_backend import DashBackend
+
+ __all__ = [
+     "StorageBackend",
+     "LocalBackend",
+     "DashBackend",
+ ]
ml_dash/backends/base.py ADDED
@@ -0,0 +1,124 @@
+ """Storage backend abstract base class for ML-Logger.
+
+ This module defines the abstract interface that all storage backends must implement.
+ """
+
+ from abc import ABC, abstractmethod
+ from pathlib import Path
+ from typing import Optional, List
+
+
+ class StorageBackend(ABC):
+     """Abstract base class for storage backends.
+
+     All storage backends (local, S3, GCP, ML-Dash) must implement these methods.
+     """
+
+     @abstractmethod
+     def exists(self, path: str) -> bool:
+         """Check if a file or directory exists.
+
+         Args:
+             path: Path to check
+
+         Returns:
+             True if path exists, False otherwise
+         """
+         pass
+
+     @abstractmethod
+     def write_bytes(self, path: str, data: bytes) -> None:
+         """Write binary data to a file.
+
+         Args:
+             path: File path
+             data: Binary data to write
+         """
+         pass
+
+     @abstractmethod
+     def read_bytes(self, path: str) -> bytes:
+         """Read binary data from a file.
+
+         Args:
+             path: File path
+
+         Returns:
+             Binary data from file
+         """
+         pass
+
+     @abstractmethod
+     def write_text(self, path: str, text: str) -> None:
+         """Write text to a file.
+
+         Args:
+             path: File path
+             text: Text to write
+         """
+         pass
+
+     @abstractmethod
+     def read_text(self, path: str) -> str:
+         """Read text from a file.
+
+         Args:
+             path: File path
+
+         Returns:
+             Text content from file
+         """
+         pass
+
+     @abstractmethod
+     def append_text(self, path: str, text: str) -> None:
+         """Append text to a file.
+
+         Args:
+             path: File path
+             text: Text to append
+         """
+         pass
+
+     @abstractmethod
+     def list_dir(self, path: str = "") -> List[str]:
+         """List contents of a directory.
+
+         Args:
+             path: Directory path (empty string for root)
+
+         Returns:
+             List of file/directory names
+         """
+         pass
+
+     @abstractmethod
+     def get_url(self, path: str) -> Optional[str]:
+         """Get a URL for accessing a file (if applicable).
+
+         Args:
+             path: File path
+
+         Returns:
+             URL string or None if not applicable
+         """
+         pass
+
+     @abstractmethod
+     def makedirs(self, path: str, exist_ok: bool = True) -> None:
+         """Create directories recursively.
+
+         Args:
+             path: Directory path to create
+             exist_ok: Don't raise error if directory exists
+         """
+         pass
+
+     @abstractmethod
+     def delete(self, path: str) -> None:
+         """Delete a file.
+
+         Args:
+             path: File path to delete
+         """
+         pass
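A backend satisfying this interface can be sketched quickly; the in-memory class below is purely illustrative (it is not part of the package) and exists only to show one way the abstract methods above fit together:

```python
from typing import List, Optional

from ml_dash.backends.base import StorageBackend


class MemoryBackend(StorageBackend):
    """Toy backend that keeps files in a dict; useful for tests, not persistence."""

    def __init__(self) -> None:
        self._files: dict = {}

    def exists(self, path: str) -> bool:
        return path in self._files

    def write_bytes(self, path: str, data: bytes) -> None:
        self._files[path] = data

    def read_bytes(self, path: str) -> bytes:
        return self._files[path]

    def write_text(self, path: str, text: str) -> None:
        self._files[path] = text.encode("utf-8")

    def read_text(self, path: str) -> str:
        return self._files[path].decode("utf-8")

    def append_text(self, path: str, text: str) -> None:
        self._files[path] = self._files.get(path, b"") + text.encode("utf-8")

    def list_dir(self, path: str = "") -> List[str]:
        prefix = f"{path}/" if path else ""
        children = {p[len(prefix):].split("/")[0]
                    for p in self._files if p.startswith(prefix)}
        return sorted(children)

    def get_url(self, path: str) -> Optional[str]:
        return None  # in-memory storage has no URL scheme

    def makedirs(self, path: str, exist_ok: bool = True) -> None:
        pass  # directories are implicit in the flat key space

    def delete(self, path: str) -> None:
        self._files.pop(path, None)
```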