microlens-submit 0.12.2__py3-none-any.whl → 0.16.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (34) hide show
  1. microlens_submit/__init__.py +7 -157
  2. microlens_submit/cli/__init__.py +5 -0
  3. microlens_submit/cli/__main__.py +6 -0
  4. microlens_submit/cli/commands/__init__.py +1 -0
  5. microlens_submit/cli/commands/dossier.py +139 -0
  6. microlens_submit/cli/commands/export.py +177 -0
  7. microlens_submit/cli/commands/init.py +172 -0
  8. microlens_submit/cli/commands/solutions.py +722 -0
  9. microlens_submit/cli/commands/validation.py +241 -0
  10. microlens_submit/cli/main.py +120 -0
  11. microlens_submit/dossier/__init__.py +51 -0
  12. microlens_submit/dossier/dashboard.py +499 -0
  13. microlens_submit/dossier/event_page.py +369 -0
  14. microlens_submit/dossier/full_report.py +330 -0
  15. microlens_submit/dossier/solution_page.py +533 -0
  16. microlens_submit/dossier/utils.py +111 -0
  17. microlens_submit/error_messages.py +283 -0
  18. microlens_submit/models/__init__.py +28 -0
  19. microlens_submit/models/event.py +406 -0
  20. microlens_submit/models/solution.py +569 -0
  21. microlens_submit/models/submission.py +569 -0
  22. microlens_submit/tier_validation.py +208 -0
  23. microlens_submit/utils.py +373 -0
  24. microlens_submit/validate_parameters.py +478 -180
  25. {microlens_submit-0.12.2.dist-info → microlens_submit-0.16.0.dist-info}/METADATA +42 -27
  26. microlens_submit-0.16.0.dist-info/RECORD +32 -0
  27. {microlens_submit-0.12.2.dist-info → microlens_submit-0.16.0.dist-info}/WHEEL +1 -1
  28. microlens_submit/api.py +0 -1257
  29. microlens_submit/cli.py +0 -1803
  30. microlens_submit/dossier.py +0 -1443
  31. microlens_submit-0.12.2.dist-info/RECORD +0 -13
  32. {microlens_submit-0.12.2.dist-info/licenses → microlens_submit-0.16.0.dist-info}/LICENSE +0 -0
  33. {microlens_submit-0.12.2.dist-info → microlens_submit-0.16.0.dist-info}/entry_points.txt +0 -0
  34. {microlens_submit-0.12.2.dist-info → microlens_submit-0.16.0.dist-info}/top_level.txt +0 -0
@@ -0,0 +1,208 @@
1
+ """
2
+ Tier validation module for microlens-submit.
3
+
4
+ This module provides centralized validation logic for challenge tiers and their
5
+ associated event lists. It validates event IDs against tier-specific event lists
6
+ and provides tier definitions for the microlensing data challenge.
7
+
8
+ The module defines:
9
+ - Tier definitions with associated event lists
10
+ - Event ID validation functions
11
+ - Tier-specific validation logic
12
+
13
+ **Supported Tiers:**
14
+ - standard: Standard challenge tier with limited event set
15
+ - advanced: Advanced challenge tier with full event set
16
+ - (no "basic" tier is defined; unknown tiers skip event validation)
17
+ - test: Testing tier for development
18
+ - 2018-test: 2018 test events tier
19
+ - None: No validation tier (skips event validation)
20
+
21
+ Example:
22
+ >>> from microlens_submit.tier_validation import validate_event_id, TIER_DEFINITIONS
23
+ >>>
24
+ >>> # Check if an event is valid for a tier
25
+ >>> is_valid = validate_event_id("EVENT001", "standard")
26
+ >>> if is_valid:
27
+ ... print("Event is valid for standard tier")
28
+ ... else:
29
+ ... print("Event is not valid for standard tier")
30
+
31
+ >>> # Get available tiers
32
+ >>> print("Available tiers:", list(TIER_DEFINITIONS.keys()))
33
+
34
+ Note:
35
+ All validation functions return boolean values and provide human-readable
36
+ error messages for invalid events. The "None" tier skips all validation.
37
+ """
38
+
39
+ from typing import Dict, List, Optional, Set
40
+
41
# Tier definitions with their associated event lists.
# Each entry maps a tier name to a human-readable description and the list
# of event IDs that are considered valid submissions for that tier.
TIER_DEFINITIONS = {
    "standard": {
        "description": "Standard challenge tier with limited event set",
        "event_list": [
            # Add standard tier events here
            "EVENT001",
            "EVENT002",
            "EVENT003",
        ],
    },
    "advanced": {
        "description": "Advanced challenge tier with full event set",
        "event_list": [
            # Add advanced tier events here
            "EVENT001",
            "EVENT002",
            "EVENT003",
            "EVENT004",
            "EVENT005",
            "EVENT006",
            "EVENT007",
        ],
    },
    "test": {
        "description": "Testing tier for development",
        "event_list": [
            # Add test events here
            "evt",
            "test-event",
        ],
    },
    "2018-test": {
        "description": "2018 test events tier",
        "event_list": [
            # Add 2018 test events here
            "2018-EVENT-001",
            "2018-EVENT-002",
        ],
    },
    # NOTE: the key is the literal string "None", not the None singleton;
    # validate_event_id() special-cases this tier and skips validation.
    "None": {
        "description": "No validation tier (skips event validation)",
        "event_list": [],  # Empty list means no validation
    },
}

# Cache for event lists to avoid repeated list creation.
# Populated lazily by get_tier_event_list(); maps tier name -> frozen
# snapshot (as a set) of that tier's event_list above.
_EVENT_LIST_CACHE: Dict[str, Set[str]] = {}
89
+
90
+
91
def get_tier_event_list(tier: str) -> Set[str]:
    """Return the set of valid event IDs for a given tier.

    The result is computed once per tier from ``TIER_DEFINITIONS`` and then
    served from ``_EVENT_LIST_CACHE`` on subsequent calls.

    Args:
        tier: The challenge tier name.

    Returns:
        Set[str]: Set of valid event IDs for the tier.

    Raises:
        ValueError: If the tier is not defined.

    Example:
        >>> events = get_tier_event_list("standard")
        >>> print(f"Standard tier has {len(events)} events")
        >>> print("EVENT001" in events)
    """
    try:
        definition = TIER_DEFINITIONS[tier]
    except KeyError:
        # Same message as the original lookup-based check; suppress the
        # KeyError context so callers see a clean ValueError.
        raise ValueError(f"Unknown tier: {tier}. Available tiers: {list(TIER_DEFINITIONS.keys())}") from None

    # Lazily build and memoize the set form of the tier's event list.
    cached = _EVENT_LIST_CACHE.get(tier)
    if cached is None:
        cached = set(definition["event_list"])
        _EVENT_LIST_CACHE[tier] = cached
    return cached
116
+
117
+
118
def validate_event_id(event_id: str, tier: str) -> bool:
    """Check whether an event ID is valid for a given tier.

    Validation is skipped entirely (always returns ``True``) for the
    literal tier name ``"None"`` and for any tier that is not present in
    ``TIER_DEFINITIONS``.

    Args:
        event_id: The event ID to validate.
        tier: The challenge tier to validate against.

    Returns:
        bool: True if the event ID is valid for the tier, False otherwise.

    Example:
        >>> is_valid = validate_event_id("EVENT001", "standard")
        >>> if is_valid:
        ...     print("Event is valid for standard tier")
        ... else:
        ...     print("Event is not valid for standard tier")
    """
    # "None" tier and undefined tiers opt out of event validation.
    skip_validation = tier == "None" or tier not in TIER_DEFINITIONS
    if skip_validation:
        return True
    return event_id in get_tier_event_list(tier)
141
+
142
+
143
def get_event_validation_error(event_id: str, tier: str) -> Optional[str]:
    """Build a human-readable error message for an invalid event ID.

    Args:
        event_id: The event ID that failed validation.
        tier: The challenge tier that was validated against.

    Returns:
        Optional[str]: Error message if the event is invalid, None if valid
        (or if the tier skips validation).

    Example:
        >>> error = get_event_validation_error("INVALID_EVENT", "standard")
        >>> if error:
        ...     print(f"Validation error: {error}")
        ... else:
        ...     print("Event is valid")
    """
    if validate_event_id(event_id, tier):
        return None

    # Defensive: "None" and undefined tiers never produce an error.
    # (validate_event_id already returns True for them, so this is a
    # belt-and-braces check kept for parity with the validation logic.)
    if tier == "None" or tier not in TIER_DEFINITIONS:
        return None

    allowed = get_tier_event_list(tier)
    description = TIER_DEFINITIONS[tier]["description"]
    return (
        f"Event '{event_id}' is not valid for tier '{tier}' ({description}). "
        f"Valid events for this tier: {sorted(allowed)}"
    )
174
+
175
+
176
def get_available_tiers() -> List[str]:
    """Return the names of all defined tiers.

    Returns:
        List[str]: List of all available tier names.

    Example:
        >>> tiers = get_available_tiers()
        >>> print(f"Available tiers: {tiers}")
    """
    # Iterating a dict yields its keys in insertion order.
    return [name for name in TIER_DEFINITIONS]
187
+
188
+
189
def get_tier_description(tier: str) -> str:
    """Return the human-readable description for a tier.

    Args:
        tier: The tier name.

    Returns:
        str: Description of the tier.

    Raises:
        ValueError: If the tier is not defined.

    Example:
        >>> desc = get_tier_description("standard")
        >>> print(f"Standard tier: {desc}")
    """
    if tier in TIER_DEFINITIONS:
        return TIER_DEFINITIONS[tier]["description"]
    raise ValueError(f"Unknown tier: {tier}. Available tiers: {list(TIER_DEFINITIONS.keys())}")
@@ -0,0 +1,373 @@
1
+ """Utility functions for microlens-submit.
2
+
3
+ This module contains utility functions for importing data and loading
4
+ submissions.
5
+ """
6
+
7
+ import csv
8
+ import json
9
+ import shutil
10
+ from pathlib import Path
11
+ from typing import Optional
12
+
13
+ # Resolve forward references
14
+ from .models.event import Event
15
+ from .models.submission import Submission
16
+
17
+
18
def load(project_path: str) -> Submission:
    """Load or create a submission project from a directory.

    This is the main entry point for working with submission projects. If the
    directory doesn't exist, it is created with a basic project structure and
    an empty ``submission.json`` is written. If it exists, the submission data
    is loaded from disk, along with every event found under ``events/``.

    Args:
        project_path: Path to the project directory.

    Returns:
        A :class:`Submission` instance representing the project.

    Example:
        >>> from microlens_submit import load
        >>> submission = load("./my_project")
        >>> submission.team_name = "Team Alpha"
        >>> submission.tier = "advanced"
        >>> event = submission.get_event("EVENT001")
        >>> params = {"t0": 2459123.5, "u0": 0.1, "tE": 20.0}
        >>> solution = event.add_solution("1S1L", params)
        >>> submission.save()
        >>> submission.export("submission.zip")

    Note:
        The project directory structure is automatically created when you
        first call load() with a new directory. All data is stored in JSON
        format with a clear directory structure for events and solutions.
    """
    root = Path(project_path)
    events_root = root / "events"

    if not root.exists():
        # Fresh project: create the directory skeleton and persist an empty
        # submission.json so subsequent loads find a valid manifest.
        events_root.mkdir(parents=True, exist_ok=True)
        fresh = Submission(project_path=str(root))
        payload = fresh.model_dump_json(
            exclude={"events", "project_path"},
            indent=2,
        )
        (root / "submission.json").write_text(payload, encoding="utf-8")
        return fresh

    manifest = root / "submission.json"
    if manifest.exists():
        submission = Submission.model_validate_json(manifest.read_text(encoding="utf-8"))
        # project_path is excluded from the serialized form, so restore it.
        submission.project_path = str(root)
    else:
        submission = Submission(project_path=str(root))

    # Each subdirectory of events/ holds one event's data.
    if events_root.exists():
        for entry in events_root.iterdir():
            if not entry.is_dir():
                continue
            event = Event._from_dir(entry, submission)
            submission.events[event.event_id] = event

    return submission
90
+
91
+
92
def _detect_csv_delimiter(csv_file: Path) -> str:
    """Guess the delimiter from the first 1 KiB: tab, then semicolon, then comma."""
    with open(csv_file, "r", encoding="utf-8") as f:
        sample = f.read(1024)
    if "\t" in sample:
        return "\t"
    if ";" in sample:
        return ";"
    return ","


def _extract_model_info(model_tags: list) -> tuple:
    """Split model_tags into ``(model_type, higher_order_effects)``.

    Exactly one model-type tag is allowed; a second one raises ValueError.
    ``"other"`` is checked as a model type first, so it never counts as a
    higher-order effect. Unknown tags are silently ignored.
    """
    type_tags = {"1S1L", "1S2L", "2S1L", "2S2L", "1S3L", "2S3L", "other"}
    effect_tags = {
        "parallax",
        "finite-source",
        "lens-orbital-motion",
        "xallarap",
        "gaussian-process",
        "stellar-rotation",
        "fitted-limb-darkening",
        "other",
    }
    model_type = None
    effects = []
    for tag in model_tags:
        if tag in type_tags:
            if model_type is not None:
                raise ValueError("Multiple model types specified")
            model_type = tag
        elif tag in effect_tags:
            effects.append(tag)
    return model_type, effects


def _parse_row_parameters(row: dict) -> dict:
    """Collect model parameters from the non-reserved columns of a CSV row.

    Values that parse as floats become floats; everything else is kept as a
    string. Empty/blank cells are skipped.
    """
    reserved = {
        "event_id",
        "solution_id",
        "solution_alias",
        "model_tags",
        "notes",
        "parameters",
    }
    parameters = {}
    for column, value in row.items():
        if column in reserved or value is None:
            continue
        text = value if isinstance(value, str) else str(value)
        if not text.strip():
            continue
        try:
            parameters[column] = float(text)
        except ValueError:
            parameters[column] = text
    return parameters


def import_solutions_from_csv(
    submission,
    csv_file: Path,
    parameter_map_file: Optional[Path] = None,
    delimiter: Optional[str] = None,
    dry_run: bool = False,
    validate: bool = False,
    on_duplicate: str = "error",
    project_path: Optional[Path] = None,
) -> dict:
    """Import solutions from a CSV file into a :class:`Submission`.

    The CSV must contain an ``event_id`` column along with either ``solution_id``
    or ``solution_alias`` and a ``model_tags`` column. Parameter values can be
    provided as individual columns or via a JSON-encoded ``parameters`` column.
    Additional columns such as ``notes`` are also supported. The optional
    ``parameter_map_file`` can map arbitrary CSV column names to the expected
    attribute names (currently a placeholder — not yet implemented).

    Args:
        submission: The active :class:`Submission` object.
        csv_file: Path to the CSV file to read.
        parameter_map_file: Optional YAML file that remaps CSV column names.
        delimiter: CSV delimiter. If ``None`` the delimiter is automatically
            detected.
        dry_run: If ``True``, parse and validate the file but do not persist
            any changes. ``successful_imports`` still counts rows that would
            have been imported.
        validate: If ``True``, run solution validation as each row is imported
            (only effective when ``dry_run`` is False, since validation needs
            the created solution object).
        on_duplicate: Policy for handling duplicate alias keys: ``error``,
            ``override``, or ``ignore``.
        project_path: Project root used for resolving relative file paths.

    Returns:
        dict: Summary statistics describing the import operation, with keys
        ``total_rows``, ``successful_imports``, ``skipped_rows``,
        ``validation_errors``, ``duplicate_handled`` and ``errors``.

    Raises:
        ValueError: If ``on_duplicate`` is not one of the accepted policies.

    Example:
        >>> from microlens_submit.utils import load, import_solutions_from_csv
        >>> sub = load("./project")
        >>> stats = import_solutions_from_csv(
        ...     sub,
        ...     Path("solutions.csv"),
        ...     validate=True,
        ... )
        >>> print(stats["successful_imports"], "solutions imported")

    Note:
        This function performs no console output. Use the CLI wrapper
        :func:`microlens_submit.cli.import_solutions` for user-facing messages.
    """
    if on_duplicate not in ["error", "override", "ignore"]:
        raise ValueError(f"Invalid on_duplicate: {on_duplicate}")

    if project_path is None:
        project_path = Path(".")

    # Load parameter mapping if provided.
    if parameter_map_file:
        with open(parameter_map_file, "r", encoding="utf-8") as f:
            # TODO: Implement parameter mapping functionality
            pass

    if not delimiter:
        delimiter = _detect_csv_delimiter(csv_file)

    stats = {
        "total_rows": 0,
        "successful_imports": 0,
        "skipped_rows": 0,
        "validation_errors": 0,
        "duplicate_handled": 0,
        "errors": [],
    }

    with open(csv_file, "r", newline="", encoding="utf-8") as f:
        lines = f.readlines()

    # The header may be written as a comment ("# col1,col2,..."): use the
    # first comment line if one exists, otherwise the first line.
    header_row = 0
    for i, line in enumerate(lines):
        if line.strip().startswith("#"):
            header_row = i
            break

    header_line = lines[header_row].strip()
    if header_line.startswith("# "):
        header_line = header_line[2:]
    elif header_line.startswith("#"):
        header_line = header_line[1:]

    reader = csv.DictReader(
        [header_line] + lines[header_row + 1 :],
        delimiter=delimiter,
    )

    # row_num is the 1-based file line number of each data row, for messages.
    for row_num, row in enumerate(reader, start=header_row + 2):
        stats["total_rows"] += 1

        try:
            # --- Required fields -------------------------------------------
            if not row.get("event_id"):
                stats["skipped_rows"] += 1
                stats["errors"].append(f"Row {row_num}: Missing event_id")
                continue

            solution_id = row.get("solution_id")
            solution_alias = row.get("solution_alias")
            if not solution_id and not solution_alias:
                stats["skipped_rows"] += 1
                stats["errors"].append(f"Row {row_num}: Missing solution_id or solution_alias")
                continue

            if not row.get("model_tags"):
                stats["skipped_rows"] += 1
                stats["errors"].append(f"Row {row_num}: Missing model_tags")
                continue

            # --- Model tags ------------------------------------------------
            try:
                model_tags = json.loads(row["model_tags"])
            except json.JSONDecodeError:
                stats["skipped_rows"] += 1
                stats["errors"].append(f"Row {row_num}: Invalid model_tags JSON")
                continue
            # Previously a non-list value raised past the JSON handler and was
            # never counted as a skipped row; count it explicitly here.
            if not isinstance(model_tags, list):
                stats["skipped_rows"] += 1
                stats["errors"].append(f"Row {row_num}: model_tags must be a list")
                continue

            # Previously "multiple model types" only continued the inner tag
            # loop, so the row was counted as skipped yet still imported.
            # Now the whole row is skipped.
            try:
                model_type, higher_order_effects = _extract_model_info(model_tags)
            except ValueError:
                stats["skipped_rows"] += 1
                stats["errors"].append(f"Row {row_num}: Multiple model types specified")
                continue

            if not model_type:
                stats["skipped_rows"] += 1
                stats["errors"].append(f"Row {row_num}: No valid model type found in model_tags")
                continue

            # --- Parameters ------------------------------------------------
            # Per-column values take precedence; fall back to the JSON-encoded
            # "parameters" column only when no parameter columns were found.
            parameters = _parse_row_parameters(row)
            if not parameters and row.get("parameters"):
                try:
                    parameters = json.loads(row["parameters"])
                except json.JSONDecodeError:
                    stats["skipped_rows"] += 1
                    stats["errors"].append(f"Row {row_num}: Invalid parameters JSON")
                    continue

            # --- Notes -----------------------------------------------------
            notes = (row.get("notes") or "").strip()
            notes_path = None
            notes_content = None
            if notes:
                candidate = Path(notes)
                if candidate.is_file():
                    # The cell names an existing markdown file to copy in.
                    notes_path = str(candidate)
                else:
                    # CSV files encode newlines as literal \n, so convert them
                    # to real newlines here. We do NOT do this when reading
                    # .md files or in set_notes(), because users may want
                    # literal '\n'.
                    notes_content = notes.replace("\\n", "\n").replace("\\r", "\r")

            # --- Event / duplicate handling --------------------------------
            event = submission.get_event(row["event_id"])

            alias_key = f"{row['event_id']} {solution_alias or solution_id}"
            existing_solution = None
            if solution_alias:
                existing_solution = submission.get_solution_by_alias(
                    row["event_id"],
                    solution_alias,
                )
            elif solution_id:
                existing_solution = event.get_solution(solution_id)

            if existing_solution:
                if on_duplicate == "error":
                    stats["skipped_rows"] += 1
                    stats["errors"].append(f"Row {row_num}: Duplicate alias key '{alias_key}'")
                    continue
                if on_duplicate == "ignore":
                    stats["duplicate_handled"] += 1
                    continue
                # on_duplicate == "override": drop the old solution, re-import.
                event.remove_solution(existing_solution.solution_id, force=True)
                stats["duplicate_handled"] += 1

            # --- Persist ---------------------------------------------------
            if not dry_run:
                solution = event.add_solution(model_type, parameters)
                # At least one of alias/id is guaranteed non-empty above.
                solution.alias = solution_alias or solution_id

                if higher_order_effects:
                    solution.higher_order_effects = higher_order_effects

                if notes_path:
                    staged = Path(project_path) / "tmp" / f"{solution.solution_id}.md"
                    staged.parent.mkdir(parents=True, exist_ok=True)
                    shutil.copy2(notes_path, staged)
                    solution.notes_path = str(staged.relative_to(project_path))
                elif notes_content:
                    solution.set_notes(
                        notes_content,
                        project_path,
                        convert_escapes=True,
                    )

                if validate:
                    validation_messages = solution.run_validation()
                    if validation_messages:
                        stats["validation_errors"] += 1
                        for msg in validation_messages:
                            stats["errors"].append(f"Row {row_num} validation: {msg}")

            # Count rows that parsed cleanly; in dry-run mode this previews
            # how many solutions WOULD be imported.
            stats["successful_imports"] += 1

        except Exception as e:
            stats["errors"].append(f"Row {row_num}: {str(e)}")
            continue

    return stats