PyPI - samplekit - Versions diffs - 0.1.0__py3-none-any.whl - Mend

samplekit 0.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (12)

samplekit/__init__.py +20 -0
samplekit/converters.py +117 -0
samplekit/property.py +332 -0
samplekit/report.py +214 -0
samplekit/sample.py +320 -0
samplekit/sample_list.py +190 -0
samplekit/table.py +612 -0
samplekit-0.1.0.dist-info/METADATA +422 -0
samplekit-0.1.0.dist-info/RECORD +12 -0
samplekit-0.1.0.dist-info/WHEEL +5 -0
samplekit-0.1.0.dist-info/licenses/LICENSE +8 -0
samplekit-0.1.0.dist-info/top_level.txt +1 -0

samplekit/__init__.py ADDED Viewed

@@ -0,0 +1,20 @@
+"""SampleKit — Scientific sample documentation framework."""
+from .property import Property
+from .table import Table, Column
+from .sample import Sample
+from .sample_list import SampleList
+from . import report
+from . import converters
+# Package version string.
+__version__ = "0.1.0"
+# Public API: the names exported by ``from samplekit import *``.
+# Every entry corresponds to one of the imports above.
+__all__ = [
+    "Property",
+    "Table",
+    "Column",
+    "Sample",
+    "SampleList",
+    "report",
+    "converters",
+]

samplekit/converters.py ADDED Viewed

@@ -0,0 +1,117 @@
+"""Converters — transform Samples to/from dicts, DataFrames, and other formats."""
+from __future__ import annotations
+from typing import Any, TYPE_CHECKING
+if TYPE_CHECKING:
+    from .sample import Sample
+    from .sample_list import SampleList
+# ── Sample converters ───────────────────────────────────
+def sample_to_dict(sample: Sample) -> dict[str, Any]:
+    """Flatten a sample into a nested, plain-Python dictionary.
+    Parameters
+    ----------
+    sample : Sample
+        Object exposing ``name``, a ``props`` mapping and a ``tables`` mapping.
+    Returns
+    -------
+    dict
+        ``{"name": ..., "prop_name": {"value": ..., "uncertainty": ..., ...}, ...}``.
+        Properties that contribute no field at all are left out; each table
+        is stored under its own key as the result of ``table.to_yaml()``.
+    """
+    exported: dict[str, Any] = {"name": sample.name}
+    for prop_name, prop in sample.props.items():
+        value, unc, unit, raw = prop.value, prop.uncertainty, prop.unit, prop.data
+        # (field, content, keep?) — the unit is kept on truthiness, the
+        # other fields whenever they are not None.
+        candidates = (
+            ("value", value, value is not None),
+            ("uncertainty", unc, unc is not None),
+            ("unit", unit, bool(unit)),
+            ("data", raw, raw is not None),
+        )
+        record: dict[str, Any] = {
+            field: content for field, content, keep in candidates if keep
+        }
+        if record:
+            exported[prop_name] = record
+    # Tables are written last, so a table key overrides an equally named property.
+    exported.update(
+        {table_name: table.to_yaml() for table_name, table in sample.tables.items()}
+    )
+    return exported
+def sample_to_dataframe(sample: Sample):
+    """Build a one-row pandas DataFrame from the non-string properties.
+    Parameters
+    ----------
+    sample : Sample
+        Object exposing ``name`` and a ``props`` mapping.
+    Returns
+    -------
+    pandas.DataFrame
+        A single row labelled with the sample name. Each property whose value
+        is neither ``None`` nor a string becomes a column; when it also has an
+        uncertainty, a companion ``<name>_unc`` column follows it.
+    """
+    import pandas as pd
+    columns: dict[str, Any] = {}
+    for key, prop in sample.props.items():
+        current = prop.value
+        if current is None or isinstance(current, str):
+            continue
+        columns[key] = current
+        if prop.uncertainty is not None:
+            columns[f"{key}_unc"] = prop.uncertainty
+    row_labels = [sample.name]
+    return pd.DataFrame(columns, index=row_labels)
+# ── SampleList converters ───────────────────────────────
+def samplelist_to_dataframe(sample_list: SampleList):
+    """Stack the per-sample frames into one DataFrame (one row per sample).
+    Parameters
+    ----------
+    sample_list : SampleList
+        Iterable of samples; each one is converted with ``sample_to_dataframe``.
+    Returns
+    -------
+    pandas.DataFrame
+        The concatenated rows, or an empty DataFrame when there are no samples.
+    """
+    import pandas as pd
+    per_sample = list(map(sample_to_dataframe, sample_list))
+    # pd.concat rejects an empty sequence, so the empty case is handled here.
+    if not per_sample:
+        return pd.DataFrame()
+    return pd.concat(per_sample)
+def samplelist_stats(sample_list: SampleList, prop_name: str):
+    """Summarise one property over every sample in the collection.
+    Parameters
+    ----------
+    sample_list : SampleList
+        Iterable of samples that can be indexed by property name.
+    prop_name : str
+        Property whose values are collected.
+    Returns
+    -------
+    pandas.Series
+        Output of ``pandas.Series.describe()`` on the collected floats.
+    """
+    import pandas as pd
+    numeric: list[float] = []
+    for sample in sample_list:
+        # Best effort: a sample that lacks the property, or whose value
+        # cannot be turned into a float, is simply left out.
+        try:
+            raw = sample[prop_name].value
+            if raw is None or isinstance(raw, str):
+                continue
+            numeric.append(float(raw))
+        except (KeyError, TypeError, ValueError):
+            continue
+    series = pd.Series(numeric, name=prop_name)
+    return series.describe()

samplekit/property.py ADDED Viewed

@@ -0,0 +1,332 @@
+"""Property — a scalar scientific quantity: value ± uncertainty [unit]."""
+from __future__ import annotations
+import statistics
+from typing import Any, Callable, TYPE_CHECKING
+if TYPE_CHECKING:
+    from .sample import Sample
+class Property:
+    """
+    Scientific property with value, uncertainty, unit, and optional computation.
+    Modes
+    -----
+    - Static:   Property(value=25.0)
+    - Measured:  Property(value=[25.1, 24.9, 25.0])     → auto mean ± std
+    - Computed:  Property(compute=self._calc_rho)         → lazy, cached, invalidated
+    Parameters
+    ----------
+    value : float, str, list[float], or None
+        Static value or list of measurements (auto mean ± std).
+        Ignored when ``compute`` is given.
+    uncertainty : float or None
+        Static uncertainty (overrides auto-std when value is a list).
+        Ignored when ``compute_unc`` is given.
+    unit : str
+        Plain-text unit (e.g. "°C", "kPa").
+    unit_math : str, optional
+        Math-mode unit for MathJax/LaTeX (defaults to unit).
+    symbol : str, optional
+        Text/unicode symbol for CLI/TUI display (defaults to name).
+    symbol_math : str, optional
+        Math-mode symbol for MathJax/LaTeX (defaults to symbol).
+    precision : str
+        Format spec for value (default "").
+    precision_unc : str, optional
+        Format spec for uncertainty (defaults to precision).
+    compute : callable, optional
+        Function() → float. Called lazily when value is accessed.
+    compute_unc : callable, optional
+        Function() → float. Called lazily when uncertainty is accessed.
+    depends_on : list[Property], optional
+        Properties that this one depends on. When they change,
+        this property's cache is invalidated.
+    """
+    def __init__(
+        self,
+        value: float | str | list[float] | None = None,
+        uncertainty: float | None = None,
+        unit: str = "",
+        unit_math: str | None = None,
+        symbol: str | None = None,
+        symbol_math: str | None = None,
+        precision: str = "",
+        precision_unc: str | None = None,
+        compute: Callable[[], Any] | None = None,
+        compute_unc: Callable[[], float] | None = None,
+        depends_on: list[Property] | None = None,
+    ):
+        # Identity (set by Sample.__setattr__)
+        self._name: str | None = None
+        self._parent: Sample | None = None
+        # Display
+        self.symbol = symbol
+        self.symbol_math = symbol_math
+        self.unit = unit
+        self.unit_math = unit_math or unit
+        self.precision = precision
+        self.precision_unc = precision_unc or precision
+        # Dependencies
+        self._depends_on_refs: list[Property] = depends_on or []
+        self._dependents: list[Property] = []
+        # Value backends
+        self._compute = compute
+        self._compute_unc = compute_unc
+        self._data: list[float] | None = None
+        self._static_value: float | str | None = None
+        self._static_uncertainty: float | None = None
+        # Cache (for computed properties)
+        self._value_cached: Any = None
+        self._unc_cached: float | None = None
+        self._value_cache_valid = False
+        self._unc_cache_valid = False
+        # Initialize from constructor args; a compute callable takes
+        # precedence over the corresponding static argument.
+        if compute is None:
+            if isinstance(value, list):
+                # Copy so later mutation of the caller's list is not seen here.
+                self._data = list(value)
+            else:
+                self._static_value = value
+        if compute_unc is None:
+            self._static_uncertainty = uncertainty
+    # ── Name ─────────────────────────────────────────────
+    @property
+    def name(self) -> str | None:
+        """Name assigned to this property, or None while unassigned."""
+        return self._name
+    # ── Value ────────────────────────────────────────────
+    @property
+    def value(self) -> float | str | None:
+        """Current value.
+        Resolution order: cached result of ``compute`` (evaluated on first
+        access after an invalidation), then the mean of the measurement list
+        (None for an empty list), then the static value.
+        """
+        if self._compute is not None:
+            if not self._value_cache_valid:
+                self._value_cached = self._compute()
+                self._value_cache_valid = True
+            return self._value_cached
+        if self._data is not None:
+            return statistics.mean(self._data) if self._data else None
+        return self._static_value
+    @value.setter
+    def value(self, val):
+        """Set value directly (clears compute if any)."""
+        self._compute = None
+        if isinstance(val, list):
+            self._data = list(val)
+            self._static_value = None
+        else:
+            self._data = None
+            self._static_value = val
+        self._value_cache_valid = False
+        self._invalidate_dependents()
+    # ── Uncertainty ──────────────────────────────────────
+    @property
+    def uncertainty(self) -> float | None:
+        """Current uncertainty.
+        Resolution order: cached result of ``compute_unc``, then the static
+        uncertainty, then the sample standard deviation of the measurement
+        list when it holds more than one entry; otherwise None.
+        """
+        if self._compute_unc is not None:
+            if not self._unc_cache_valid:
+                self._unc_cached = self._compute_unc()
+                self._unc_cache_valid = True
+            return self._unc_cached
+        if self._static_uncertainty is not None:
+            return self._static_uncertainty
+        # Auto std from measurement list (stdev needs at least two points)
+        if self._data is not None and len(self._data) > 1:
+            return statistics.stdev(self._data)
+        return None
+    @uncertainty.setter
+    def uncertainty(self, val):
+        """Set a static uncertainty (clears compute_unc if any)."""
+        self._compute_unc = None
+        self._static_uncertainty = val
+        self._unc_cache_valid = False
+        self._invalidate_dependents()
+    # ── Data (raw measurements) ──────────────────────────
+    @property
+    def data(self) -> list[float] | None:
+        """Copy of the raw measurement list, or None when there is none."""
+        return list(self._data) if self._data is not None else None
+    @property
+    def is_computed(self) -> bool:
+        """True while a ``compute`` callable backs the value."""
+        return self._compute is not None
+    # ── Cache management ────────────────────────────────
+    def invalidate(self):
+        """Manually invalidate this property's cache and propagate."""
+        self._value_cache_valid = False
+        self._unc_cache_valid = False
+        self._invalidate_dependents()
+    def _invalidate_dependents(self, _seen: set[int] | None = None):
+        """Mark every transitive dependent's caches as stale.
+        ``_seen`` holds the ids of already-visited properties so that a
+        dependency cycle cannot recurse forever.
+        """
+        if _seen is None:
+            _seen = set()
+        for dep in self._dependents:
+            dep_id = id(dep)
+            if dep_id not in _seen:
+                _seen.add(dep_id)
+                dep._value_cache_valid = False
+                dep._unc_cache_valid = False
+                dep._invalidate_dependents(_seen)
+    def _wire_dependencies(self):
+        """Register self as a dependent of each dependency."""
+        for dep in self._depends_on_refs:
+            if isinstance(dep, Property) and self not in dep._dependents:
+                dep._dependents.append(self)
+    def _seed_cache(self, value=None, uncertainty=None):
+        """Seed the cache for a computed property (used during hydration).
+        A None argument leaves the corresponding cache untouched.
+        """
+        if value is not None:
+            self._value_cached = value
+            self._value_cache_valid = True
+        if uncertainty is not None:
+            self._unc_cached = uncertainty
+            self._unc_cache_valid = True
+    # ── Display ─────────────────────────────────────────
+    @property
+    def text(self) -> str:
+        """Plain-text rendering, same as ``format()``."""
+        return self.format()
+    def format(self, unit: bool = True) -> str:
+        """Format as plain text.
+        Parameters
+        ----------
+        unit : bool
+            Include unit in output.
+        Returns
+        -------
+        str
+            "N/A" when there is no value; otherwise ``value``,
+            ``value ± uncertainty`` (only for a non-zero uncertainty), with
+            the unit appended unless it is empty or "-".
+        """
+        v = self.value
+        if v is None:
+            return "N/A"
+        # String values (e.g. material name)
+        if isinstance(v, str):
+            if unit and self.unit and self.unit != "-":
+                return f"{v} {self.unit}"
+            return v
+        u = self.uncertainty
+        v_str = f"{v:{self.precision}}"
+        if u is not None and u != 0:
+            u_str = f"{u:{self.precision_unc}}"
+            val_part = f"{v_str} ± {u_str}"
+        else:
+            val_part = v_str
+        if unit and self.unit and self.unit != "-":
+            return f"{val_part} {self.unit}"
+        return val_part
+    def __repr__(self):
+        return f"Property({self._name}: {self.text})"
+    def __str__(self):
+        return self.text
+    # ── Serialization ───────────────────────────────────
+    def to_yaml(self) -> Any:
+        """Convert to a YAML-friendly value (scalar, dict, or None).
+        Returns
+        -------
+        Any
+            A bare string for a unit-less string value without uncertainty,
+            a bare number when the value is the only thing to store, None
+            when there is no value, data or uncertainty, else a dict.
+        """
+        v = self.value
+        u = self.uncertainty
+        unit = self.unit
+        data = self.data
+        # String with no extra metadata → bare string
+        if isinstance(v, str) and u is None and not unit:
+            return v
+        d: dict[str, Any] = {}
+        if v is not None:
+            d["value"] = v
+        if data is not None:
+            d["data"] = data
+        if u is not None:
+            d["uncertainty"] = u
+        if unit:
+            d["unit"] = unit
+        # Display metadata is written only when it differs from its default.
+        if self.unit_math and self.unit_math != unit:
+            d["unit_math"] = self.unit_math
+        sym = self.symbol
+        if sym and sym != self._name:
+            d["symbol"] = sym
+        if self.symbol_math and self.symbol_math != (sym or self._name):
+            d["symbol_math"] = self.symbol_math
+        if self.precision:
+            d["precision"] = self.precision
+        if self.precision_unc and self.precision_unc != self.precision:
+            d["precision_unc"] = self.precision_unc
+        if not d:
+            return None
+        # Only metadata and no actual data → skip
+        data_keys = {"value", "data", "uncertainty"}
+        if not (set(d.keys()) & data_keys):
+            return None
+        # Only value and it's numeric → bare scalar
+        if list(d.keys()) == ["value"] and isinstance(v, (int, float)):
+            return v
+        return d
+    def from_yaml(self, raw: Any):
+        """Populate this Property from a YAML value (scalar or dict).
+        Parameters
+        ----------
+        raw : Any
+            A bare scalar (taken as the value) or a dict that may carry
+            ``value``, ``data``, ``uncertainty``, ``unit`` and the display
+            metadata keys ``unit_math``, ``symbol``, ``symbol_math``,
+            ``precision`` and ``precision_unc``.
+        """
+        explicit_unit_math = False
+        if isinstance(raw, dict):
+            data = {
+                "value": raw.get("value"),
+                "uncertainty": raw.get("uncertainty"),
+                "unit": raw.get("unit"),
+                "data": raw.get("data"),
+            }
+            # Metadata fields
+            if raw.get("unit_math") is not None:
+                self.unit_math = raw["unit_math"]
+                explicit_unit_math = True
+            if raw.get("symbol") is not None:
+                self.symbol = raw["symbol"]
+            if raw.get("symbol_math") is not None:
+                self.symbol_math = raw["symbol_math"]
+            if raw.get("precision") is not None:
+                self.precision = raw["precision"]
+            if raw.get("precision_unc") is not None:
+                self.precision_unc = raw["precision_unc"]
+        else:
+            data = {"value": raw}
+        # Data list takes priority (value/uncertainty will be computed from it)
+        if data.get("data") is not None:
+            self.value = data["data"]
+        elif data.get("value") is not None:
+            # A computed property keeps its callable; the stored number only
+            # pre-fills the cache.
+            if self.is_computed:
+                self._seed_cache(value=data["value"])
+            else:
+                self.value = data["value"]
+        if data.get("uncertainty") is not None:
+            if self._compute_unc is not None:
+                self._seed_cache(uncertainty=data["uncertainty"])
+            else:
+                self.uncertainty = data["uncertainty"]
+        if data.get("unit") is not None:
+            # Remember the old unit BEFORE overwriting it: unit_math must
+            # follow the new unit when it is empty or was only mirroring the
+            # old one, but not when it was customised or supplied explicitly.
+            previous_unit = self.unit
+            self.unit = data["unit"]
+            mirrors_old_unit = (
+                not explicit_unit_math and self.unit_math == previous_unit
+            )
+            if not self.unit_math or mirrors_old_unit:
+                self.unit_math = data["unit"]

samplekit/report.py ADDED Viewed

@@ -0,0 +1,214 @@
+"""Rendering utilities — markdown tables, property tables, Table rendering."""
+from __future__ import annotations
+from typing import TYPE_CHECKING
+if TYPE_CHECKING:
+    from .property import Property
+    from .sample import Sample
+    from .table import Table
+# Characters that need escaping inside $...$ (LaTeX math mode)
+# Translation table for str.translate: each key is replaced by its backslash-escaped form.
+_LATEX_SPECIAL = str.maketrans({"#": r"\#", "%": r"\%", "&": r"\&", "_": r"\_"})
+import re
+# Matches a whole string in scientific notation: group 1 is the optionally
+# signed decimal mantissa, group 2 the optionally signed integer exponent.
+_SCI_RE = re.compile(r'^([+-]?\d+(?:\.\d+)?)[eE]([+-]?\d+)$')
+def _math_sci(s: str) -> str:
+    """Rewrite scientific notation for math mode: '9e-07' → '9 \\times 10^{-7}'.
+    Text that is not in scientific notation is returned unchanged.
+    """
+    parsed = _SCI_RE.match(s.strip())
+    if parsed is None:
+        return s
+    mantissa, exponent_text = parsed.groups()
+    # int() drops the leading zeros and the plus sign of the exponent.
+    exponent = int(exponent_text)
+    return mantissa + " \\times 10^{" + str(exponent) + "}"
+# ════════════════════════════════════════════════════════════
+# Property formatting
+# ════════════════════════════════════════════════════════════
+def format_property(prop: Property, style: str = "text", unit: bool = True) -> str:
+    """Render a Property as plain text or inline math.
+    Parameters
+    ----------
+    prop : Property
+    style : "text" or "math"
+        "text" → delegates to ``prop.format`` (e.g. ``25.0 ± 0.5 °C``)
+        "math" → inline math (e.g. ``$25.0 \\pm 0.5$ $°C$``)
+    unit : bool
+        Include unit in output.
+    """
+    if style != "math":
+        return prop.format(unit=unit)
+    value = prop.value
+    if value is None:
+        return "N/A"
+    if isinstance(value, str):
+        # String values stay outside math mode and use the plain unit.
+        with_unit = unit and prop.unit and prop.unit != "-"
+        return f"{value} {prop.unit}" if with_unit else value
+    unc = prop.uncertainty
+    body = _math_sci(f"{value:{prop.precision}}")
+    if unc is not None and unc != 0:
+        body = f"{body} \\pm " + _math_sci(f"{unc:{prop.precision_unc}}")
+    rendered = f"${body}$"
+    if not (unit and prop.unit and prop.unit != "-"):
+        return rendered
+    # The unit gets its own $...$ span, with LaTeX specials escaped.
+    return f"{rendered} ${prop.unit_math.translate(_LATEX_SPECIAL)}$"
+# ════════════════════════════════════════════════════════════
+# Generic markdown table
+# ════════════════════════════════════════════════════════════
+def markdown_table(
+    rows: list[list[str]],
+    headers: list[str],
+    align: list[str] | None = None,
+) -> str:
+    """Generate a markdown table.
+    Parameters
+    ----------
+    rows : list of list of str
+        Table data. Cells are converted with ``str()``, so non-string cells
+        are accepted too.
+    headers : list of str
+        Column headers.
+    align : list of str, optional
+        Per-column alignment: "l", "c", "r". Defaults to center. A list
+        shorter than ``headers`` is padded with "c" and a longer one is
+        truncated, so the separator row always has one entry per header.
+    Returns
+    -------
+    str
+        Header row, separator row and data rows joined by newlines.
+    """
+    ncols = len(headers)
+    # Normalise the alignment list to exactly one spec per header column;
+    # a separator row of a different width breaks the table.
+    specs = list(align or [])[:ncols]
+    specs.extend(["c"] * (ncols - len(specs)))
+    header_row = "| " + " | ".join(headers) + " |"
+    sep_map = {"l": ":---", "r": "---:", "c": ":---:"}
+    # Unknown alignment codes fall back to centered.
+    sep_row = "| " + " | ".join(sep_map.get(a, ":---:") for a in specs) + " |"
+    data_rows = "\n".join(
+        "| " + " | ".join(str(cell) for cell in row) + " |" for row in rows
+    )
+    return f"{header_row}\n{sep_row}\n{data_rows}"
+# ════════════════════════════════════════════════════════════
+# Property table
+# ════════════════════════════════════════════════════════════
+def properties_table(
+    sample: Sample,
+    names: list[str],
+    headers: list[str] | None = None,
+    style: str = "math",
+    align: list[str] | None = None,
+) -> str:
+    """Build a markdown table of the chosen scalar properties.
+    Parameters
+    ----------
+    sample : Sample
+    names : list of property names to include; names that are missing from
+        the sample, or whose value is None, are skipped
+    headers : column headers (default: ["Property", "Value", "Unit"])
+    style : "math" or "text"
+    align : per-column alignment passed on to ``markdown_table``
+        (default: centered)
+    """
+    column_titles = headers or ["Property", "Value", "Unit"]
+    use_math = style == "math"
+    available = sample.props
+    body = []
+    for key in names:
+        entry = available.get(key)
+        if entry is None or entry.value is None:
+            continue
+        if use_math:
+            label = entry.symbol_math or entry.symbol or key
+            label_cell = f"${label}$"
+        else:
+            label_cell = entry.symbol or key
+        # The unit has its own column, so the value cell is rendered without it.
+        value_cell = format_property(entry, style, unit=False)
+        if use_math and entry.unit:
+            unit_cell = f"${entry.unit_math.translate(_LATEX_SPECIAL)}$"
+        else:
+            unit_cell = entry.unit
+        body.append([label_cell, value_cell, unit_cell])
+    alignment = align or ["c"] * len(column_titles)
+    return markdown_table(body, column_titles, alignment)
+# ════════════════════════════════════════════════════════════
+# Table rendering
+# ════════════════════════════════════════════════════════════
+def _col_header(col_name: str, col, style: str) -> str:
+    """Compose a column header: the symbol, plus "(unit)" when a unit exists.
+    Falls back to ``col_name`` when ``col`` is falsy or defines no symbol.
+    A unit that is empty or "-" is not shown.
+    """
+    use_math = style == "math"
+    label = col_name
+    if col:
+        preferred = (col.symbol_math or col.symbol) if use_math else col.symbol
+        label = preferred or col_name
+    header = f"${label}$" if use_math else label
+    if not (col and col.unit and col.unit != "-"):
+        return header
+    if use_math:
+        unit_part = f"${col.unit_math.translate(_LATEX_SPECIAL)}$"
+    else:
+        unit_part = col.unit
+    return f"{header} ({unit_part})"
+def table_to_markdown(
+    table: Table,
+    style: str = "math",
+    columns: list[str] | None = None,
+    index_label: str | None = None,
+    align: list[str] | None = None,
+) -> str:
+    """Convert a Table into a markdown table, one line per index value.
+    Parameters
+    ----------
+    table : Table
+    style : "math" or "text"
+    columns : list of column names to include (default: ``table.data_columns``)
+    index_label : override for the index column header
+    align : per-column alignment passed on to ``markdown_table``
+        (default: centered)
+    """
+    use_math = style == "math"
+    selected = columns or table.data_columns
+    # First header cell: the explicit label wins over the index column's own header.
+    if index_label:
+        first_header = index_label
+    else:
+        first_header = _col_header(table.index, table.columns.get(table.index), style)
+    header_cells = [first_header]
+    header_cells.extend(
+        _col_header(col_name, table.columns.get(col_name), style)
+        for col_name in selected
+    )
+    body = []
+    for key in table.index_values:
+        cells = [f"${key}$" if use_math else str(key)]
+        record = table(key)
+        for col_name in selected:
+            # A cell that is missing or cannot be formatted is shown as "N/A".
+            try:
+                rendered = format_property(record[col_name], style, unit=False)
+            except (KeyError, AttributeError):
+                rendered = "N/A"
+            cells.append(rendered)
+        body.append(cells)
+    alignment = align or ["c"] * len(header_cells)
+    return markdown_table(body, header_cells, alignment)
+# ════════════════════════════════════════════════════════════
+# Heading helper
+# ════════════════════════════════════════════════════════════
+def heading(text: str, level: int = 2) -> str:
+    """Return ``text`` as a markdown heading line with ``level`` leading '#' marks."""
+    marks = "#" * level
+    return "{} {}\n".format(marks, text)