morphgen-rates 0.3.0__py3-none-any.whl → 0.5.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
morphgen_rates/__init__.py CHANGED
@@ -1,3 +1,4 @@
  from .rates import compute_rates
  from .data import get_data
- __all__ = ["compute_rates", "get_data"]
+ from .init_count import compute_init_number_probs
+ __all__ = ["compute_rates", "get_data", "compute_init_number_probs"]
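With this release, all three public entry points are importable from the package root. A one-line sanity check of the new surface (nothing assumed here beyond the names exported in `__all__` above):

    # Confirm the expanded public API of morphgen-rates 0.5.0.
    from morphgen_rates import compute_rates, get_data, compute_init_number_probs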
morphgen_rates/data.py CHANGED
@@ -22,85 +22,81 @@ def _local_data_path(filename='morph_data', ext="csv"):
  return work_dir / f"{filename}.{ext}"


- def get_data(key):
+ def get_data(area, neuron_type):
  """
- Retrieve a dataset entry using a key-path of the form
- "<brain region>/<neuron class>/<subcellular section>".
+ Retrieve summary morphology statistics for a given brain area and neuron class.

- The argument `data_path` is interpreted as a slash-separated path of keys used
- to traverse a nested dataset dictionary. The selected dataset is expected to
- contain both Sholl-plot statistics and bifurcation statistics; when both are
- available, this function returns a standardized dictionary compatible with
- `compute_rates`.
+ This function loads a local CSV dataset, filters rows matching the requested
+ `area` and `neuron_type`, and aggregates statistics by `section_type`. The
+ output is a nested dictionary keyed by section type (e.g., soma, apical, basal),
+ containing:
+
+ - Summary statistics for bifurcation counts and total length
+ - Estimated number of primary neurites at the soma (Count0)
+ - Sholl plot summary statistics (bin size, mean counts, standard deviation)

  Parameters
  ----------
- key : str
- Dataset identifier expressed as a key path:
-
- "<brain region>/<neuron class>/<subcellular section>"
-
- Examples:
- - "CTX/pyr/apical"
- - "HPC/pyr/basal"
-
- Each component is used as a successive key lookup into the nested dataset
- container.
+ area : str
+ Brain region identifier used in the dataset (must match values in the
+ 'area' column of the CSV)
+ neuron_type : str
+ Neuron class identifier used in the dataset (must match values in the
+ 'neuron_type' column of the CSV)

  Returns
  -------
  dict
- If both Sholl and bifurcation information are present for the selected dataset,
- returns:
+ Nested dictionary structured as:

  data = {
- "sholl": {
- "bin_size": float,
- "mean": numpy.ndarray, # shape (K,)
- "var": numpy.ndarray, # shape (K,)
- },
- "bifurcations": {
- "mean": float,
- "var": float,
+ "<section_type>": {
+ "bifurcation_count": {"mean": ..., "std": ..., "min": ..., "max": ...},
+ "total_length": {"mean": ..., "std": ..., "min": ..., "max": ...},
+ "primary_count": {"mean": ..., "std": ..., "min": ..., "max": ...},
+ "sholl_plot": {
+ "bin_size": float,
+ "mean": list[float],
+ "std": list[float],
+ },
  },
+ ...
  }

- Where:
- - `data["sholl"]["bin_size"]` is the spatial bin size used to define Sholl shells
- - `data["sholl"]["mean"]` is the mean Sholl intersection count per radial bin
- - `data["sholl"]["var"]` is the variance of the Sholl intersection count per bin
- - `data["bifurcations"]["mean"]` is the mean bifurcation count
- - `data["bifurcations"]["var"]` is the variance of the bifurcation count
+ Notes on fields:
+ - `primary_count` corresponds to the row group labeled 'Count0'
+ - Sholl values are collected from rows whose metric name starts with 'Count'
+ (including 'Count0'); users may want to interpret/plot them as a function
+ of radial bin index multiplied by `bin_size`

  Raises
  ------
- KeyError
- If any key along `data_path` is missing (brain region, neuron class, or section)
- ValueError
- If the selected dataset does not contain both Sholl and bifurcation data, or
- if the provided arrays have incompatible shapes
+ AssertionError
+ If no rows match the requested `area` and `neuron_type`

  Notes
  -----
- - `data_path` is a *key path*, not a filesystem path
- - The function assumes the dataset entry referenced by `data_path` includes:
- - Sholl bin size, mean array, variance array
- - Bifurcation mean and variance
+ - The function expects the local CSV to include at least the following columns:
+ 'area', 'neuron_type', 'neuron_name', 'section_type', 'bin_size'
+ plus metric columns including:
+ - 'bifurcation_count'
+ - 'total_length'
+ - 'Count0', 'Count1', ... (Sholl counts per radial bin)
+ - Statistics are computed using `pandas.DataFrame.groupby(...).describe()`.
+ Only the summary columns 'mean', 'std', 'min', 'max' are retained.

  Examples
  --------
- >>> data = get("CTX/pyr/apical")
- >>> data["sholl"]["bin_size"]
+ >>> data = get_data("CTX", "pyr")
+ >>> data["apical"]["bifurcation_count"]["mean"]
+ 42.0
+ >>> data["apical"]["sholl_plot"]["bin_size"]
  50.0
- >>> data["bifurcations"]["mean"]
- 12.3
+ >>> len(data["apical"]["sholl_plot"]["mean"])
+ 20
  """
+
  data = {}

- # split the key
- parts = tuple(p.strip() for p in key.split("/") if p.strip())
- if len(parts) != 2:
- raise ValueError(f"Expected key like 'area/neuron_type', got: {key!r}")
- area, neuron_type = parts

  # load data
@@ -108,6 +104,9 @@ def get_data(key):

  # select specific area and neuron type
  df = df[(df['area'] == area) & (df['neuron_type'] == neuron_type)]
+
+ # ensure the requested area and neuron_type exist in the dataset
+ assert df.shape[0] > 0, f"The area {area} or neuron type {neuron_type} is not known"

  # neuron name unnecessary
  df.drop(['area', 'neuron_type', 'neuron_name'], axis=1, inplace=True)
@@ -122,8 +121,6 @@ def get_data(key):
  for section_type, row in df.iterrows():
  data[section_type] = {}

- print()
-
  # get statistics
  for data_type in ['bifurcation_count', 'total_length']:
  tmp = row.loc[row.index.get_level_values(0) == data_type, :]
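For orientation, here is a minimal sketch of how the reworked `get_data` might be used, following the nested structure documented above. The `"CTX"`/`"pyr"` identifiers and the printed fields are illustrative assumptions, not guaranteed contents of the bundled CSV:

    from morphgen_rates import get_data

    # Aggregated morphology statistics for one area/neuron class;
    # identifiers must match the CSV's 'area' and 'neuron_type' columns.
    data = get_data("CTX", "pyr")

    for section_type, stats in data.items():
        bif = stats["bifurcation_count"]   # {"mean", "std", "min", "max"}
        sholl = stats["sholl_plot"]        # {"bin_size", "mean", "std"}
        # Sholl radii: bin index times bin size, as suggested in the docstring.
        radii = [i * sholl["bin_size"] for i in range(len(sholl["mean"]))]
        print(section_type, bif["mean"], radii[:3])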
morphgen_rates/init_count.py ADDED
@@ -0,0 +1,208 @@
+ from __future__ import annotations
+
+ from typing import Dict, Optional, Sequence, Union
+
+ import numpy as np
+ import pyomo.environ as pyo
+
+
+ def compute_init_number_probs(
+ mean_primary_dendrites: float,
+ sd_primary_dendrites: float,
+ min_primary_dendrites: int,
+ max_primary_dendrites: int,
+ *,
+ support_values: Optional[Sequence[float]] = None,
+ epsilon: float = 1e-12,
+ slack_penalty: float = 1e-1,
+ use_variance_form: bool = True,
+ use_abs_slack: bool = False,
+ solver: str = "ipopt",
+ solver_options: Optional[Dict[str, Union[str, int, float]]] = None,
+ ) -> np.ndarray:
+ """
+ Maximum-entropy PMF for the (discrete) number of primary dendrites.
+
+ This returns a numpy array p of length n = max_primary_dendrites + 1, where:
+ - p[i] is the probability of observing i primary dendrites
+ - p[i] = 0 for i < min_primary_dendrites or i > max_primary_dendrites
+
+ The distribution is obtained by maximizing Shannon entropy:
+ H(p) = -sum_i p[i] * log(p[i])
+
+ Subject to:
+ - Normalization: sum_{i in [min,max]} p[i] = 1
+ - Soft mean constraint (with slack):
+ sum i*p[i] - mean_primary_dendrites = slack_mean
+ - Soft dispersion constraint (with slack):
+ If use_variance_form=True (recommended):
+ sum (i-mean)^2 * p[i] - (sd_primary_dendrites^2) = slack_disp
+ If use_variance_form=False:
+ sqrt( sum (i-mean)^2 * p[i] + tiny ) - sd_primary_dendrites = slack_disp
+
+ The objective is penalized to keep slacks small:
+ maximize H(p) - slack_penalty * (slack terms)
+
+ Parameters
+ ----------
+ mean_primary_dendrites : float
+ Target mean number of primary dendrites
+ sd_primary_dendrites : float
+ Target standard deviation (>= 0)
+ min_primary_dendrites : int
+ Minimum allowed dendrite count (inclusive)
+ max_primary_dendrites : int
+ Maximum allowed dendrite count (inclusive). Also sets array length n=max+1
+
+ Keyword-only parameters
+ -----------------------
+ support_values : Sequence[float] | None
+ Optional support for indices 0..max. If None, uses support=i (integers).
+ Keep this None if you truly mean "i is the dendrite count".
+ epsilon : float
+ Lower bound on active probabilities to avoid log(0)
+ slack_penalty : float
+ Larger values enforce closer moment matching
+ use_variance_form : bool
+ Recommended True: match variance to sd^2 (smoother than sqrt constraint)
+ use_abs_slack : bool
+ If True, use L1-like slack penalty via +/- variables; otherwise squared (smooth)
+ solver : str
+ Nonlinear solver name (typically "ipopt")
+ solver_options : dict | None
+ Passed to the solver (e.g., {"max_iter": 5000})
+
+ Returns
+ -------
+ np.ndarray
+ Probability vector p with length max_primary_dendrites + 1
+
+ Raises
+ ------
+ ValueError
+ For invalid inputs
+ RuntimeError
+ If the requested solver is not available
+ """
+ if max_primary_dendrites < 0:
+ raise ValueError("max_primary_dendrites must be >= 0")
+ if sd_primary_dendrites < 0:
+ raise ValueError("sd_primary_dendrites must be nonnegative")
+ if not (0 <= min_primary_dendrites <= max_primary_dendrites):
+ raise ValueError("Require 0 <= min_primary_dendrites <= max_primary_dendrites")
+ if slack_penalty <= 0:
+ raise ValueError("slack_penalty must be positive")
+ if epsilon <= 0:
+ raise ValueError("epsilon must be positive")
+
+ n = max_primary_dendrites + 1
+ active = list(range(min_primary_dendrites, max_primary_dendrites + 1))
+
+ # Support values for each index i (default: i itself)
+ if support_values is None:
+ support_values = list(range(n))
+ if len(support_values) != n:
+ raise ValueError("support_values must have length n = max_primary_dendrites + 1")
+
+ support = {i: float(support_values[i]) for i in range(n)}
+ mu = float(mean_primary_dendrites)
+ sd = float(sd_primary_dendrites)
+ target_var = sd * sd
+
+ # -----------------------------
+ # Pyomo model
+ # -----------------------------
+ m = pyo.ConcreteModel()
+ m.A = pyo.Set(initialize=active, ordered=True)
+
+ # Decision variables for active probabilities only
+ m.p = pyo.Var(m.A, domain=pyo.NonNegativeReals, bounds=(epsilon, 1.0))
+
+ # Normalization over active set
+ m.norm = pyo.Constraint(expr=sum(m.p[i] for i in m.A) == 1.0)
+
+ # Moment expressions
+ mean_expr = sum(support[i] * m.p[i] for i in m.A)
+ var_expr = sum((support[i] - mu) ** 2 * m.p[i] for i in m.A)
+
+ # Soft constraints with slack
+ if use_abs_slack:
+ # L1 slack via +/- decomposition
+ m.s_mean_pos = pyo.Var(domain=pyo.NonNegativeReals)
+ m.s_mean_neg = pyo.Var(domain=pyo.NonNegativeReals)
+ m.s_disp_pos = pyo.Var(domain=pyo.NonNegativeReals)
+ m.s_disp_neg = pyo.Var(domain=pyo.NonNegativeReals)
+
+ m.mean_soft = pyo.Constraint(expr=mean_expr - mu == m.s_mean_pos - m.s_mean_neg)
+
+ if use_variance_form:
+ m.disp_soft = pyo.Constraint(expr=var_expr - target_var == m.s_disp_pos - m.s_disp_neg)
+ else:
+ tiny = 1e-18
+ m.disp_soft = pyo.Constraint(
+ expr=pyo.sqrt(var_expr + tiny) - sd == m.s_disp_pos - m.s_disp_neg
+ )
+
+ slack_term = (m.s_mean_pos + m.s_mean_neg) + (m.s_disp_pos + m.s_disp_neg)
+
+ else:
+ # Smooth squared slacks
+ m.s_mean = pyo.Var(domain=pyo.Reals)
+ m.s_disp = pyo.Var(domain=pyo.Reals)
+
+ m.mean_soft = pyo.Constraint(expr=mean_expr - mu == m.s_mean)
+
+ if use_variance_form:
+ m.disp_soft = pyo.Constraint(expr=var_expr - target_var == m.s_disp)
+ else:
+ tiny = 1e-18
+ m.disp_soft = pyo.Constraint(expr=pyo.sqrt(var_expr + tiny) - sd == m.s_disp)
+
+ slack_term = m.s_mean**2 + m.s_disp**2
+
+ # Entropy objective (active probs only; inactive probs are exactly 0)
+ entropy = -sum(m.p[i] * pyo.log(m.p[i]) for i in m.A)
+ m.obj = pyo.Objective(expr=entropy - float(slack_penalty) * slack_term, sense=pyo.maximize)
+
+ # Solve
+ opt = pyo.SolverFactory(solver)
+ if opt is None or not opt.available():
+ raise RuntimeError(
+ f"Solver '{solver}' is not available. Install/configure it (e.g., ipopt) "
+ "or pass a different solver name."
+ )
+ if solver_options:
+ for k, v in solver_options.items():
+ opt.options[k] = v
+
+ res = opt.solve(m, tee=False)
+
+ # -----------------------------
+ # Extract solution into numpy array
+ # -----------------------------
+ p = np.zeros(n, dtype=float)
+ for i in active:
+ p[i] = float(pyo.value(m.p[i]))
+
+ # Optional: renormalize tiny numerical drift (keeps zeros outside band)
+ s = p.sum()
+ if s > 0:
+ p[active] /= s
+
+ return p
+
+
+ if __name__ == "__main__":
+ p = compute_init_number_probs(
+ mean_primary_dendrites=2.33,
+ sd_primary_dendrites=1.53,
+ min_primary_dendrites=1,
+ max_primary_dendrites=4,
+ slack_penalty=0.1,
+ use_variance_form=True,
+ use_abs_slack=False,
+ solver="ipopt",
+ )
+ print("p shape:", p.shape)
+ print("sum:", p.sum())
+ print(p)
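To see the maximum-entropy construction in action, the sketch below checks that the returned PMF is normalized, respects the [min, max] band, and roughly matches the requested moments. It assumes ipopt is installed, and the target values (mean 3.0, sd 1.2 over counts 1..6) are illustrative; the match is only approximate because the moment constraints are soft:

    import numpy as np
    from morphgen_rates import compute_init_number_probs

    # PMF over counts 0..6, constrained to the band [1, 6].
    p = compute_init_number_probs(
        mean_primary_dendrites=3.0,
        sd_primary_dendrites=1.2,
        min_primary_dendrites=1,
        max_primary_dendrites=6,
    )

    i = np.arange(p.size)
    mean = float((i * p).sum())
    sd = float(np.sqrt(((i - mean) ** 2 * p).sum()))

    assert abs(p.sum() - 1.0) < 1e-9   # normalization
    assert p[0] == 0.0                 # zero outside the allowed band
    print(f"mean={mean:.3f}, sd={sd:.3f}")  # near the soft targets 3.0 / 1.2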
{morphgen_rates-0.3.0.dist-info → morphgen_rates-0.5.0.dist-info}/METADATA RENAMED
@@ -1,6 +1,6 @@
  Metadata-Version: 2.4
  Name: morphgen-rates
- Version: 0.3.0
+ Version: 0.5.0
  Summary: Compute bifurcation and annihilation rates from morphology data
  Author-email: Francesco Cavarretta <fcavarretta@ualr.edu>
  Requires-Python: >=3.9
morphgen_rates-0.5.0.dist-info/RECORD ADDED
@@ -0,0 +1,9 @@
+ morphgen_rates/__init__.py,sha256=UE8YWsulDIfeYhGb5GHdkakUIFx4j9H3ZkoKoaDCd_0,179
+ morphgen_rates/data.py,sha256=Onc2dRlB_QXpgScDzHCE7DRtg6PLtFld5W91QGuDkYo,4518
+ morphgen_rates/init_count.py,sha256=PhYlp0-CzRdf8opTKb-om3cFIKSv5M8eTcyKy1_IFMI,7283
+ morphgen_rates/rates.py,sha256=2Gn3Ew2uVJ7c_LdYJogxS-jAM9q-039y0maWi4CNpTM,6442
+ morphgen_rates-0.5.0.dist-info/licenses/LICENSE,sha256=VONsnKVXQRcWwCaHWHuwMtemIj9jNJSmpunazxlyvOk,670
+ morphgen_rates-0.5.0.dist-info/METADATA,sha256=xYYNva-7mn6Vk-iFKKJJUg3jw_phgW-iZvHeSd4z7gk,1178
+ morphgen_rates-0.5.0.dist-info/WHEEL,sha256=wUyA8OaulRlbfwMtmQsvNngGrxQHAvkKcvRmdizlJi0,92
+ morphgen_rates-0.5.0.dist-info/top_level.txt,sha256=UYPGC2dGp9xD_4iVxVVTkKaizBA4XeDNM7OBC_DCWRk,15
+ morphgen_rates-0.5.0.dist-info/RECORD,,
morphgen_rates-0.3.0.dist-info/RECORD DELETED
@@ -1,8 +0,0 @@
- morphgen_rates/__init__.py,sha256=p347dyzb_8MuKdh4YUIrZOmdctfd-9xEhUJU9XOOVdU,100
- morphgen_rates/data.py,sha256=yj_GT3ks6ukwtALfC4Bklcwu3MeTOr-2BGGo5W0ZxM0,4330
- morphgen_rates/rates.py,sha256=2Gn3Ew2uVJ7c_LdYJogxS-jAM9q-039y0maWi4CNpTM,6442
- morphgen_rates-0.3.0.dist-info/licenses/LICENSE,sha256=VONsnKVXQRcWwCaHWHuwMtemIj9jNJSmpunazxlyvOk,670
- morphgen_rates-0.3.0.dist-info/METADATA,sha256=4umattnyl1InefhNOyEE0KXkqhLt_Y9PSimPO0qimRk,1178
- morphgen_rates-0.3.0.dist-info/WHEEL,sha256=wUyA8OaulRlbfwMtmQsvNngGrxQHAvkKcvRmdizlJi0,92
- morphgen_rates-0.3.0.dist-info/top_level.txt,sha256=UYPGC2dGp9xD_4iVxVVTkKaizBA4XeDNM7OBC_DCWRk,15
- morphgen_rates-0.3.0.dist-info/RECORD,,