mergeron 2025.739290.4__tar.gz → 2025.739290.6__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release: this version of mergeron might be problematic.

Files changed (26)
  1. {mergeron-2025.739290.4 → mergeron-2025.739290.6}/PKG-INFO +1 -1
  2. {mergeron-2025.739290.4 → mergeron-2025.739290.6}/pyproject.toml +4 -4
  3. {mergeron-2025.739290.4 → mergeron-2025.739290.6}/src/mergeron/__init__.py +84 -41
  4. {mergeron-2025.739290.4 → mergeron-2025.739290.6}/src/mergeron/core/__init__.py +3 -3
  5. {mergeron-2025.739290.4 → mergeron-2025.739290.6}/src/mergeron/core/empirical_margin_distribution.py +38 -38
  6. {mergeron-2025.739290.4 → mergeron-2025.739290.6}/src/mergeron/core/ftc_merger_investigations_data.py +23 -34
  7. {mergeron-2025.739290.4 → mergeron-2025.739290.6}/src/mergeron/core/guidelines_boundaries.py +27 -38
  8. {mergeron-2025.739290.4 → mergeron-2025.739290.6}/src/mergeron/core/guidelines_boundary_functions.py +6 -6
  9. {mergeron-2025.739290.4 → mergeron-2025.739290.6}/src/mergeron/core/guidelines_boundary_functions_extra.py +2 -4
  10. {mergeron-2025.739290.4 → mergeron-2025.739290.6}/src/mergeron/core/pseudorandom_numbers.py +16 -16
  11. mergeron-2025.739290.6/src/mergeron/data/__init__.py +57 -0
  12. mergeron-2025.739290.6/src/mergeron/data/ftc_merger_investigations_data.zip +0 -0
  13. {mergeron-2025.739290.4 → mergeron-2025.739290.6}/src/mergeron/demo/visualize_empirical_margin_distribution.py +5 -2
  14. {mergeron-2025.739290.4 → mergeron-2025.739290.6}/src/mergeron/gen/__init__.py +41 -20
  15. {mergeron-2025.739290.4 → mergeron-2025.739290.6}/src/mergeron/gen/data_generation.py +14 -16
  16. {mergeron-2025.739290.4 → mergeron-2025.739290.6}/src/mergeron/gen/enforcement_stats.py +24 -23
  17. {mergeron-2025.739290.4 → mergeron-2025.739290.6}/src/mergeron/gen/upp_tests.py +1 -1
  18. mergeron-2025.739290.4/src/mergeron/data/damodaran_margin_data_serialized.zip +0 -0
  19. mergeron-2025.739290.4/src/mergeron/data/ftc_invdata.msgpack +0 -0
  20. mergeron-2025.739290.4/src/mergeron/data/ftc_invdata.zip +0 -0
  21. mergeron-2025.739290.4/src/mergeron/demo/__init__.py +0 -3
  22. {mergeron-2025.739290.4 → mergeron-2025.739290.6}/README.rst +0 -0
  23. {mergeron-2025.739290.4 → mergeron-2025.739290.6}/src/mergeron/data/damodaran_margin_data.xls +0 -0
  24. {mergeron-2025.739290.4/src/mergeron/data → mergeron-2025.739290.6/src/mergeron/demo}/__init__.py +0 -0
  25. {mergeron-2025.739290.4 → mergeron-2025.739290.6}/src/mergeron/gen/data_generation_functions.py +0 -0
  26. {mergeron-2025.739290.4 → mergeron-2025.739290.6}/src/mergeron/py.typed +0 -0
@@ -1,6 +1,6 @@
  Metadata-Version: 2.3
  Name: mergeron
- Version: 2025.739290.4
+ Version: 2025.739290.6
  Summary: Analyze merger enforcement policy using Python
  License: MIT
  Keywords: merger policy analysis,merger guidelines,merger screening,policy presumptions,concentration standards,upward pricing pressure,GUPPI
@@ -13,7 +13,7 @@ keywords = [
      "upward pricing pressure",
      "GUPPI",
  ]
- version = "2025.739290.4"
+ version = "2025.739290.6"

  # Classifiers list: https://pypi.org/classifiers/
  classifiers = [
@@ -68,11 +68,11 @@ pendulum = ">=3.0.0"
  ruff = ">=0.5"
  poetry-plugin-export = "^1.8.0"
  pytest = ">=8.0"
- Sphinx = ">=7.2, <8.0"
+ sphinx = ">8.2"
  semver = ">=3.0"
  sphinx-autodoc-typehints = ">=2.0.0"
- sphinx-autoapi = ">=3.0"
- sphinx-immaterial = ">=0.11"
+ sphinx-autoapi = ">=3.6.0"
+ sphinx-immaterial = ">0.11"
  pipdeptree = ">=2.15.1"
  types-openpyxl = ">=3.0.0"
  virtualenv = ">=20.28.0"
@@ -12,18 +12,20 @@ from ruamel import yaml

  _PKG_NAME: str = Path(__file__).parent.stem

- VERSION = "2025.739290.4"
+ VERSION = "2025.739290.6"

  __version__ = VERSION

- DATA_DIR: Path = Path.home() / _PKG_NAME
+ WORK_DIR = globals().get("WORK_DIR", Path.home() / _PKG_NAME)
  """
- Defines a subdirectory named for this package in the user's home path.
+ If defined, the global variable WORK_DIR is used as a data store.

- If the subdirectory doesn't exist, it is created on package invocation.
+ If the user does not define WORK_DIR, a subdirectory in
+ the user's home directory, named for this package, is
+ created/reused.
  """
- if not DATA_DIR.is_dir():
-     DATA_DIR.mkdir(parents=False)
+ if not WORK_DIR.is_dir():
+     WORK_DIR.mkdir(parents=False)

  DEFAULT_REC_RATIO = 0.85

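A minimal standalone sketch of the new `WORK_DIR` fallback, assuming only the behavior visible in this hunk (`_PKG_NAME` is stood in by a literal here):

.. code-block:: python

    from pathlib import Path

    _PKG_NAME = "mergeron"  # stand-in for Path(__file__).parent.stem

    # Reuse a pre-existing WORK_DIR global if one is defined; else default to
    # a per-user subdirectory named for the package, creating it if needed.
    WORK_DIR = globals().get("WORK_DIR", Path.home() / _PKG_NAME)
    if not WORK_DIR.is_dir():
        WORK_DIR.mkdir(parents=False)
    print(WORK_DIR)  # e.g., /home/<user>/mergeron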
@@ -32,19 +34,18 @@ EMPTY_ARRAYINT = np.array([], int)

  NTHREADS = 2 * cpu_count()

- PKG_ENUMS_MAP: dict[str, object] = {}
  PKG_ATTRS_MAP: dict[str, object] = {}

  np.set_printoptions(precision=24, floatmode="fixed")

- type HMGPubYear = Literal[1982, 1984, 1992, 2010, 2023]
+ type HMGPubYear = Literal[1992, 2010, 2023]

  type ArrayBoolean = NDArray[np.bool_]
  type ArrayFloat = NDArray[np.floating]
- type ArrayINT = NDArray[np.unsignedinteger]
+ type ArrayINT = NDArray[np.integer]

  type ArrayDouble = NDArray[np.float64]
- type ArrayBIGINT = NDArray[np.uint64]
+ type ArrayBIGINT = NDArray[np.int64]


  this_yaml = yaml.YAML(typ="rt")
@@ -71,38 +72,27 @@ this_yaml.indent(mapping=2, sequence=4, offset=2)
  )


- @this_yaml.register_class
- class EnumYAMLized(enum.Enum):
-     @classmethod
-     def to_yaml(
-         cls, _r: yaml.representer.RoundTripRepresenter, _d: object[enum.EnumType]
-     ) -> yaml.ScalarNode:
-         return _r.represent_scalar(
-             f"!{super().__getattribute__(cls, '__name__')}", f"{_d.name}"
-         )
-
-     @classmethod
-     def from_yaml(
-         cls, _c: yaml.constructor.RoundTripConstructor, _n: yaml.ScalarNode
-     ) -> object[enum.EnumType]:
-         return super().__getattribute__(cls, _n.value)
-
-
  def yaml_rt_mapper(
      _c: yaml.constructor.RoundTripConstructor, _n: yaml.MappingNode
  ) -> Mapping[str, Any]:
+     """
+     Constructs a mapping from a mapping node with the RoundTripConstructor.
+     """
      data_: Mapping[str, Any] = yaml.constructor.CommentedMap()
      _c.construct_mapping(_n, maptyp=data_, deep=True)
      return data_


  def yamelize_attrs(
-     _typ: object,
-     excluded_attributes: set | None = None,
-     /,
-     *,
-     attr_map: Mapping[str, object] = PKG_ATTRS_MAP,
+     _typ: object, /, *, attr_map: Mapping[str, object] = PKG_ATTRS_MAP
  ) -> None:
+     """Add YAML representer and constructor for an attrs-defined class.
+
+     When this function is applied, attributes defined with `init=False`
+     are not serialized to YAML.
+     """
+
      attr_map |= {_typ.__name__: _typ}

      _ = this_yaml.representer.add_representer(
@@ -112,11 +102,7 @@ def yamelize_attrs(
          # construct mapping, rather than calling attrs.asdict(),
          # to use yaml representers defined in this package for
          # "upstream" objects
-         {
-             _a.name: getattr(_d, _a.name)
-             for _a in _d.__attrs_attrs__
-             if excluded_attributes is None or _a.name not in excluded_attributes
-         },
+         {_a.name: getattr(_d, _a.name) for _a in _d.__attrs_attrs__ if _a.init},
      ),
  )
  _ = this_yaml.constructor.add_constructor(
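For context, a self-contained sketch of what `yamelize_attrs` wires up, under the assumptions visible in this hunk (the `Point` class and its `!Point` tag are hypothetical): only `init=True` attributes are represented, and the constructor rebuilds the instance from the mapped fields, so derived attributes are recomputed on load.

.. code-block:: python

    import io

    import attrs
    from ruamel import yaml

    this_yaml = yaml.YAML(typ="rt")


    @attrs.frozen
    class Point:
        x: float = 0.0
        y: float = 0.0
        norm: float = attrs.field(init=False)

        @norm.default
        def _norm_default(self) -> float:
            return (self.x**2 + self.y**2) ** 0.5


    # Represent only init=True attributes, mirroring the comprehension above.
    this_yaml.representer.add_representer(
        Point,
        lambda _r, _d: _r.represent_mapping(
            "!Point",
            {_a.name: getattr(_d, _a.name) for _a in _d.__attrs_attrs__ if _a.init},
        ),
    )


    def _construct_point(_c, _n):
        data_ = yaml.constructor.CommentedMap()
        _c.construct_mapping(_n, maptyp=data_, deep=True)
        return Point(**data_)


    this_yaml.constructor.add_constructor("!Point", _construct_point)

    buf = io.StringIO()
    this_yaml.dump(Point(3.0, 4.0), buf)
    print(buf.getvalue())  # "norm" is omitted from the serialized mapping
    print(this_yaml.load(buf.getvalue()))  # Point(x=3.0, y=4.0, norm=5.0)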
@@ -125,19 +111,76 @@ def yamelize_attrs(
  )


+ @this_yaml.register_class
+ class Enameled(enum.Enum):
+     """Add YAML representer, constructor for enum.Enum"""
+
+     @classmethod
+     def to_yaml(
+         cls, _r: yaml.representer.RoundTripRepresenter, _d: object[enum.EnumType]
+     ) -> yaml.ScalarNode:
+         return _r.represent_scalar(
+             f"!{super().__getattribute__(cls, '__name__')}", f"{_d.name}"
+         )
+
+     @classmethod
+     def from_yaml(
+         cls, _c: yaml.constructor.RoundTripConstructor, _n: yaml.ScalarNode
+     ) -> object[enum.EnumType]:
+         return super().__getattribute__(cls, _n.value)
+
+
  @this_yaml.register_class
  @enum.unique
- class RECForm(str, EnumYAMLized):
-     """For derivation of recapture ratio from market shares."""
+ class RECForm(str, Enameled):
+     R"""For derivation of recapture ratio from market shares.
+
+     With :math:`\mathscr{N}` a set of firms, each supplying a
+     single differentiated product, and :math:`\mathscr{M} \subset \mathscr{N}`
+     a putative relevant product market, with
+     :math:`d_{ij}` denoting diversion ratio from good :math:`i` to good :math:`j`,
+     :math:`s_i` denoting market shares, and
+     :math:`\overline{r}` the default market recapture ratio,
+     market recapture ratios for the respective products may be specified
+     as having one of the following forms:
+     """
+
+     FIXED = "proportional"
+     R"""Given, :math:`\overline{r}`,
+
+     .. math::
+
+         REC_i = \overline{r} {\ } \forall {\ } i \in \mathscr{M}
+
+     """

      INOUT = "inside-out"
+     R"""
+     Given, :math:`\overline{r}, s_i {\ } \forall {\ } i \in \mathscr{M}`, with
+     :math:`s_{min} = \min(s_1, s_2)`,
+
+     .. math::
+
+         REC_i = \frac{\overline{r} (1 - s_i)}{1 - (1 - \overline{r}) s_{min} - \overline{r} s_i}
+         {\ } \forall {\ } i \in \mathscr{M}
+
+     """
+
      OUTIN = "outside-in"
-     FIXED = "proportional"
+     R"""
+     Given, :math:`d_{ij} {\ } \forall {\ } i, j \in \mathscr{M}, i \neq j`,
+
+     .. math::
+
+         REC_i = {\sum_{j \in \mathscr{M}}^{j \neq i} d_{ij}}
+         {\ } \forall {\ } i \in \mathscr{M}
+
+     """


  @this_yaml.register_class
  @enum.unique
- class UPPAggrSelector(str, EnumYAMLized):
+ class UPPAggrSelector(str, Enameled):
      """
      Aggregator for GUPPI and diversion ratio estimates.

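As a quick numerical check of the inside-out form added above (hypothetical shares): with :math:`\overline{r} = 0.85` and shares (0.20, 0.10), the smaller-share firm's recapture collapses to :math:`\overline{r}` exactly, since the :math:`s_i = s_{min}` terms cancel.

.. code-block:: python

    # Worked check of the INOUT (inside-out) recapture formula; shares are hypothetical.
    r_bar = 0.85
    s_1, s_2 = 0.20, 0.10
    s_min = min(s_1, s_2)


    def rec_inout(s_i: float) -> float:
        return (r_bar * (1 - s_i)) / (1 - (1 - r_bar) * s_min - r_bar * s_i)


    print(round(rec_inout(s_1), 4))  # 0.8344
    print(round(rec_inout(s_2), 4))  # 0.85; equals r_bar whenever s_i == s_min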
@@ -27,7 +27,7 @@ class INVTableData:
  type INVData = MappingProxyType[
      str, MappingProxyType[str, MappingProxyType[str, INVTableData]]
  ]
- type INVData_in_ = Mapping[str, Mapping[str, Mapping[str, INVTableData]]]
+ type INVData_in = Mapping[str, Mapping[str, Mapping[str, INVTableData]]]


  (_, _) = (
@@ -61,14 +61,14 @@ type INVData_in_ = Mapping[str, Mapping[str, Mapping[str, INVTableData]]]


  def _dict_from_mapping(_p: Mapping[Any, Any], /) -> dict[Any, Any]:
-     retval = {}
+     retval: dict[Any, Any] = {}
      for _k, _v in _p.items():  # for subit in it:
          retval |= {_k: _dict_from_mapping(_v)} if isinstance(_v, Mapping) else {_k: _v}
      return retval


  def _mappingproxy_from_mapping(_p: Mapping[Any, Any], /) -> MappingProxyType[Any, Any]:
-     retval = {}
+     retval: dict[Any, Any] = {}
      for _k, _v in _p.items():  # for subit in it:
          retval |= (
              {_k: _mappingproxy_from_mapping(_v)}
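A sketch of the recursive conversion consistent with the visible lines; the final wrapping step (not shown in this hunk) is assumed to be `MappingProxyType(retval)`:

.. code-block:: python

    from collections.abc import Mapping
    from types import MappingProxyType


    def _mappingproxy_from_mapping(_p):
        retval = {}
        for _k, _v in _p.items():
            retval |= (
                {_k: _mappingproxy_from_mapping(_v)} if isinstance(_v, Mapping) else {_k: _v}
            )
        return MappingProxyType(retval)  # assumed final wrapping step


    nested = _mappingproxy_from_mapping({"a": {"b": 1}})
    print(type(nested["a"]))  # <class 'mappingproxy'>
    # nested["a"]["b"] = 2 would raise TypeError: the views are read-only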
@@ -39,7 +39,6 @@ price-cost margins fall in the interval :math:`[0, 1]`.
  import shutil
  import zipfile
  from collections.abc import Mapping
- from importlib import resources
  from pathlib import Path
  from types import MappingProxyType

@@ -49,12 +48,17 @@ from numpy.random import PCG64DXSM, Generator, SeedSequence
  from scipy import stats  # type: ignore
  from xlrd import open_workbook  # type: ignore

- from .. import _PKG_NAME, DATA_DIR, VERSION, ArrayDouble, this_yaml  # noqa: TID252
+ from .. import VERSION, ArrayDouble, this_yaml  # noqa: TID252
+ from .. import WORK_DIR as PKG_WORK_DIR  # noqa: TID252
+ from .. import data as mdat  # noqa: TID252
  from . import _mappingproxy_from_mapping

  __version__ = VERSION

- MGNDATA_ARCHIVE_PATH = DATA_DIR / "damodaran_margin_data_serialized.zip"
+ WORK_DIR = globals().get("WORK_DIR", PKG_WORK_DIR)
+ """Redefined, in case the user defines WORK_DIR between module imports."""
+
+ MGNDATA_ARCHIVE_PATH = WORK_DIR / "damodaran_margin_data_serialized.zip"


  u3pm = urllib3.PoolManager()
@@ -71,21 +75,21 @@ def margin_data_getter( # noqa: PLR0912
          "This code is designed for parsing Prof. Damodaran's margin tables."
      )

-     data_archive_path_ = data_archive_path or MGNDATA_ARCHIVE_PATH
-     workbook_path_ = data_archive_path_.parent / f"damodaran_{_table_name}_data.xls"
-     if data_archive_path_.is_file() and not data_download_flag:
-         # with data_archive_path_.open("r") as _yfh:
-         #     margin_data_dict: dict[str, dict[str, float | int]] = this_yaml.load(_yfh)
+     data_archive_path = data_archive_path or MGNDATA_ARCHIVE_PATH
+     workbook_path = data_archive_path.parent / f"damodaran_{_table_name}_data.xls"
+     if data_archive_path.is_file() and not data_download_flag:
          with (
-             zipfile.ZipFile(data_archive_path_) as _yzip,
-             _yzip.open(f"{data_archive_path_.stem}.yaml") as _yfh,
+             zipfile.ZipFile(data_archive_path) as _yzip,
+             _yzip.open(f"{data_archive_path.stem}.yaml") as _yfh,
          ):
-             margin_data_dict: dict[str, dict[str, float | int]] = this_yaml.load(_yfh)
-             return _mappingproxy_from_mapping(margin_data_dict)
-     elif workbook_path_.is_file():
-         workbook_path_.unlink()
-         if data_archive_path_.is_file():
-             data_archive_path_.unlink()
+             margin_data_dict: MappingProxyType[
+                 str, MappingProxyType[str, float | int]
+             ] = this_yaml.load(_yfh)
+             return margin_data_dict
+     elif workbook_path.is_file():
+         workbook_path.unlink()
+         if data_archive_path.is_file():
+             data_archive_path.unlink()

      margin_urlstr = (
          f"https://pages.stern.nyu.edu/~adamodar/pc/datasets/{_table_name}.xls"
@@ -96,7 +100,7 @@ def margin_data_getter( # noqa: PLR0912
              u3pm.request(
                  "GET", margin_urlstr, preload_content=False
              ) as _urlopen_handle,
-             workbook_path_.open("wb") as margin_file,
+             workbook_path.open("wb") as margin_file,
          ):
              while True:
                  data_ = _urlopen_handle.read(chunk_size_)
@@ -104,7 +108,7 @@ def margin_data_getter( # noqa: PLR0912
                      break
                  margin_file.write(data_)

-         print(f"Downloaded {margin_urlstr} to {workbook_path_}.")
+         print(f"Downloaded {margin_urlstr} to {workbook_path}.")

      except urllib3.exceptions.MaxRetryError as error_:
          if isinstance(error_.__cause__, urllib3.exceptions.SSLError):
@@ -115,42 +119,38 @@ def margin_data_getter( # noqa: PLR0912
                  f"WARNING: Could not establish secure connection to, {margin_urlstr}."
                  "Using bundled copy."
              )
-             if not workbook_path_.is_file():
-                 with resources.as_file(
-                     resources.files(f"{_PKG_NAME}.data").joinpath(
-                         "empirical_margin_distribution.xls"
-                     )
-                 ) as margin_data_archive_path:
-                     shutil.copy2(margin_data_archive_path, workbook_path_)
+             if not workbook_path.is_file():
+                 shutil.copy2(mdat.DAMODARAN_MARGIN_WORKBOOK, workbook_path)
          else:
              raise error_

-     xl_book_ = open_workbook(workbook_path_, ragged_rows=True, on_demand=True)
-     xl_sheet_ = xl_book_.sheet_by_name("Industry Averages")
+     xl_book = open_workbook(workbook_path, ragged_rows=True, on_demand=True)
+     xl_sheet = xl_book.sheet_by_name("Industry Averages")

-     margin_dict: dict[str, dict[str, float | int]] = {}
-     row_keys_: list[str] = []
+     margin_dict_in: dict[str, dict[str, float | int]] = {}
+     row_keys: list[str] = []
      read_row_flag = False
-     for _ridx in range(xl_sheet_.nrows):
-         xl_row = xl_sheet_.row_values(_ridx)
+     for _ridx in range(xl_sheet.nrows):
+         xl_row = xl_sheet.row_values(_ridx)
          if xl_row[0] == "Industry Name":
              read_row_flag = True
-             row_keys_ = xl_row
+             row_keys = xl_row
              continue

          if not xl_row[0] or not read_row_flag:
              continue

          xl_row[1] = int(xl_row[1])
-         margin_dict[xl_row[0]] = dict(zip(row_keys_[1:], xl_row[1:], strict=True))
+         margin_dict_in[xl_row[0]] = dict(zip(row_keys[1:], xl_row[1:], strict=True))

+     margin_dict = _mappingproxy_from_mapping(margin_dict_in)
      with (
-         zipfile.ZipFile(data_archive_path_, "w") as _yzip,
-         _yzip.open(f"{data_archive_path_.stem}.yaml", "w") as _yfh,
+         zipfile.ZipFile(data_archive_path, "w") as _yzip,
+         _yzip.open(f"{data_archive_path.stem}.yaml", "w") as _yfh,
      ):
          this_yaml.dump(margin_dict, _yfh)

-     return _mappingproxy_from_mapping(margin_dict)
+     return margin_dict


  def margin_data_builder(
@@ -240,9 +240,9 @@ def margin_data_resampler(

      seed_sequence_ = seed_sequence or SeedSequence(pool_size=8)

-     x_, w_, _ = margin_data_builder(margin_data_getter())
+     _x, _w, _ = margin_data_builder(margin_data_getter())

-     margin_kde = stats.gaussian_kde(x_, weights=w_, bw_method="silverman")
+     margin_kde = stats.gaussian_kde(_x, weights=_w, bw_method="silverman")
      margin_kde.set_bandwidth(bw_method=margin_kde.factor / 3.0)

      if isinstance(_sample_size, int):
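A runnable miniature of the resampling step shown in this hunk, with hypothetical margin observations and weights standing in for the Damodaran data:

.. code-block:: python

    import numpy as np
    from numpy.random import PCG64DXSM, Generator, SeedSequence
    from scipy import stats

    # Hypothetical margin observations and firm-count weights.
    _x = np.array([0.15, 0.22, 0.30, 0.41, 0.55])
    _w = np.array([5.0, 12.0, 9.0, 4.0, 1.0])

    margin_kde = stats.gaussian_kde(_x, weights=_w, bw_method="silverman")
    margin_kde.set_bandwidth(bw_method=margin_kde.factor / 3.0)  # narrow the kernel

    rng = Generator(PCG64DXSM(SeedSequence(pool_size=8)))
    sample = margin_kde.resample(10**4, seed=rng)  # shape (1, 10000)
    print(sample.shape, round(float(sample.mean()), 3))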
@@ -13,7 +13,6 @@ from __future__ import annotations
  import re
  import shutil
  from collections.abc import Sequence
- from importlib import resources
  from operator import itemgetter
  from pathlib import Path
  from types import MappingProxyType
@@ -26,17 +25,12 @@ import urllib3
  from bs4 import BeautifulSoup
  from numpy.testing import assert_array_equal

- from .. import (  # noqa: TID252
-     _PKG_NAME,
-     DATA_DIR,
-     EMPTY_ARRAYINT,
-     VERSION,
-     ArrayBIGINT,
-     this_yaml,
- )
+ from .. import EMPTY_ARRAYINT, VERSION, ArrayBIGINT, this_yaml  # noqa: TID252
+ from .. import WORK_DIR as PKG_WORK_DIR  # noqa: TID252
+ from .. import data as mdat  # noqa: TID252
  from . import (
      INVData,
-     INVData_in_,
+     INVData_in,
      INVTableData,
      _dict_from_mapping,
      _mappingproxy_from_mapping,
@@ -46,21 +40,16 @@ __version__ = VERSION

  m.patch()

- FTCDATA_DIR = DATA_DIR / "FTCData"
- if not FTCDATA_DIR.is_dir():
-     FTCDATA_DIR.mkdir(parents=True)
+ WORK_DIR = globals().get("WORK_DIR", PKG_WORK_DIR)
+ """Redefined, in case the user defines WORK_DIR between module imports."""

- INVDATA_ARCHIVE_PATH = DATA_DIR / "ftc_invdata.zip"
- if (
-     not INVDATA_ARCHIVE_PATH.is_file()
-     and (
-         _bundled_copy := resources.files(f"{_PKG_NAME}.data").joinpath(
-             INVDATA_ARCHIVE_PATH.name
-         )
-     ).is_file()
- ):
-     with resources.as_file(_bundled_copy) as _bundled_copy_path:
-         shutil.copy2(_bundled_copy_path, INVDATA_ARCHIVE_PATH)
+ FID_WORK_DIR = WORK_DIR / "FTCData"
+ if not FID_WORK_DIR.is_dir():
+     FID_WORK_DIR.mkdir(parents=True)
+
+ INVDATA_ARCHIVE_PATH = WORK_DIR / mdat.FTC_MERGER_INVESTIGATIONS_DATA.name
+ if not INVDATA_ARCHIVE_PATH.is_file():
+     shutil.copy2(mdat.FTC_MERGER_INVESTIGATIONS_DATA, INVDATA_ARCHIVE_PATH)

  TABLE_NO_RE = re.compile(r"Table \d+\.\d+")
  TABLE_TYPES = ("ByHHIandDelta", "ByFirmCount")
@@ -147,8 +136,8 @@ def construct_data(
          ZipFile(_archive_path, "r") as _yzh,
          _yzh.open(f"{_archive_path.stem}.yaml", "r") as _yfh,
      ):
-         invdata_ = this_yaml.load(_yfh)
-         if isinstance(invdata_, MappingProxyType):
+         invdata_: INVData = this_yaml.load(_yfh)
+         if not isinstance(invdata_, MappingProxyType):
              invdata_ = _mappingproxy_from_mapping(invdata_)
      with (
          ZipFile(_archive_path, "w", compression=ZIP_DEFLATED) as _yzh,
@@ -157,7 +146,7 @@ def construct_data(
              this_yaml.dump(invdata_, _yfh)
          return invdata_

-     invdata: INVData_in_ = _dict_from_mapping(_parse_invdata())
+     invdata: INVData_in = _dict_from_mapping(_parse_invdata())

      # Add some data periods (
      #   only periods ending in 2011, others have few observations and
@@ -217,7 +206,7 @@ def construct_data(
      return retval


- def _construct_no_evidence_data(_invdata: INVData_in_, _data_period: str, /) -> None:
+ def _construct_no_evidence_data(_invdata: INVData_in, _data_period: str, /) -> None:
      invdata_ind_grp = "All Markets"
      table_nos_map = dict(
          zip(
@@ -442,12 +431,12 @@ def _parse_invdata() -> INVData:
      # )
      import pymupdf  # type: ignore  # noqa: PLC0415

-     invdata_docnames = _download_invdata(FTCDATA_DIR)
+     invdata_docnames = _download_invdata(FID_WORK_DIR)

-     invdata: INVData_in_ = {}
+     invdata: INVData_in = {}

      for invdata_docname in invdata_docnames:
-         invdata_pdf_path = FTCDATA_DIR.joinpath(invdata_docname)
+         invdata_pdf_path = FID_WORK_DIR.joinpath(invdata_docname)

          invdata_doc = pymupdf.open(invdata_pdf_path)
          invdata_meta = invdata_doc.metadata
@@ -513,7 +502,7 @@ def _parse_invdata() -> INVData:


  def _parse_page_blocks(
-     _invdata: INVData_in_, _data_period: str, _doc_pg_blocks: Sequence[Sequence[Any]], /
+     _invdata: INVData_in, _data_period: str, _doc_pg_blocks: Sequence[Sequence[Any]], /
  ) -> None:
      if _data_period != "1996-2011":
          _parse_table_blocks(_invdata, _data_period, _doc_pg_blocks)
@@ -540,7 +529,7 @@ def _parse_page_blocks(


  def _parse_table_blocks(
-     _invdata: INVData_in_, _data_period: str, _table_blocks: Sequence[Sequence[str]], /
+     _invdata: INVData_in, _data_period: str, _table_blocks: Sequence[Sequence[str]], /
  ) -> None:
      invdata_evid_cond = "Unrestricted on additional evidence"
      table_num, table_ser, table_type = _identify_table_type(
@@ -709,7 +698,7 @@ def _process_table_blks_cnt_type(
      return invdata_array[np.argsort(invdata_array[:, 0])]


- def _download_invdata(_dl_path: Path = FTCDATA_DIR) -> tuple[str, ...]:
+ def _download_invdata(_dl_path: Path = FID_WORK_DIR) -> tuple[str, ...]:
      if not _dl_path.is_dir():
          _dl_path.mkdir(parents=True)

@@ -12,7 +12,6 @@ from typing import Literal
  import numpy as np
  from attrs import Attribute, field, frozen, validators
  from mpmath import mp  # type: ignore
- from ruamel import yaml

  from .. import (  # noqa: TID252
      DEFAULT_REC_RATIO,
@@ -23,7 +22,6 @@ from .. import ( # noqa: TID252
      UPPAggrSelector,
      this_yaml,
      yamelize_attrs,
-     yaml_rt_mapper,
  )
  from . import guidelines_boundary_functions as gbfn

@@ -53,14 +51,12 @@ class GuidelinesThresholds:

      ΔHHI, Recapture Ratio, GUPPI, Diversion ratio, CMCR, and IPR thresholds
      constructed from concentration standards in Guidelines published in
-     1982, 1984, 1992, 2010, and 2023.
+     1992, 2010, and 2023.

      """

      pub_year: HMGPubYear = field(
-         kw_only=False,
-         default=2023,
-         validator=validators.in_([1982, 1984, 1992, 2010, 2023]),
+         kw_only=False, default=2023, validator=validators.in_([1992, 2010, 2023])
      )
      """
      Year of publication of the Guidelines
@@ -99,9 +95,7 @@ class GuidelinesThresholds:
      # thus, here, the tentative delta safeharbor under
      # the 2023 Guidelines is 100 points
      hhi_p, dh_s, dh_p = {
-         1982: (_s1982 := (0.18, 0.005, 0.01)),
-         1984: _s1982,
-         1992: _s1982,
+         1992: (0.18, 0.005, 0.01),
          2010: (0.25, 0.01, 0.02),
          2023: (0.18, 0.01, 0.01),
      }[self.pub_year]
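Restating the lookup above outside the class (values copied from this hunk), with shares as fractions so multiplying by 10**4 gives HHI points:

.. code-block:: python

    conc_standards = {
        1992: (0.18, 0.005, 0.01),
        2010: (0.25, 0.01, 0.02),
        2023: (0.18, 0.01, 0.01),
    }
    hhi_p, dh_s, dh_p = conc_standards[2010]
    # HHI presumption, ΔHHI safe harbor, ΔHHI presumption, in HHI points:
    print(int(hhi_p * 10**4), int(dh_s * 10**4), int(dh_p * 10**4))  # 2500 100 200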
@@ -147,21 +141,6 @@ class GuidelinesThresholds:
          ),
      )

-     @classmethod
-     def to_yaml(
-         cls, _r: yaml.representer.RoundTripRepresenter, _d: GuidelinesThresholds
-     ) -> yaml.MappingNode:
-         ret: yaml.MappingNode = _r.represent_mapping(
-             f"!{cls.__name__}", {"pub_year": _d.pub_year}
-         )
-         return ret
-
-     @classmethod
-     def from_yaml(
-         cls, _c: yaml.constructor.RoundTripConstructor, _n: yaml.MappingNode
-     ) -> GuidelinesThresholds:
-         return cls(**yaml_rt_mapper(_c, _n))
-

  @frozen
  class ConcentrationBoundary:
@@ -170,8 +149,8 @@ class ConcentrationBoundary:
      measure_name: Literal[
          "ΔHHI",
          "Combined share",
-         "Pre-merger HHI Contribution",
-         "Post-merger HHI Contribution",
+         "HHI contribution, pre-merger",
+         "HHI contribution, post-merger",
      ] = field(kw_only=False, default="ΔHHI")

      @measure_name.validator
@@ -181,8 +160,8 @@ class ConcentrationBoundary:
          if _value not in {
              "ΔHHI",
              "Combined share",
-             "Pre-merger HHI Contribution",
-             "Post-merger HHI Contribution",
+             "HHI contribution, pre-merger",
+             "HHI contribution, post-merger",
          }:
              raise ValueError(f"Invalid name for a concentration measure, {_value!r}.")

@@ -211,9 +190,9 @@ class ConcentrationBoundary:
              case "ΔHHI":
                  conc_fn = gbfn.hhi_delta_boundary
              case "Combined share":
                  conc_fn = gbfn.combined_share_boundary
-             case "Pre-merger HHI Contribution":
+             case "HHI contribution, pre-merger":
                  conc_fn = gbfn.hhi_pre_contrib_boundary
-             case "Post-merger HHI Contribution":
+             case "HHI contribution, post-merger":
                  conc_fn = gbfn.hhi_post_contrib_boundary

          boundary_ = conc_fn(self.threshold, dps=self.precision)
@@ -257,7 +236,7 @@ class DiversionRatioBoundary:
      )

      recapture_form: RECForm | None = field(kw_only=True, default=RECForm.INOUT)
-     """
+     R"""
      The form of the recapture ratio.

      When :attr:`mergeron.RECForm.INOUT`, the recapture ratio for
@@ -268,12 +247,17 @@ class DiversionRatioBoundary:
      constructed from the generated purchase-probabilities for products in
      the market and for the outside good, specify :attr:`mergeron.RECForm.OUTIN`.)

-     The GUPPI boundary is a continuum of diversion ratio boundaries conditional on
-     price-cost margins, :math:`d_{ij} = g_i * p_i / (m_j * p_j)`,
-     with :math:`d_{ij}` the diverion ratio from product :math:`i` to product :math:`j`;
+     The GUPPI boundary is a continuum of conditional diversion ratio boundaries,
+
+     .. math::
+
+         d_{ij} \vert_{p_i, p_j, m_j} \triangleq \frac{g_i p_i}{m_j p_j} = \overline{d}
+
+     with :math:`d_{ij}` the diversion ratio from product :math:`i` to product :math:`j`;
      :math:`g_i` the GUPPI for product :math:`i`;
-     :math:`m_j` the margin for product :math:`j`; and
-     :math:`p_i, p_j` the prices of goods :math:`i, j`, respectively.
+     :math:`m_j` the price-cost margin on product :math:`j`;
+     :math:`p_i, p_j` the prices of goods :math:`i, j`, respectively; and
+     :math:`\overline{d}` the diversion ratio threshold (i.e., bound).

      """

@@ -477,5 +461,10 @@ if __name__ == "__main__":
      )


- for _typ in (HMGThresholds, ConcentrationBoundary, DiversionRatioBoundary):
-     yamelize_attrs(_typ, {"coordinates", "area"})
+ for _typ in (
+     ConcentrationBoundary,
+     DiversionRatioBoundary,
+     GuidelinesThresholds,
+     HMGThresholds,
+ ):
+     yamelize_attrs(_typ)
@@ -699,7 +699,7 @@ def _shrratio_boundary_intcpt(


  def lerp[LerpT: (float, MPFloat, ArrayDouble, ArrayBIGINT)](
-     _x1: LerpT, _x2: LerpT, r_: float | MPFloat = 0.25, /
+     _x1: LerpT, _x2: LerpT, _r: float | MPFloat = 0.25, /
  ) -> LerpT:
      """
      From the function of the same name in the C++ standard [2]_
@@ -711,7 +711,7 @@ def lerp[LerpT: (float, MPFloat, ArrayDouble, ArrayBIGINT)](
      ----------
      _x1, _x2
          bounds :math:`x_1, x_2` to interpolate between.
-     r_
+     _r
          interpolation weight :math:`r` assigned to :math:`x_2`

      Returns
@@ -731,14 +731,14 @@ def lerp[LerpT: (float, MPFloat, ArrayDouble, ArrayBIGINT)](

      """

-     if not 0 <= r_ <= 1:
+     if not 0 <= _r <= 1:
          raise ValueError("Specified interpolation weight must lie in [0, 1].")
-     elif r_ == 0:
+     elif _r == 0:
          return _x1
-     elif r_ == 1:
+     elif _r == 1:
          return _x2
      else:
-         return r_ * _x2 + (1 - r_) * _x1
+         return _r * _x2 + (1 - _r) * _x1


  def round_cust(
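Usage sketch for `lerp`, assuming the function defined above is in scope; it interpolates floats and NumPy arrays alike:

.. code-block:: python

    import numpy as np

    print(lerp(0.0, 10.0))       # 2.5 with the default weight _r = 0.25
    print(lerp(0.0, 10.0, 0.5))  # 5.0
    print(lerp(np.zeros(3), np.array([1.0, 2.0, 4.0]), 0.25))  # [0.25 0.5  1.  ]
    # lerp(0.0, 10.0, 1.5) raises ValueError: weight must lie in [0, 1]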
@@ -45,8 +45,6 @@ def dh_area_quad(_dh_val: float = 0.01, /) -> float:
      ----------
      _dh_val
          Merging-firms' ΔHHI bound.
-     dps
-         Specified precision in decimal places.

      Returns
      -------
@@ -297,10 +295,10 @@ def shrratio_boundary_distance( # noqa: PLR0914

      weights_i = (
          (
-             w_ := mp.fdiv(
+             _w := mp.fdiv(
                  s_2 if weighting == "cross-product-share" else s_1, s_1 + s_2
              ),
-             1 - w_,
+             1 - _w,
          )
          if weighting
          else _weights_base
@@ -112,11 +112,11 @@ def gen_seed_seq_list_default(
          63206306147411023146090085885772240748399174641427012462446714431253444120718,
      ]

-     if _len > (lge_ := len(generated_entropy)):
+     if _len > (_lge := len(generated_entropy)):
          e_str_segs = (
              "This function can presently create SeedSequences for generating up to ",
-             f"{lge_:,d} independent random variates. If you really need to generate ",
-             f"more than {lge_:,d} seeded independent random variates, please pass a ",
+             f"{_lge:,d} independent random variates. If you really need to generate ",
+             f"more than {_lge:,d} seeded independent random variates, please pass a ",
              "sufficiently large list of seeds as generated_entropy. See,",
              "{}/{}.".format(
                  "https://numpy.org/doc/stable/reference/random",
@@ -219,13 +219,13 @@ class MultithreadedRNG:
                  self.dist_parms, DEFAULT_DIST_PARMS
              ):
                  if self.dist_type == "Uniform":
-                     dist_type_ = "Random"
+                     dist_type = "Random"
                  elif self.dist_type == "Normal":
-                     dist_type_ = "Gaussian"
+                     dist_type = "Gaussian"
                  else:
-                     dist_type_ = self.dist_type
+                     dist_type = self.dist_type

-             step_size = (len(self.values) / self.nthreads).__ceil__()  # noqa: PLC2801
+             step_size = (len(self.values) / self.nthreads).__ceil__()

              seed_ = (
                  SeedSequence(pool_size=8)
@@ -233,7 +233,7 @@ class MultithreadedRNG:
                  else self.seed_sequence
              )

-             random_generators_ = tuple(prng(_t) for _t in seed_.spawn(self.nthreads))
+             random_generators = tuple(prng(_t) for _t in seed_.spawn(self.nthreads))

              def _fill(
                  _rng: np.random.Generator,
@@ -244,23 +244,23 @@ class MultithreadedRNG:
                  _last: int,
                  /,
              ) -> None:
-                 sz_: tuple[int, ...] = out_[_first:_last].shape
+                 _sz: tuple[int, ...] = out_[_first:_last].shape
                  match _dist_type:
                      case "Beta":
                          shape_a, shape_b = _dist_parms
-                         out_[_first:_last] = _rng.beta(shape_a, shape_b, size=sz_)
+                         out_[_first:_last] = _rng.beta(shape_a, shape_b, size=_sz)
                      case "Dirichlet":
-                         out_[_first:_last] = _rng.dirichlet(_dist_parms, size=sz_[:-1])
+                         out_[_first:_last] = _rng.dirichlet(_dist_parms, size=_sz[:-1])
                      case "Gaussian":
                          _rng.standard_normal(out=out_[_first:_last])
                      case "Normal":
-                         mu_, sigma_ = _dist_parms
-                         out_[_first:_last] = _rng.normal(mu_, sigma_, size=sz_)
+                         _mu, _sigma = _dist_parms
+                         out_[_first:_last] = _rng.normal(_mu, _sigma, size=_sz)
                      case "Random":
                          _rng.random(out=out_[_first:_last])
                      case "Uniform":
                          uni_l, uni_h = _dist_parms
-                         out_[_first:_last] = _rng.uniform(uni_l, uni_h, size=sz_)
+                         out_[_first:_last] = _rng.uniform(uni_l, uni_h, size=_sz)
                      case _:
                          "Unreachable. The validator would have rejected this as invalid."

@@ -271,8 +271,8 @@ class MultithreadedRNG:

                  executor_.submit(
                      _fill,
-                     random_generators_[_i],
-                     dist_type_,
+                     random_generators[_i],
+                     dist_type,
                      self.dist_parms,
                      self.values,
                      range_first,
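A compact, self-contained sketch of the multithreaded fill pattern this class uses — one generator per thread, spawned from a single `SeedSequence`, each writing its slice of a shared array in place (names here are illustrative, not the class's own):

.. code-block:: python

    import concurrent.futures

    import numpy as np
    from numpy.random import PCG64DXSM, Generator, SeedSequence

    nthreads, size = 4, 1_000_000
    values = np.empty(size)
    step_size = -(-size // nthreads)  # same ceiling as (size / nthreads).__ceil__()

    # One independent generator per thread, spawned from a single seed sequence.
    rngs = [Generator(PCG64DXSM(_s)) for _s in SeedSequence(pool_size=8).spawn(nthreads)]


    def _fill(_rng: np.random.Generator, _first: int, _last: int) -> None:
        _rng.random(out=values[_first:_last])  # uniform draws written in place


    with concurrent.futures.ThreadPoolExecutor(nthreads) as executor_:
        for _i in range(nthreads):
            executor_.submit(_fill, rngs[_i], _i * step_size, min((_i + 1) * step_size, size))

    print(values[:3])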
@@ -0,0 +1,57 @@
+ """
+ Data useful for empirical analysis of merger enforcement policy
+
+ These data are processed for further analysis within relevant
+ submodules of the parent package. Thus, direct access is
+ unnecessary in routine use of this package.
+ """
+
+ from importlib import resources
+
+ from .. import _PKG_NAME, VERSION  # noqa: TID252
+
+ __version__ = VERSION
+
+
+ DAMODARAN_MARGIN_WORKBOOK = resources.files(f"{_PKG_NAME}.data").joinpath(
+     "damodaran_margin_data.xls"
+ )
+ """
+ Python object pointing to the included copy of Prof. Damodaran's margin data
+
+ Only used as a fallback, in case direct download from source fails.
+
+ NOTES
+ -----
+ Source data are from Prof. Aswath Damodaran, Stern School of Business, NYU; available online
+ at https://pages.stern.nyu.edu/~adamodar/pc/datasets/margin.xls
+
+ Use as, for example:
+
+ .. code-block:: python
+
+     from mergeron.data import DAMODARAN_MARGIN_WORKBOOK
+
+     shutil.copy2(DAMODARAN_MARGIN_WORKBOOK, Path.home() / f"{DAMODARAN_MARGIN_WORKBOOK.name}")
+ """
+
+ FTC_MERGER_INVESTIGATIONS_DATA = resources.files(f"{_PKG_NAME}.data").joinpath(
+     "ftc_merger_investigations_data.zip"
+ )
+ """
+ FTC merger investigations data published in 2004, 2007, 2008, and 2013
+
+ NOTES
+ -----
+ Raw data tables published by the FTC are loaded into a nested dictionary, organized by
+ data period, table type, and table number. Each table is stored as a numerical array
+ (:mod:`numpy` array), with additional attributes for the industry group and additional
+ evidence noted in the source data.
+
+ Data for additional data periods (time spans) not reported in the source data,
+ e.g., 2004-2011, are constructed by subtracting counts in the base data from counts
+ in the cumulative data, by table, for "enforced" mergers and "closed" mergers, when
+ the cumulative data for the longer period are consistent with the base data for
+ a sub-period.
+ """
@@ -13,9 +13,12 @@ from numpy.random import PCG64DXSM, Generator, SeedSequence
  from scipy import stats  # type: ignore

  import mergeron.core.empirical_margin_distribution as emd
- from mergeron import DATA_DIR
+ from mergeron import WORK_DIR as PKG_WORK_DIR
  from mergeron.core.guidelines_boundary_functions import boundary_plot

+ WORK_DIR = globals().get("WORK_DIR", PKG_WORK_DIR)
+ """Redefined, in case the user defines WORK_DIR between module imports."""
+
  SAMPLE_SIZE = 10**6
  BIN_COUNT = 25
  margin_data_obs, margin_data_wts, margin_data_stats = emd.margin_data_builder()
@@ -85,4 +88,4 @@ mgn_ax.set_xlabel("Price Cost Margin", fontsize=10)
  mgn_ax.set_ylabel("Relative Frequency", fontsize=10)

  mgn_fig.tight_layout()
- plt.savefig(DATA_DIR / f"{Path(__file__).stem}.pdf")
+ plt.savefig(WORK_DIR / f"{Path(__file__).stem}.pdf")
@@ -7,9 +7,11 @@ containers for industry data generation and testing.
  from __future__ import annotations

  import enum
+ import io
  from collections.abc import Sequence
  from operator import attrgetter

+ import h5py  # type: ignore
  import numpy as np
  from attrs import Attribute, Converter, cmp_using, field, frozen, validators
  from numpy.random import SeedSequence
@@ -22,7 +24,7 @@ from .. import ( # noqa: TID252
      ArrayDouble,
      ArrayFloat,
      ArrayINT,
-     EnumYAMLized,
+     Enameled,
      RECForm,
      UPPAggrSelector,
      this_yaml,
@@ -50,7 +52,7 @@ class SeedSequenceData:

  @this_yaml.register_class
  @enum.unique
- class PriceSpec(tuple[bool, str | None], EnumYAMLized):
+ class PriceSpec(tuple[bool, str | None], Enameled):
      """Price specification.

      Whether prices are symmetric and, if not, the direction of correlation, if any.
@@ -65,7 +67,7 @@ class PriceSpec(tuple[bool, str | None], EnumYAMLized):

  @this_yaml.register_class
  @enum.unique
- class SHRDistribution(str, EnumYAMLized):
+ class SHRDistribution(str, Enameled):
      """Market share distributions."""

      UNI = "Uniform"
@@ -253,7 +255,7 @@ class ShareSpec:
      in published merger guidelines. Accordingly, the recapture ratio rounded to
      the nearest 5% is:

-     * 0.85, **7-to-6 merger from symmetry**; US Guidelines, 1982, 1984, 1992, 2023
+     * 0.85, **7-to-6 merger from symmetry**; US Guidelines, 1992, 2023
      * 0.80, 5-to-4 merger from symmetry
      * 0.80, **5-to-4 merger to symmetry**; US Guidelines, 2010

@@ -285,7 +287,7 @@ class ShareSpec:

  @this_yaml.register_class
  @enum.unique
- class PCMDistribution(str, EnumYAMLized):
+ class PCMDistribution(str, Enameled):
      """Margin distributions."""

      UNI = "Uniform"
@@ -296,7 +298,7 @@ class PCMDistribution(str, EnumYAMLized):

  @this_yaml.register_class
  @enum.unique
- class FM2Constraint(str, EnumYAMLized):
+ class FM2Constraint(str, Enameled):
      """Firm 2 margins - derivation methods."""

      IID = "i.i.d"
@@ -401,7 +403,7 @@ class PCMSpec:

  @this_yaml.register_class
  @enum.unique
- class SSZConstant(float, EnumYAMLized):
+ class SSZConstant(float, Enameled):
      """
      Scale factors to offset sample size reduction.

@@ -467,10 +469,10 @@ class MarketSampleData:
      """

      @aggregate_purchase_prob.default
-     def __appd(_i: MarketSampleData) -> ArrayINT:
-         e_ = np.empty_like(_i.frmshr_array[:, :1], float)
-         e_.fill(np.nan)
-         return e_
+     def __appd(_i: MarketSampleData) -> ArrayDouble:
+         retval: ArrayDouble = np.empty_like(_i.frmshr_array[:, :1], float)
+         retval.fill(np.nan)
+         return retval

      fcounts: ArrayINT = field(eq=cmp_using(np.array_equal))
      """Number of firms in market"""
@@ -487,19 +489,38 @@ class MarketSampleData:
      """

      @nth_firm_share.default
-     def __nfsd(_i: MarketSampleData) -> ArrayINT:
-         e_ = np.empty_like(_i.frmshr_array[:, :1], float)
-         e_.fill(np.nan)
-         return e_
+     def __nfsd(_i: MarketSampleData) -> ArrayDouble:
+         retval: ArrayDouble = np.empty_like(_i.frmshr_array[:, :1], float)
+         retval.fill(np.nan)
+         return retval

      hhi_post: ArrayDouble = field(eq=cmp_using(np.array_equal))
      """Post-merger change in Herfindahl-Hirschman Index (HHI)"""

      @hhi_post.default
-     def __hpd(_i: MarketSampleData) -> ArrayINT:
-         e_ = np.empty_like(_i.frmshr_array[:, :1], float)
-         e_.fill(np.nan)
-         return e_
+     def __hpd(_i: MarketSampleData) -> ArrayDouble:
+         retval: ArrayDouble = np.empty_like(_i.frmshr_array[:, :1], float)
+         retval.fill(np.nan)
+         return retval
+
+     def to_h5bin(self) -> bytes:
+         """Save market sample data to HDF5 file."""
+         byte_stream = io.BytesIO()
+         with h5py.File(byte_stream, "w") as _h5f:
+             for _a in self.__attrs_attrs__:
+                 if all((
+                     (_arr := getattr(self, _a.name)).any(),
+                     not np.isnan(_arr).all(),
+                 )):
+                     _h5f.create_dataset(_a.name, data=_arr, fletcher32=True)
+         return byte_stream.getvalue()
+
+     @classmethod
+     def from_h5f(cls, _hfh: io.BufferedReader) -> MarketSampleData:
+         """Load market sample data from HDF5 file."""
+         with h5py.File(_hfh, "r") as _h5f:
+             _retval = cls(**{_a: _h5f[_a][:] for _a in _h5f})
+         return _retval


  @frozen
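A standalone miniature of the new `to_h5bin()`/`from_h5f()` round trip, with a hypothetical single-field dataset standing in for the attrs attributes:

.. code-block:: python

    import io

    import h5py
    import numpy as np

    arrays = {"frmshr_array": np.array([[0.20, 0.10], [0.30, 0.25]])}

    byte_stream = io.BytesIO()
    with h5py.File(byte_stream, "w") as _h5f:
        for _name, _arr in arrays.items():
            _h5f.create_dataset(_name, data=_arr, fletcher32=True)  # checksummed
    h5bin = byte_stream.getvalue()  # the bytes to_h5bin() would return

    with h5py.File(io.BytesIO(h5bin), "r") as _h5f:
        restored = {_name: _h5f[_name][:] for _name in _h5f}
    print(np.array_equal(arrays["frmshr_array"], restored["frmshr_array"]))  # True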
@@ -557,7 +578,7 @@ class MarginDataSample:

  @this_yaml.register_class
  @enum.unique
- class INVResolution(str, EnumYAMLized):
+ class INVResolution(str, Enameled):
      CLRN = "clearance"
      ENFT = "enforcement"
      BOTH = "investigation"
@@ -5,12 +5,10 @@ Methods to generate data for analyzing merger enforcement policy.

  from __future__ import annotations

- import io
  import zipfile
  from itertools import starmap
  from typing import TypedDict

- import h5py  # type: ignore
  import numpy as np
  from attrs import Attribute, Converter, define, field, validators
  from joblib import Parallel, cpu_count, delayed  # type: ignore
@@ -448,26 +446,26 @@ class MarketSample:
              this_yaml.dump(self, _yfh)

          if save_dataset:
-             if all((_dt := self.dataset is None, _et := self.enf_counts is None)):
+             if all((_ndt := self.dataset is None, _net := self.enf_counts is None)):
                  raise ValueError(
                      "No dataset and/or enforcement counts available for saving. "
                      "Generate some data or set save_dataset to False to proceed."
                  )

-             if not _dt:
-                 byte_stream = io.BytesIO()
-                 with h5py.File(byte_stream, "w") as h5f:
-                     for _a in self.dataset.__attrs_attrs__:
-                         if all((
-                             (_arr := getattr(self.dataset, _a.name)).any(),
-                             not np.isnan(_arr).all(),
-                         )):
-                             h5f.create_dataset(_a.name, data=_arr, fletcher32=True)
+             if not _ndt:
+                 # byte_stream = io.BytesIO()
+                 # with h5py.File(byte_stream, "w") as h5f:
+                 #     for _a in self.dataset.__attrs_attrs__:
+                 #         if all((
+                 #             (_arr := getattr(self.dataset, _a.name)).any(),
+                 #             not np.isnan(_arr).all(),
+                 #         )):
+                 #             h5f.create_dataset(_a.name, data=_arr, fletcher32=True)

                  with (zpath / f"{name_root}_dataset.h5").open("wb") as _hfh:
-                     _hfh.write(byte_stream.getvalue())
+                     _hfh.write(self.dataset.to_h5bin())

-             if not _et:
+             if not _net:
                  with (zpath / f"{name_root}_enf_counts.yaml").open("w") as _yfh:
                      this_yaml.dump(self.enf_counts, _yfh)

@@ -491,11 +489,11 @@ class MarketSample:

          if _dt:
              with _dp.open("rb") as _hfh:
-                 h5f = h5py.File(_hfh)
                  object.__setattr__(  # noqa: PLC2801
                      market_sample_,
                      "dataset",
-                     MarketSampleData(**{_a: h5f[_a][:] for _a in h5f}),
+                     # MarketSampleData(**{_a: h5f[_a][:] for _a in h5f}),
+                     MarketSampleData.from_h5f(_hfh),
                  )
          if _et:
              object.__setattr__(  # noqa: PLC2801
@@ -9,7 +9,7 @@ from collections.abc import Mapping
  import numpy as np
  from scipy.interpolate import interp1d  # type: ignore

- from .. import VERSION, ArrayBIGINT, EnumYAMLized, this_yaml  # noqa: TID252
+ from .. import VERSION, ArrayBIGINT, Enameled, this_yaml  # noqa: TID252
  from ..core import ftc_merger_investigations_data as fid  # noqa: TID252
  from . import INVResolution

@@ -18,7 +18,7 @@ __version__ = VERSION

  @this_yaml.register_class
  @enum.unique
- class IndustryGroup(str, EnumYAMLized):
+ class IndustryGroup(str, Enameled):
      ALL = "All Markets"
      GRO = "Grocery Markets"
      OIL = "Oil Markets"
@@ -33,7 +33,7 @@ class IndustryGroup(str, EnumYAMLized):

  @this_yaml.register_class
  @enum.unique
- class OtherEvidence(str, EnumYAMLized):
+ class OtherEvidence(str, Enameled):
      UR = "Unrestricted on additional evidence"
      HD = "Hot Documents Identified"
      HN = "No Hot Documents Identified"
@@ -48,7 +48,7 @@ class OtherEvidence(str, EnumYAMLized):

  @this_yaml.register_class
  @enum.unique
- class StatsGrpSelector(str, EnumYAMLized):
+ class StatsGrpSelector(str, Enameled):
      FC = "ByFirmCount"
      HD = "ByHHIandDelta"
      DL = "ByDelta"
@@ -57,7 +57,7 @@ class StatsGrpSelector(str, EnumYAMLized):

  @this_yaml.register_class
  @enum.unique
- class StatsReturnSelector(str, EnumYAMLized):
+ class StatsReturnSelector(str, Enameled):
      CNT = "count"
      RPT = "rate, point"
      RIN = "rate, interval"
@@ -65,7 +65,7 @@ class StatsReturnSelector(str, EnumYAMLized):

  @this_yaml.register_class
  @enum.unique
- class SortSelector(str, EnumYAMLized):
+ class SortSelector(str, Enameled):
      UCH = "unchanged"
      REV = "reversed"

@@ -236,19 +236,19 @@ def table_no_lku(
      /,
  ) -> str:
      if _table_ind_group not in (
-         igl_ := [_data_array_dict_sub[_v].industry_group for _v in _data_array_dict_sub]
+         _igl := [_data_array_dict_sub[_v].industry_group for _v in _data_array_dict_sub]
      ):
          raise ValueError(
              f"Invalid value for industry group, {f'"{_table_ind_group}"'}."
-             f"Must be one of {igl_!r}"
+             f"Must be one of {_igl!r}"
          )

      tno_ = next(
-         t_
-         for t_ in _data_array_dict_sub
+         _t
+         for _t in _data_array_dict_sub
          if all((
-             _data_array_dict_sub[t_].industry_group == _table_ind_group,
-             _data_array_dict_sub[t_].additional_evidence == _table_evid_cond,
+             _data_array_dict_sub[_t].industry_group == _table_ind_group,
+             _data_array_dict_sub[_t].additional_evidence == _table_evid_cond,
          ))
      )

@@ -259,10 +259,10 @@ def enf_cnts_byfirmcount(_cnts_array: ArrayBIGINT, /) -> ArrayBIGINT:
      ndim_in = 1
      return np.vstack([
          np.concatenate([
-             (f,),
-             np.einsum("ij->j", _cnts_array[_cnts_array[:, 0] == f][:, ndim_in:]),
+             (_i,),
+             np.einsum("ij->j", _cnts_array[_cnts_array[:, 0] == _i][:, ndim_in:]),
          ])
-         for f in np.unique(_cnts_array[:, 0])
+         for _i in np.unique(_cnts_array[:, 0])
      ])


@@ -270,10 +270,10 @@ def enf_cnts_bydelta(_cnts_array: ArrayBIGINT, /) -> ArrayBIGINT:
      ndim_in = 2
      return np.vstack([
          np.concatenate([
-             (f_,),
-             np.einsum("ij->j", _cnts_array[_cnts_array[:, 1] == f_][:, ndim_in:]),
+             (_k,),
+             np.einsum("ij->j", _cnts_array[_cnts_array[:, 1] == _k][:, ndim_in:]),
          ])
-         for f_ in HHI_DELTA_KNOTS[:-1]
+         for _k in HHI_DELTA_KNOTS[:-1]
      ])


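A worked miniature of the group-sum pattern used in both functions above — the einsum spec "ij->j" sums the rows selected by each key column-wise (the toy counts are hypothetical):

.. code-block:: python

    import numpy as np

    _cnts_array = np.array([
        [2, 5, 1],  # firm count in column 0; enforcement counts in the rest
        [2, 3, 2],
        [3, 7, 0],
    ])
    grouped = np.vstack([
        np.concatenate([
            (_i,),
            np.einsum("ij->j", _cnts_array[_cnts_array[:, 0] == _i][:, 1:]),
        ])
        for _i in np.unique(_cnts_array[:, 0])
    ])
    print(grouped)  # [[2 8 3]
                    #  [3 7 0]]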
@@ -286,10 +286,11 @@ def enf_cnts_byconczone(_cnts_array: ArrayBIGINT, /) -> ArrayBIGINT:
      # aggregation reduces the footprint of this step in memory. Although this point
      # is more relevant for generated than observed data, using the same coding pattern
      # in both cases does make life easier
-     ndim_in = 2
-     nkeys_ = 3
+     _ndim_in = 2
+     _nkeys = 3
      cnts_byhhipostanddelta, cnts_byconczone = (
-         np.zeros(nkeys_ + _cnts_array.shape[1] - ndim_in, dtype=int) for _ in range(2)
+         np.zeros((1, _nkeys + _cnts_array.shape[1] - _ndim_in), dtype=int)
+         for _ in range(2)
      )

      # Prepare to tag clearance stats by presumption zone
@@ -314,7 +315,7 @@ def enf_cnts_byconczone(_cnts_array: ArrayBIGINT, /) -> ArrayBIGINT:
          np.array(
              (
                  *zone_val,
-                 *np.einsum("ij->j", _cnts_array[:, ndim_in:][conc_test]),
+                 *np.einsum("ij->j", _cnts_array[:, _ndim_in:][conc_test]),
              ),
              dtype=int,
          ),
@@ -337,7 +338,7 @@ def enf_cnts_byconczone(_cnts_array: ArrayBIGINT, /) -> ArrayBIGINT:
          (
              zone_val,
              np.einsum(
-                 "ij->j", cnts_byhhipostanddelta[hhi_zone_test][:, nkeys_:]
+                 "ij->j", cnts_byhhipostanddelta[hhi_zone_test][:, _nkeys:]
              ),
          ),
          dtype=int,
@@ -191,7 +191,7 @@ def compute_upp_test_arrays(

      Parameters
      ----------
-     _market_data
+     _market_data_sample
          market data sample
      _upp_test_parms
          guidelines thresholds for testing UPP and related statistics
@@ -1,3 +0,0 @@
- from .. import VERSION  # noqa: TID252
-
- __version__ = VERSION