PyPI - mgplot - Versions diffs - 0.1.0__py3-none-any.whl - Mend

mgplot 0.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (24) hide show

mgplot/__init__.py +121 -0
mgplot/bar_plot.py +107 -0
mgplot/colors.py +199 -0
mgplot/date_utils.py +324 -0
mgplot/finalise_plot.py +335 -0
mgplot/finalisers.py +364 -0
mgplot/growth_plot.py +275 -0
mgplot/kw_type_checking.py +460 -0
mgplot/line_plot.py +178 -0
mgplot/multi_plot.py +339 -0
mgplot/postcovid_plot.py +106 -0
mgplot/py.typed +1 -0
mgplot/revision_plot.py +60 -0
mgplot/run_plot.py +182 -0
mgplot/seastrend_plot.py +74 -0
mgplot/settings.py +164 -0
mgplot/summary_plot.py +240 -0
mgplot/test.py +31 -0
mgplot/utilities.py +254 -0
mgplot-0.1.0.dist-info/METADATA +53 -0
mgplot-0.1.0.dist-info/RECORD +24 -0
mgplot-0.1.0.dist-info/WHEEL +5 -0
mgplot-0.1.0.dist-info/licenses/LICENSE +8 -0
mgplot-0.1.0.dist-info/top_level.txt +1 -0

mgplot/kw_type_checking.py ADDED Viewed

@@ -0,0 +1,460 @@
+"""
+kw_type_checking.py
+- report_kwargs()
+- validate_kwargs()
+- validate_expected()
+- limit_kwargs()
+Private functions used for validating the arguments passed
+to the major functions as **kwargs keyword arguments.  This
+allows us to warn when an unexpected argument appears or
+when the value is not of the expected type.
+This module is not intended to be used directly by the user.
+The assumption is that most keyword arguments are one of the
+following types:
+- simple types (such as str, int, float, bool, complex, NoneType)
+- Sequences (such as list, tuple, but excluding strings, and without
+  being infinitely recursive, like a list of lists of lists ...)
+- Sets (such as set, frozenset)
+- Mappings (such as dict)
+Note: this means some Python types are only partially supported.
+Others are unsupported, such as: generators, iterators, and
+coroutines.
+In order to check the **kwargs dictionary, we need to construct
+a dictionary of expected keywords and their expected types.
+An example follows.
+expected = {
+    "arg1": str,  # arg1 is expected to be a string
+    "arg2": (int, float),  # arg2 is an int or a float
+    "arg3": (list, (bool,)), # arg3 is a list of Booleans
+    "arg4": (list, (float, int)), # arg4 is a list of floats or ints
+    "arg5": (Sequence, (float, int)), # a sequence of floats or ints
+    "arg6": (dict, (str, int)), # a dictionary with str keys and int values
+}
+Parsing Rules:
+- If the type is a single type, it is used as is.
+- if the type is a tuple of simple types, it is treated as a union.
+- if the type is a non-string Sequence, the subsequent tuple is a
+  union of Sequence member types.
+  - eg, (list, (float, int)) is a list of floats or ints.
+  - eg, (int, float, list, (int, float)) is an int, a float or
+        a list of ints or floats.
+- if the type is a Mapping, the subsequent 2-part tuple is treated
+  as the types of the keys and values of the Mapping.
+  - eg, (dict, (str, int)) is a dictionary with str keys and int values.
+  - eg, (dict, (str, (int, float))) is a dictionary with str keys and
+        int or float values.
+  - eg, (dict, (str, (list, (int, float)))) is a dictionary with str
+        keys and a list of ints or floats as values.
+- Sets are treated like Sequences.
+Limitations:
+- cannot specify multiple types of Sequence as a type - for example
+    ((list, tuple), int) - but you can specify (Sequence, int) which
+    will match list and tuple types. or you might do it as follows:
+    (list, (int, float), tuple, (int, float)).
+- strings, bytearrays, bytes are treated as simple types, not Sequences.
+- You cannot use generators or iterators as types, they would be
+    consumed in the testing.
+- Sequence, Set and Mapping must be imported from collections.abc
+    and not from the older typing module. A world of pain awaits
+    if you use the typing versions.
+"""
+# --- imports
+from typing import Any, Final, Union, Optional
+from typing import Sequence as TypingSequence
+from typing import Set as TypingSet
+from typing import Iterable as TypingIterable
+from typing import Mapping as TypingMapping
+from collections.abc import Sequence, Set  # Iterable and Sized
+from collections.abc import Mapping
+from collections.abc import Iterable, Sized, Container, Callable, Generator, Iterator
+import textwrap
+# --- constants
+# Recursive alias: an expectation tuple whose members are either types
+# or further (nested) tuples of the same shape.
+type NestedTypeTuple = tuple[type | NestedTypeTuple, ...]  # recursive type
+# Maps each permitted keyword-argument name to its expected type(s).
+type ExpectedTypeDict = dict[str, type | NestedTypeTuple]
+# Types treated as simple values rather than as Sequences.
+NOT_SEQUENCE: Final[tuple[type, ...]] = (str, bytearray, bytes, memoryview)
+# Keyword that switches on report_kwargs(); validate_kwargs() always
+# accepts it when its value is a bool, and limit_kwargs() always keeps it.
+REPORT_KWARGS: Final[str] = "report_kwargs"  # special case
+# --- module-scoped global variable
+# When True, validate_expected() prints its problems instead of raising.
+module_testing: bool = False
+# --- functions
+# === keyword argument reporting ===
+def report_kwargs(
+    called_from: str,
+    **kwargs,
+) -> None:
+    """
+    Dump the received keyword arguments to the console.
+    Useful for debugging purposes.
+    Arguments:
+    - called_from: str - the name of the function that called this
+      function, used for debugging.
+    - **kwargs - the keyword arguments to be reported, but only if
+        the REPORT_KWARGS key is present and set to True.
+    """
+    if kwargs.get(REPORT_KWARGS, False):
+        wrapped = textwrap.fill(str(kwargs), width=79)
+        print(f"{called_from} kwargs:\n{wrapped}\n".strip())
+# === limit kwargs to those in an approved list
+def limit_kwargs(
+    expected: ExpectedTypeDict,
+    **kwargs,
+) -> dict[str, Any]:
+    """
+    Limit the keyword arguments to those in the expected dict.
+    """
+    return {k: v for k, v in kwargs.items() if k in expected or k == REPORT_KWARGS}
+# === Keyword expectation validation ===
+def _check_expected_tuple(
+    t: NestedTypeTuple,
+) -> bool:
+    post_mapping = post_sequence = False
+    empty = True
+    for element in t:
+        empty = False
+        if isinstance(element, type):
+            if post_mapping or post_sequence:
+                return False
+            if issubclass(element, NOT_SEQUENCE):
+                post_mapping = post_sequence = False
+                continue
+            if issubclass(element, (Sequence, Set)):
+                post_sequence = True
+                continue
+            if issubclass(element, Mapping):
+                post_mapping = True
+                continue
+            post_mapping = post_sequence = False
+            continue
+        if isinstance(element, tuple):
+            if not (post_mapping or post_sequence):
+                return False
+            if post_sequence:
+                check = _check_expectations(element)
+                if not check:
+                    return False
+                post_sequence = False
+            if post_mapping:
+                if len(element) != 2:
+                    return False
+                check = _check_expectations(element[0]) and _check_expectations(
+                    element[1]
+                )
+                if not check:
+                    return False
+                post_mapping = False
+    if empty:
+        return False
+    return True
+def _check_expected_type(t: type) -> bool:
+    """
+    Check t is an acceptable stand alone type
+    """
+    if issubclass(t, NOT_SEQUENCE):
+        return True
+    if issubclass(t, (Sequence, Set, Mapping)):
+        return False
+    return True
+def _check_expectations(
+    t: type | NestedTypeTuple,
+) -> bool:
+    """
+    Check t is a type or a tuple of types.
+    Where a Sequence or Mapping type is found, check that
+    the subsequent tuple contains valid member types.
+    """
+    # --- simple case
+    if isinstance(t, type):
+        return _check_expected_type(t)
+    # --- more challenging case
+    if isinstance(t, tuple):
+        return _check_expected_tuple(t)
+    return False
+def validate_expected(
+    expected: ExpectedTypeDict,
+    called_from: str,
+) -> None:
+    """
+    Check the expected types dictionary is properly formed.
+    This function should be used on all the expected types
+    dictionaries in the module.
+    It is not intended to be used by the user.
+    This function raises an ValueError exception if the expected
+    types dictionary is malformed.
+    """
+    def check_members(key: str, t: type | NestedTypeTuple) -> str:
+        """
+        Recursively check each element of the NestedTypeTuple.
+        to ensure it is a type or a tuple of types. Returns a string
+        description of any problems found.
+        """
+        problems = ""
+        # --- start with the things that are types
+        if t in (Iterable, Sized, Container, Callable, Generator, Iterator):
+            # note: these collections.abc types *are* types
+            problems += f"{key}: the collections.abc type {t} in {called_from} is unsupported.\n"
+        elif t in (Any,):
+            # Any is also an instance of type
+            problems += f"{key}: please use 'object' rather than 'typing.Any'.\n"
+        elif isinstance(t, type):
+            pass  # Fantastic!
+        # --- then the things that are not types
+        elif isinstance(t, tuple):
+            for element in t:
+                problems += check_members(key, element)
+        elif t in (
+            # note: these typing types *are not* types
+            TypingSequence,
+            TypingSet,
+            TypingMapping,
+            TypingIterable,
+            Union,
+            Optional,
+        ):
+            problems += (
+                f"{key}: Only use the collection.abc types: {t} in {called_from}.\n"
+            )
+        else:
+            problems += f"{key}: Malformed typing '{t}' in {called_from}.\n"
+        return problems
+    problems = ""
+    for key, value in expected.items():
+        if not isinstance(key, str):
+            problems += f"Key '{key}' is not a string - {called_from=}.\n"
+            continue
+        problems += check_members(key, value)
+        if not _check_expectations(value):
+            problems += f"{key}: Malformed '{value}' in {called_from}.\n"
+    if problems:
+        # Other than testing, we want to raise an exception here
+        statement = (
+            "Expected types validation failed "
+            + f"(this is an internal package error):\n{problems}"
+        )
+        if not module_testing:
+            raise ValueError(statement)
+        print(statement)
+# === keyword validation: (1) if expected, (2) of the right type ===
+def _check_tuple(
+    value: Any,
+    typeinfo: NestedTypeTuple,  # we know this is a tuple
+) -> bool:
+    """
+    Check the value against the expected tuple type.
+    """
+    check_sequence = check_mapping = False
+    for thistype in typeinfo:
+        if check_mapping or check_sequence:  # the guard-rail
+            if not isinstance(thistype, tuple):
+                return False
+        if check_sequence and isinstance(thistype, tuple):
+            for v in value:
+                check = _type_check_kwargs(v, thistype)
+                if not check:
+                    check_sequence = False
+                    continue
+            return True
+        if check_mapping and isinstance(thistype, tuple):
+            for k, v in value.items():
+                check = _type_check_kwargs(k, thistype[0]) and _type_check_kwargs(
+                    v, thistype[1]
+                )
+                if not check:
+                    check_mapping = False
+                    continue
+            return True
+        if isinstance(thistype, type) and isinstance(value, thistype):
+            if thistype in NOT_SEQUENCE:
+                return True
+            if issubclass(thistype, (Sequence, Set)):
+                check_sequence = True
+                continue
+            if issubclass(thistype, Mapping):
+                check_mapping = True
+                continue
+            return True
+    return False
+def _type_check_kwargs(
+    value: Any,
+    typeinfo: type | NestedTypeTuple,
+) -> bool:
+    """
+    Check the type of the value against the expected type.
+    """
+    # --- the simple case
+    if isinstance(typeinfo, type):
+        return isinstance(value, typeinfo)
+    # --- complex
+    if isinstance(typeinfo, tuple):
+        return _check_tuple(value, typeinfo)
+    return False
+def validate_kwargs(
+    expected: ExpectedTypeDict,
+    called_from: str,
+    **kwargs,
+) -> None:
+    """
+    This function is used to validate the keyword arguments.
+    To check we don't have unexpected keyword arguments, and
+    to check that the values are of the expected type.
+    Arguments
+    - expected: ExpectedTypeDict - the expected keyword arguments and their types.
+    - called_from: str - the name of the function that called this function,
+    - **kwargs - the keyword arguments to be validated.
+    It is not intended to be used by the user.
+    """
+    problems = ""
+    for key, value in kwargs.items():
+        if key == REPORT_KWARGS and isinstance(value, bool):
+            # This is a special case - and always okay if the value is boolean
+            continue
+        if key not in expected:
+            problems += (
+                f"{key}: unexpected keyword argument with {value=}in {called_from}.\n"
+            )
+            continue
+        if not _type_check_kwargs(value, expected[key]):
+            problems += (
+                f"{key}: with {value=} had the type "
+                f"'{type(value)}' in {called_from}. Expected: {expected[key]}\n"
+            )
+    if problems:
+        # don't raise an exception - just warn instead
+        statement = f"Keyword argument validation issues:\n{problems}"
+        print(statement)
+# --- test code
+if __name__ == "__main__":
+    # Self-test, run only when this module is executed as a script.
+    # Test the type_check_kwargs function
+    # With module_testing set, validate_expected() prints the problems
+    # it finds rather than raising a ValueError.
+    module_testing = True  # pylint: disable=invalid-name
+    # --- test the validate_expected() function
+    expected_gb: ExpectedTypeDict = {
+        # - these ones should pass
+        "good1": str,
+        "good2": (int, float),
+        "good3": bool,
+        "good4": (list, (float, int)),
+        "good5": (Sequence, (float, int)),
+        "good6": (dict, (str, int)),
+        "good7": (int, float, list, (int, float)),
+        "good8": (dict, (str, (int, float))),
+        "good9": (set, (str,)),
+        "good10": (frozenset, (str,), int, complex),
+        "good11": (dict, ((str, int), (int, float))),
+        "good12": (list, (dict, ((str, int), (list, (complex,))))),
+        "good13": (Sequence, (int, float), Set, (int, float)),
+        "good14": (Sequence, (str,)),
+        # - these ones should fail
+        "bad1": list,  # a container type on its own
+        "bad2": (int, (str, bool)),  # tuple not preceded by a container
+        "bad3": tuple(),  # empty tuple
+        "bad4": (int, float, set, bool, float),  # set without member tuple
+        "bad5": (list, float),  # list without member tuple
+        "bad6": ((list, tuple), (int, float)),  # tuple of container types
+        "bad7": (dict, (str, int), (int, float)),  # extra trailing tuple
+        "bad8": (TypingSequence, (int, float)),  # typing, not collections.abc
+        # "bad9": (list, [int, float]),
+        "bad10": (dict, (str,)),  # mapping tuple is not 2-part
+        "bad11": (Iterable, (int, float)),  # unsupported collections.abc type
+        # "bad12": Any,
+    }
+    validate_expected(expected_gb, "testing")
+    # --- test the validate_kwargs() function
+    # bad means the KWARGS are not of the expected type
+    expected_kw: ExpectedTypeDict = {
+        "good_1": str,
+        "good_2": (Sequence, (int, float), int, float),
+        "good_3": (int, float, Sequence, (int, float)),
+        "good_4": (Sequence, (str,)),
+        "bad_1": str,
+        "bad_2": (int, float),
+    }
+    validate_expected(expected_kw, "test")
+    kwargs_test = {
+        # - these ones should pass
+        "good_1": "hello",
+        "good_2": [1, 2, 3],
+        "good_3": (),
+        "good_4": ["fred", "bill", "janice"],
+        "report_kwargs": True,  # special case
+        # - these ones should fail
+        "missing": "hello",  # not a key of expected_kw
+        "bad_1": 3.14,
+        "bad_2": (3, 4),
+    }
+    validate_kwargs(expected_kw, "test", **kwargs_test)

mgplot/line_plot.py ADDED Viewed

@@ -0,0 +1,178 @@
+"""
+line_plot.py:
+Plot a series or a dataframe with lines.
+"""
+# --- imports
+from typing import Any
+from collections.abc import Sequence
+import matplotlib.pyplot as plt
+from pandas import DataFrame, Period
+from mgplot.settings import DataT, get_setting
+from mgplot.kw_type_checking import (
+    report_kwargs,
+    validate_kwargs,
+    validate_expected,
+    ExpectedTypeDict,
+)
+from mgplot.utilities import (
+    apply_defaults,
+    get_color_list,
+    get_axes,
+    annotate_series,
+    constrain_data,
+    check_clean_timeseries,
+)
+# --- constants
+# Names of the keyword arguments recognised by line_plot().
+DATA = "data"
+AX = "ax"
+STYLE, WIDTH, COLOR, ALPHA = "style", "width", "color", "alpha"
+ANNOTATE = "annotate"
+ROUNDING = "rounding"
+FONTSIZE = "fontsize"
+DROPNA = "dropna"
+DRAWSTYLE, MARKER, MARKERSIZE = "drawstyle", "marker", "markersize"
+PLOT_FROM = "plot_from"  # used to constrain the data to a starting point
+LEGEND = "legend"
+# Expected types for each keyword argument, in the kw_type_checking
+# notation: a tuple is a union of alternatives, and a container type
+# (Sequence, dict) is followed by a tuple of its member types.
+LP_KW_TYPES: ExpectedTypeDict = {
+    AX: (plt.Axes, type(None)),
+    STYLE: (str, Sequence, (str,)),
+    WIDTH: (float, int, Sequence, (float, int)),
+    COLOR: (str, Sequence, (str,)),
+    ALPHA: (float, Sequence, (float,)),
+    DRAWSTYLE: (str, Sequence, (str,), type(None)),
+    MARKER: (str, Sequence, (str,), type(None)),
+    MARKERSIZE: (float, Sequence, (float,), int, type(None)),
+    DROPNA: (bool, Sequence, (bool,)),
+    ANNOTATE: (bool, Sequence, (bool,)),
+    ROUNDING: (Sequence, (bool, int), int, bool, type(None)),
+    FONTSIZE: (Sequence, (str, int), str, int, type(None)),
+    PLOT_FROM: (int, Period, type(None)),
+    LEGEND: (dict, (str, object), bool, type(None)),
+}
+# Checked once, when the module is imported.
+validate_expected(LP_KW_TYPES, "line_plot")
+# --- functions
+def _get_style_width_color_etc(
+    item_count, num_data_points, **kwargs
+) -> tuple[dict[str, list | tuple], dict[str, Any]]:
+    """
+    Get the plot-line attributes arguemnts.
+    Returns a dictionary of lists of attributes for each line, and
+    a modified kwargs dictionary.
+    """
+    data_point_thresh = 151
+    defaults: dict[str, Any] = {
+        STYLE: "-",
+        WIDTH: (
+            get_setting("line_normal")
+            if num_data_points > data_point_thresh
+            else get_setting("line_wide")
+        ),
+        COLOR: kwargs.get(COLOR, get_color_list(item_count)),
+        ALPHA: 1.0,
+        DRAWSTYLE: None,
+        MARKER: None,
+        MARKERSIZE: 10,
+        DROPNA: True,
+        ANNOTATE: False,
+        ROUNDING: True,
+        FONTSIZE: "small",
+    }
+    return apply_defaults(item_count, defaults, kwargs)
+def line_plot(data: DataT, **kwargs) -> plt.Axes:
+    """
+    Build a single plot from the data passed in.
+    This can be a single- or multiple-line plot.
+    Return the axes object for the build.
+    Agruments:
+    - data: DataFrame | Series - data to plot
+    - kwargs:
+        - ax: plt.Axes | None - axes to plot on (optional)
+        - dropna: bool | list[bool] - whether to delete NAs frm the
+          data before plotting [optional]
+        - color: str | list[str] - line colors.
+        - width: float | list[float] - line widths [optional].
+        - style: str | list[str] - line styles [optional].
+        - alpha: float | list[float] - line transparencies [optional].
+        - marker: str | list[str] - line markers [optional].
+        - marker_size: float | list[float] - line marker sizes [optional].
+        - annotate: bool | list[bool] - whether to annotate a series.
+        - rounding: int | bool | list[int | bool] - number of decimal places
+          to round an annotation. If True, a default between 0 and 2 is
+          used.
+        - fontsize: int | str | list[int | str] - font size for the
+          annotation.
+        - drawstyle: str | list[str] - matplotlib line draw styles.
+    Returns:
+    - axes: plt.Axes - the axes object for the plot
+    """
+    # sanity checks
+    report_kwargs(called_from="line_plot", **kwargs)
+    data = check_clean_timeseries(data)
+    validate_kwargs(LP_KW_TYPES, called_from="line_plot", **kwargs)
+    # the data to be plotted:
+    df = DataFrame(data)  # really we are only plotting DataFrames
+    df, kwargs = constrain_data(df, **kwargs)
+    if df.empty:
+        print("Warning: No data to plot.")
+    # get the arguments for each line we will plot ...
+    item_count = len(df.columns)
+    num_data_points = len(df)
+    swce, kwargs = _get_style_width_color_etc(item_count, num_data_points, **kwargs)
+    # Let's plot
+    axes, kwargs = get_axes(**kwargs)  # get the axes to plot on
+    for i, column in enumerate(df.columns):
+        series = df[column]
+        series = series.dropna() if DROPNA in swce and swce[DROPNA][i] else series
+        if series.empty or series.isna().all():
+            continue
+        axes = series.plot(
+            ls=swce[STYLE][i],
+            lw=swce[WIDTH][i],
+            color=swce[COLOR][i],
+            alpha=swce[ALPHA][i],
+            marker=swce[MARKER][i],
+            ms=swce[MARKERSIZE][i],
+            drawstyle=swce[DRAWSTYLE][i],
+            ax=axes,
+        )
+        if swce[ANNOTATE][i] is None or not swce[ANNOTATE][i]:
+            continue
+        annotate_series(
+            series,
+            axes,
+            rounding=swce[ROUNDING][i],
+            color=swce[COLOR][i],
+            fontsize=swce[FONTSIZE][i],
+        )
+    # add a legend if requested
+    if len(df.columns) > 1:
+        kwargs[LEGEND] = kwargs.get(LEGEND, get_setting("legend"))
+    if LEGEND in kwargs and kwargs[LEGEND] is not None:
+        legend = kwargs[LEGEND]
+        if isinstance(legend, bool):
+            legend = get_setting("legend")
+        axes.legend(**legend)
+    return axes