PyPI - ledgerkit - Versions diffs - 1.0.0.dev1__py3-none-any.whl - Mend

ledgerkit 1.0.0.dev1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (18) hide show

ledgerkit/__init__.py +51 -0
ledgerkit/__main__.py +12 -0
ledgerkit/_pandas_compat.py +21 -0
ledgerkit/checks.py +617 -0
ledgerkit/cli.py +448 -0
ledgerkit/commodity_style.py +274 -0
ledgerkit/editor_model.py +193 -0
ledgerkit/loader.py +311 -0
ledgerkit/models.py +459 -0
ledgerkit/parser.py +1547 -0
ledgerkit/reports.py +573 -0
ledgerkit/writer.py +97 -0
ledgerkit-1.0.0.dev1.dist-info/METADATA +203 -0
ledgerkit-1.0.0.dev1.dist-info/RECORD +18 -0
ledgerkit-1.0.0.dev1.dist-info/WHEEL +5 -0
ledgerkit-1.0.0.dev1.dist-info/entry_points.txt +2 -0
ledgerkit-1.0.0.dev1.dist-info/licenses/LICENSE +21 -0
ledgerkit-1.0.0.dev1.dist-info/top_level.txt +1 -0

ledgerkit/commodity_style.py ADDED Viewed

@@ -0,0 +1,274 @@
+"""Commodity display style inference and formatting for ledgerkit.
+Captures how a commodity's amounts should be formatted: symbol position,
+spacing, decimal mark, digit-group separator, and precision. Styles are
+inferred from the first amount seen in the journal or from an explicit
+`commodity` directive, then applied consistently throughout report output.
+"""
+from __future__ import annotations
+import re
+from dataclasses import dataclass
+from decimal import Decimal
+from typing import Optional
+# ---------------------------------------------------------------------------
+# Module-level helpers
+# ---------------------------------------------------------------------------
def _group_digits(digits: str, sep: str) -> str:
    """Return digits with sep placed between groups of three, counted from the right.

    Example: ``_group_digits("1234567", ",")`` gives ``"1,234,567"``. Strings of
    three characters or fewer (including the empty string) come back unchanged.
    """
    # Only the leftmost group may be shorter than three characters.
    lead = len(digits) % 3
    chunks = [digits[:lead]] if lead else []
    chunks.extend(digits[pos:pos + 3] for pos in range(lead, len(digits), 3))
    return sep.join(chunks)
+# ---------------------------------------------------------------------------
+# Regexes
+# ---------------------------------------------------------------------------
+# Matches a trailing suffix commodity symbol in a style/amount string.
+#
+# Purpose: identify an alphabetic commodity code (e.g. "EUR", "USD", "AAPL")
+#          at the end of an amount string, optionally preceded by whitespace.
+#          Used by parse_style_override() to extract the commodity before
+#          delegating to infer().
+#
+# Group breakdown:
+#   (1) ([A-Za-z][A-Za-z0-9]*)  — letter-started alphanumeric token;
+#                                  matches "EUR", "USD", "AAPL", "GBP" etc.
+#   \s*$                         — optional trailing whitespace then end of string
+#
+# Edge cases:
+#   - "1,234.56 EUR"  → matches "EUR"
+#   - "1.000,00 EUR"  → matches "EUR"
+#   - "$1,234.56"     → does NOT match (no trailing alphabetic token)
+#   - "bad input !!"  → does NOT match ("!!" is not alphanumeric)
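+#   - "EUR 1,234.56"  → does NOT match (EUR is not at the end)
+#   - "USD1000"       → matches the WHOLE token "USD1000" (digits that directly
+#                        follow the letters are part of the alphanumeric token)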
+_STYLE_SUFFIX_COMMODITY = re.compile(r"([A-Za-z][A-Za-z0-9]*)\s*$")
+# Matches a leading prefix commodity symbol in a style/amount string.
+#
+# Purpose: identify a non-numeric, non-separator commodity symbol (e.g. "$",
+#          "£", "€") at the start of an amount string, after an optional
+#          minus sign.  Used by parse_style_override() when no suffix
+#          alphabetic commodity is found.
+#
+# Group breakdown:
+#   (1) (-?)               — optional leading minus sign (consumed, not used here)
+#   (2) ([^\d,.\s-]+)      — one or more characters that are not digits, commas,
+#                            dots, whitespace, or minus; captures currency symbols
+#                            like "$", "£", "€", "¥"
+#
+# Edge cases:
+#   - "$1,234.56"     → group 2 = "$"
+#   - "£9,999.00"     → group 2 = "£"
+#   - "1,234.56 EUR"  → does NOT match (starts with a digit)
+#   - "-$1,234.56"    → group 1 = "-", group 2 = "$"
+#   - "EUR 1,234.56"  → group 2 = "EUR" (alphabetic codes match too, not only symbols)
+#   - "bad input !!"  → group 2 = "bad" (but caller validates digits are present)
+_STYLE_PREFIX_COMMODITY = re.compile(r"^(-?)([^\d,.\s-]+)")
+# ---------------------------------------------------------------------------
+# CommodityStyle
+# ---------------------------------------------------------------------------
@dataclass
class CommodityStyle:
    """Display style for a single commodity, inferred from journal data.

    Captures how amounts in this commodity should be formatted.

    Attributes:
        commodity: The commodity symbol or code (e.g. "$", "EUR").
        prefix: True when the symbol is written before the number.
        space: True when a single space separates symbol and number.
        decimal_mark: Character placed between integer and fractional digits.
        group_separator: Character inserted between groups of three integer
            digits; the empty string disables grouping.
        precision: Number of fractional digits to display; values of zero or
            below display no fractional part.
    """

    commodity: str
    prefix: bool = True
    space: bool = False
    decimal_mark: str = "."
    group_separator: str = ""
    precision: int = 2

    # ------------------------------------------------------------------
    # Formatting
    # ------------------------------------------------------------------
    def format(self, quantity: Decimal) -> str:
        """Return quantity rendered according to this commodity's display style.

        The magnitude is rounded (not truncated) to ``precision`` fractional
        digits for every precision, including zero. Negative amounts follow
        the hledger layout: the sign sits directly in front of the number, so
        a prefix symbol gives ``£-5.00`` / ``USD -5.00`` and a suffix symbol
        gives ``-5.00 EUR``.
        """
        negative = quantity < 0
        # Format once with '.'; the configured decimal mark is substituted
        # below. Clamping keeps the zero-precision path on the same rounding
        # rule as every other precision instead of truncating via int().
        places = max(self.precision, 0)
        int_str, _, frac_str = f"{abs(quantity):.{places}f}".partition(".")
        if self.group_separator:
            int_str = _group_digits(int_str, self.group_separator)
        number = int_str + self.decimal_mark + frac_str if frac_str else int_str

        sign = "-" if negative else ""
        gap = " " if self.space else ""
        if self.prefix:
            # Keep the configured gap for negatives too (USD -5.00, not USD-5.00).
            return f"{self.commodity}{gap}{sign}{number}"
        return f"{sign}{number}{gap}{self.commodity}"

    # ------------------------------------------------------------------
    # Inference
    # ------------------------------------------------------------------
    @classmethod
    def infer(cls, commodity: str, raw_amount_str: str) -> "CommodityStyle":
        """Infer a CommodityStyle from one raw amount string.

        Detects symbol side and spacing by locating ``commodity`` at the start
        or end of the text (after dropping one leading minus sign), then
        derives decimal mark, group separator and precision from what remains.
        When the commodity is found at neither end, the whole string is
        treated as the number and the prefix/no-space defaults are kept.
        """
        raw = raw_amount_str.strip()
        # A leading minus would hide a prefix symbol from startswith().
        body = raw[1:] if raw.startswith("-") else raw

        prefix = True
        space = False
        numeric = body
        if commodity and body.startswith(commodity):
            rest = body[len(commodity):]
            space = rest.startswith((" ", "\t"))
            numeric = rest.lstrip()
        elif commodity and body.endswith(commodity):
            prefix = False
            rest = body[: -len(commodity)]
            space = rest.endswith((" ", "\t"))
            numeric = rest.rstrip()

        decimal_mark, group_separator, precision = _infer_separators(numeric)
        return cls(
            commodity=commodity,
            prefix=prefix,
            space=space,
            decimal_mark=decimal_mark,
            group_separator=group_separator,
            precision=precision,
        )

    # ------------------------------------------------------------------
    # Override parsing
    # ------------------------------------------------------------------
    @classmethod
    def parse_style_override(cls, style_string: str) -> "CommodityStyle":
        """Parse a -c/--commodity-style override string in hledger format.

        Examples::
            "1,000.00 USD"   → suffix, space, dot decimal, comma group, precision 2
            "$1,000.00"      → prefix, no space, dot decimal, comma group, precision 2
            "1.000,00 EUR"   → suffix, space, comma decimal, dot group, precision 2
            "USD1000"        → prefix "USD", no space, precision 0

        Returns a CommodityStyle with the commodity extracted from the string.
        Raises ValueError if the string cannot be parsed or contains no digits.
        """
        s = style_string.strip()
        if not s:
            raise ValueError("cannot parse commodity style: empty string")
        # Must contain at least one digit to be a valid amount string.
        if not any(ch.isdigit() for ch in s):
            raise ValueError(
                f"cannot parse commodity style (no digits): {style_string!r}"
            )
        # Try suffix alphabetic commodity first (e.g. "1,000.00 USD"). The
        # suffix pattern also swallows digits glued to a leading code
        # ("USD1000"), so only accept it when a number precedes the match.
        m_suffix = _STYLE_SUFFIX_COMMODITY.search(s)
        if m_suffix and any(ch.isdigit() for ch in s[: m_suffix.start()]):
            return cls.infer(m_suffix.group(1), s)
        # Try prefix non-digit commodity symbol (e.g. "$1,000.00").
        m_prefix = _STYLE_PREFIX_COMMODITY.match(s)
        if m_prefix:
            return cls.infer(m_prefix.group(2), s)
        raise ValueError(f"cannot parse commodity style: {style_string!r}")
+# ---------------------------------------------------------------------------
+# Separator inference helper
+# ---------------------------------------------------------------------------
def _infer_separators(numeric: str) -> tuple[str, str, int]:
    """Return (decimal_mark, group_separator, precision) from a numeric string.

    Only the "." and "," characters in ``numeric`` are examined:

    * neither present            → (".", "", 0)
    * both present               → the rightmost one is the decimal mark, the
                                   other is the group separator
    * one kind, occurring twice
      or more ("1,234,567")      → it is a group separator (a number has at
                                   most one decimal mark); precision 0
    * one kind, occurring once,
      exactly three characters
      after it and not leading
      ("1.234", "1,234")         → treated as a group separator; precision 0
    * one kind, otherwise        → it is the decimal mark, no grouping

    Precision is the count of characters after the decimal mark.
    """
    last_dot = numeric.rfind(".")
    last_comma = numeric.rfind(",")

    if last_dot < 0 and last_comma < 0:
        # No separators at all (e.g. "100", "42").
        return ".", "", 0

    if last_dot >= 0 and last_comma >= 0:
        # Both present: the rightmost separator is the decimal mark.
        if last_dot > last_comma:
            return ".", ",", len(numeric) - last_dot - 1   # "1,234.56"
        return ",", ".", len(numeric) - last_comma - 1     # "1.234,56"

    # Exactly one kind of mark is present.
    mark, other = (".", ",") if last_dot >= 0 else (",", ".")
    last = max(last_dot, last_comma)
    digits_after = len(numeric) - last - 1
    repeated = numeric.count(mark) > 1
    if repeated or (digits_after == 3 and last > 0):
        # "1,234,567" / "1.234": the mark groups digits; the decimal mark is
        # assumed to be the other character.
        return other, mark, 0
    # "1.5", "100.00", "1,50", ".234": the mark is the decimal mark.
    return mark, "", digits_after

ledgerkit/editor_model.py ADDED Viewed

@@ -0,0 +1,193 @@
+"""In-memory editable document model for ledgerkit.
+Provides EditorDocument: load a journal file, mutate transactions in memory,
+validate individual transactions, and write changes back to disk faithfully.
+Intended for use by TUI/editor frontends. Not imported by any core module.
+"""
+from __future__ import annotations
+from pathlib import Path
+from ledgerkit.checks import CheckError, check_transaction_autobalanced
+from ledgerkit.models import Journal, SourceSpan, Transaction
+from ledgerkit.parser import parse_string
+from ledgerkit.writer import transaction_to_text
class EditorDocument:
    """An in-memory editable representation of a journal file.

    Attributes:
        path:    Resolved absolute path to the journal file.
        journal: Parsed Journal with all transactions (source_span populated).
        lines:   Current file content as a list of strings, one per line,
                 without newline characters.
        dirty:   True when lines differ from the last saved/loaded content.

    Line numbers stored in source_span are 1-based and inclusive; indexes into
    ``lines`` are 0-based.

    V1 limitation: include directives in the file are not processed; the file
    is parsed as-is with parse_string(). Use loader.load_journal() when
    full include support is required.
    """

    path: str
    journal: Journal
    lines: list[str]
    dirty: bool

    def __init__(self, path: str) -> None:
        """Load the journal at path; populate journal and lines."""
        self.path = str(Path(path).resolve())
        self._load()

    def _load(self) -> None:
        """Read self.path, rebuild lines and journal, and clear the dirty flag."""
        text = Path(self.path).read_text(encoding="utf-8")
        self.lines = text.splitlines()
        self.journal = parse_string(text, source_file=self.path)
        self.dirty = False

    # ------------------------------------------------------------------
    # Span refresh helpers
    # ------------------------------------------------------------------
    def _shift_spans_after(self, after_line: int, delta: int) -> None:
        """Shift source_span of every transaction that starts after after_line.

        Both start_line and end_line move by delta; transactions without a
        span, or starting at or before after_line, are left untouched.
        """
        for txn in self.journal.transactions:
            if txn.source_span and txn.source_span.start_line > after_line:
                txn.source_span = SourceSpan(
                    file=txn.source_span.file,
                    start_line=txn.source_span.start_line + delta,
                    end_line=txn.source_span.end_line + delta,
                )

    # ------------------------------------------------------------------
    # Mutation methods
    # ------------------------------------------------------------------
    def add_transaction(self, txn: Transaction) -> None:
        """Insert txn into self.lines in chronological order.

        Inserts after the last transaction whose date <= txn.date, separated
        by one blank line; when no such transaction exists the block is
        prepended to the file followed by a blank line. Updates
        self.journal.transactions, refreshes the spans of every transaction
        that moved, assigns txn.source_span, and sets dirty=True.
        """
        new_lines = transaction_to_text(txn).splitlines()
        n = len(new_lines)

        # Find the last transaction with date <= txn.date (ties broken by
        # position in the file). Only transactions with a span can anchor.
        positioned = sorted(
            (t for t in self.journal.transactions if t.source_span),
            key=lambda t: (t.date, t.source_span.start_line),  # type: ignore[union-attr]
        )
        insert_after: Transaction | None = None
        for t in positioned:
            if t.date <= txn.date:
                insert_after = t

        if insert_after is None or insert_after.source_span is None:
            # Prepend: n transaction lines plus one blank separator go in at
            # the top, so EVERY existing transaction moves down by n + 1.
            # txn is not in the journal yet, so it is not shifted itself.
            self.lines[0:0] = new_lines + [""]
            self._shift_spans_after(0, n + 1)
            txn.source_span = SourceSpan(
                file=self.path,
                start_line=1,
                end_line=n,
            )
        else:
            # end_line is 1-based inclusive, which equals the 0-based index
            # of the first line after the anchor block.
            anchor_end = insert_after.source_span.end_line
            self.lines[anchor_end:anchor_end] = [""] + new_lines
            txn.source_span = SourceSpan(
                file=self.path,
                start_line=anchor_end + 2,   # +1 for the blank line, +1 for 1-based
                end_line=anchor_end + 1 + n,
            )
            self._shift_spans_after(anchor_end, n + 1)

        self.journal.transactions.append(txn)
        self.journal.transactions.sort(
            key=lambda t: (t.date, t.source_span.start_line if t.source_span else 0)
        )
        self.dirty = True

    def update_transaction(self, original: Transaction, updated: Transaction) -> None:
        """Replace the lines occupied by original with the serialised form of updated.

        Refreshes all source_span values for transactions whose line numbers
        shifted. Sets dirty=True.

        Raises:
            ValueError: if original has no source_span, or (from list.index)
                if original is not in self.journal.transactions.
        """
        span = original.source_span
        if span is None:
            raise ValueError("update_transaction: original has no source_span")
        new_lines = transaction_to_text(updated).splitlines()
        old_count = span.end_line - span.start_line + 1
        delta = len(new_lines) - old_count
        # Replace lines in-place (start_line is 1-based → index = start_line - 1)
        self.lines[span.start_line - 1 : span.end_line] = new_lines
        updated.source_span = SourceSpan(
            file=span.file,
            start_line=span.start_line,
            end_line=span.start_line + len(new_lines) - 1,
        )
        # Replace in journal.transactions
        idx = self.journal.transactions.index(original)
        self.journal.transactions[idx] = updated
        # Shift all transactions that come after the modified block; updated
        # itself starts before span.end_line and is therefore not moved.
        if delta != 0:
            self._shift_spans_after(span.end_line, delta)
        self.dirty = True

    def delete_transaction(self, txn: Transaction) -> None:
        """Remove the lines occupied by txn and any immediately following blank line.

        Refreshes source_span values. Sets dirty=True.

        Raises:
            ValueError: if txn has no source_span, or (from list.remove) if
                txn is not in self.journal.transactions.
        """
        span = txn.source_span
        if span is None:
            raise ValueError("delete_transaction: txn has no source_span")
        start_idx = span.start_line - 1   # inclusive, 0-based
        end_idx = span.end_line           # exclusive, 0-based (span.end_line is 1-based inclusive)
        # Also consume a trailing blank separator line if present
        if end_idx < len(self.lines) and self.lines[end_idx] == "":
            end_idx += 1
        removed = end_idx - start_idx
        del self.lines[start_idx:end_idx]
        self.journal.transactions.remove(txn)
        self._shift_spans_after(span.start_line, -removed)
        self.dirty = True

    def save(self) -> None:
        """Write self.lines to self.path; set dirty=False.

        Non-empty content is always written with a terminating newline.
        """
        content = "\n".join(self.lines)
        if content and not content.endswith("\n"):
            content += "\n"
        Path(self.path).write_text(content, encoding="utf-8")
        self.dirty = False

    def reload(self) -> None:
        """Re-read self.path from disk and re-parse.

        Replaces self.journal and self.lines. Resets dirty=False.
        """
        self._load()

    def validate_transaction(self, txn: Transaction) -> list[CheckError]:
        """Run the autobalanced check on txn alone.

        Returns the (possibly empty) list of CheckError produced by
        check_transaction_autobalanced.
        """
        return check_transaction_autobalanced(txn)