PyPI - gcf-python - Versions diffs - 0.4.0__py3-none-any.whl → 0.5.0__py3-none-any.whl - Mend

gcf-python 0.4.0__py3-none-any.whl → 0.5.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (8) hide show

gcf/__init__.py CHANGED Viewed

@@ -40,13 +40,16 @@ from .delta import encode_delta
 from .encode import encode
 from .generic import encode_generic
 from .session import Session, encode_with_session
+from .decode_generic import decode_generic
 from .stream import StreamEncoder
+from .stream_generic import GenericStreamEncoder
 from .types import Components, DeltaPayload, Edge, Payload, Symbol
 __all__ = [
     "Components",
     "DecodeError",
     "DeltaPayload",
+    "GenericStreamEncoder",
     "Edge",
     "KIND_ABBREV",
     "KIND_EXPAND",
@@ -55,6 +58,7 @@ __all__ = [
     "StreamEncoder",
     "Symbol",
     "decode",
+    "decode_generic",
     "encode",
     "encode_delta",
     "encode_generic",

gcf/decode_generic.py ADDED Viewed

@@ -0,0 +1,255 @@
+"""GCF generic decoder: parses any GCF text (tabular or graph) back to Python objects."""
+from __future__ import annotations
+from typing import Any
+from .decode import decode
+def decode_generic(input_text: str) -> Any:
+    """Decode any GCF text back into Python objects.
+    Handles tabular arrays, key-value pairs, nested sections, inline
+    primitive arrays, and graph profile payloads.
+    Returns dicts, lists, and primitives matching the original structure.
+    """
+    input_text = input_text.rstrip("\n\r")
+    if not input_text:
+        return None
+    lines = input_text.split("\n")
+    # Graph profile fallback.
+    if lines[0].startswith("GCF "):
+        p = decode(input_text)
+        return {
+            "tool": p.tool,
+            "tokenBudget": p.token_budget,
+            "tokensUsed": p.tokens_used,
+            "packRoot": p.pack_root,
+            "symbols": [
+                {
+                    "qualifiedName": s.qualified_name,
+                    "kind": s.kind,
+                    "score": s.score,
+                    "provenance": s.provenance,
+                    "distance": s.distance,
+                }
+                for s in p.symbols
+            ],
+            "edges": [
+                {
+                    "source": e.source,
+                    "target": e.target,
+                    "edgeType": e.edge_type,
+                    **({"status": e.status} if e.status else {}),
+                }
+                for e in p.edges
+            ],
+        }
+    result: dict[str, Any] = {}
+    _parse_object(lines, 0, 0, result)
+    return result
+def _parse_object(lines: list[str], start: int, depth: int, out: dict[str, Any]) -> int:
+    indent = "  " * depth
+    i = start
+    while i < len(lines):
+        raw = lines[i].rstrip("\r")
+        if raw == "" or raw.startswith("# "):
+            i += 1
+            continue
+        if depth > 0 and not raw.startswith(indent):
+            break
+        content = raw[len(indent):] if depth > 0 else raw
+        if content.startswith("## _summary"):
+            i += 1
+            continue
+        if content.startswith("## "):
+            header = content[3:]
+            bracket_idx = header.find(" [")
+            if bracket_idx >= 0:
+                name = header[:bracket_idx]
+                rest = header[bracket_idx + 2:]
+                close_bracket = rest.find("]")
+                if close_bracket >= 0:
+                    after_bracket = rest[close_bracket + 1:]
+                    if after_bracket.startswith("{"):
+                        field_end = after_bracket.find("}")
+                        if field_end >= 0:
+                            fields = after_bracket[1:field_end].split(",")
+                            i += 1
+                            rows, consumed = _parse_tabular_rows(lines, i, depth, fields)
+                            out[name] = rows
+                            i += consumed
+                            continue
+                    else:
+                        count_str = rest[:close_bracket]
+                        if count_str == "0":
+                            out[name] = []
+                            i += 1
+                            continue
+                        i += 1
+                        items, consumed = _parse_non_uniform_array(lines, i, depth)
+                        out[name] = items
+                        i += consumed
+                        continue
+            name = header
+            bi = name.find(" [")
+            if bi >= 0:
+                name = name[:bi]
+            i += 1
+            nested: dict[str, Any] = {}
+            consumed = _parse_object(lines, i, depth + 1, nested)
+            out[name] = nested
+            i += consumed
+            continue
+        # Inline primitive array.
+        bracket_idx = content.find("[")
+        if bracket_idx > 0:
+            colon_idx = content.find("]: ")
+            if colon_idx > bracket_idx:
+                name = content[:bracket_idx]
+                vals_str = content[colon_idx + 3:]
+                out[name] = [_parse_value(v.strip()) for v in vals_str.split(",")]
+                i += 1
+                continue
+        # Key=value.
+        eq_idx = content.find("=")
+        if eq_idx > 0:
+            key = content[:eq_idx]
+            val = content[eq_idx + 1:]
+            out[key] = _parse_value(val)
+            i += 1
+            continue
+        i += 1
+    return i - start
+def _parse_tabular_rows(
+    lines: list[str], start: int, depth: int, fields: list[str]
+) -> tuple[list[Any], int]:
+    indent = "  " * depth
+    rows: list[Any] = []
+    i = start
+    while i < len(lines):
+        raw = lines[i].rstrip("\r")
+        if raw == "":
+            i += 1
+            continue
+        if depth > 0 and not raw.startswith(indent):
+            break
+        content = raw[len(indent):] if depth > 0 else raw
+        if content.startswith("## "):
+            break
+        if content.startswith("# "):
+            i += 1
+            continue
+        row_data = content
+        has_nested = False
+        if row_data.startswith("@"):
+            sp = row_data.find(" ")
+            if sp > 0:
+                row_data = row_data[sp + 1:]
+                has_nested = True
+        vals = row_data.split("|")
+        row: dict[str, Any] = {}
+        for j, f in enumerate(fields):
+            row[f] = _parse_value(vals[j]) if j < len(vals) else None
+        i += 1
+        if has_nested:
+            nested_indent = indent + "  "
+            while i < len(lines):
+                nl = lines[i].rstrip("\r")
+                if not nl.startswith(nested_indent):
+                    break
+                nc = nl[len(nested_indent):]
+                if nc.startswith("."):
+                    field_name = nc[1:]
+                    i += 1
+                    nested: dict[str, Any] = {}
+                    consumed = _parse_object(lines, i, depth + 2, nested)
+                    row[field_name] = nested
+                    i += consumed
+                else:
+                    break
+        rows.append(row)
+    return rows, i - start
+def _parse_non_uniform_array(
+    lines: list[str], start: int, depth: int
+) -> tuple[list[Any], int]:
+    indent = "  " * depth
+    items: list[Any] = []
+    i = start
+    while i < len(lines):
+        raw = lines[i].rstrip("\r")
+        if raw == "":
+            i += 1
+            continue
+        if depth > 0 and not raw.startswith(indent):
+            break
+        content = raw[len(indent):] if depth > 0 else raw
+        if content.startswith("## "):
+            break
+        if content.startswith("@"):
+            sp = content.find(" ")
+            if sp > 0:
+                items.append(_parse_value(content[sp + 1:]))
+            i += 1
+        else:
+            break
+    return items, i - start
+def _parse_value(s: str) -> Any:
+    if s == "-":
+        return None
+    if s == "true":
+        return True
+    if s == "false":
+        return False
+    if s == '""':
+        return ""
+    if len(s) >= 2 and s[0] == '"' and s[-1] == '"':
+        return s[1:-1].replace('\\"', '"').replace("\\\\", "\\")
+    try:
+        return int(s)
+    except ValueError:
+        pass
+    try:
+        return float(s)
+    except ValueError:
+        pass
+    return s

gcf/stream_generic.py ADDED Viewed

@@ -0,0 +1,111 @@
+"""GCF generic streaming encoder: zero-buffering tabular encode to any writable."""
+from __future__ import annotations
+import threading
+from typing import Any, Sequence
+class GenericStreamEncoder:
+    """Writes GCF tabular output incrementally as rows arrive.
+    Zero buffering: each row is written immediately. A trailer summary is
+    emitted on close() with the final counts.
+    Example::
+        enc = GenericStreamEncoder(sys.stdout)
+        enc.begin_array("employees", ["id", "name", "department", "salary"])
+        enc.write_row([1, "Alice", "Engineering", 95000])
+        enc.write_row([2, "Bob", "Sales", 72000])
+        enc.end_array()
+        enc.close()
+    """
+    def __init__(self, writer: Any) -> None:
+        self._w = writer
+        self._lock = threading.Lock()
+        self._sections: list[tuple[str, int]] = []
+        self._current: dict[str, Any] | None = None
+    def begin_array(self, name: str, fields: Sequence[str]) -> None:
+        """Start a tabular array section with deferred count [?]."""
+        with self._lock:
+            if self._current is not None:
+                self._end_array_locked()
+            self._w.write(f"## {name} [?]{{{','.join(fields)}}}\n")
+            self._current = {"name": name, "fields": list(fields), "count": 0}
+    def write_row(self, values: Sequence[Any]) -> None:
+        """Emit a single pipe-separated row immediately."""
+        with self._lock:
+            if self._current is None:
+                return
+            parts = [_format_value(v) for v in values]
+            self._w.write("|".join(parts) + "\n")
+            self._current["count"] += 1
+    def end_array(self) -> None:
+        """Close the current array section and record its count."""
+        with self._lock:
+            self._end_array_locked()
+    def write_kv(self, key: str, value: Any) -> None:
+        """Emit a key=value line immediately."""
+        with self._lock:
+            self._w.write(f"{key}={_format_value(value)}\n")
+    def write_section(self, name: str) -> None:
+        """Start a nested object section (## key)."""
+        with self._lock:
+            if self._current is not None:
+                self._end_array_locked()
+            self._w.write(f"## {name}\n")
+    def write_inline_array(self, name: str, values: Sequence[Any]) -> None:
+        """Emit a primitive array inline: name[N]: val1,val2,val3"""
+        with self._lock:
+            parts = [_format_value(v) for v in values]
+            self._w.write(f"{name}[{len(values)}]: {','.join(parts)}\n")
+    def close(self) -> None:
+        """Emit the ## _summary trailer with final counts."""
+        with self._lock:
+            if self._current is not None:
+                self._end_array_locked()
+            if not self._sections:
+                return
+            total_rows = 0
+            section_parts: list[str] = []
+            for name, count in self._sections:
+                section_parts.append(f"{name}:{count}")
+                total_rows += count
+            self._w.write(
+                f"## _summary rows={total_rows} sections={','.join(section_parts)}\n"
+            )
+    def _end_array_locked(self) -> None:
+        if self._current is None:
+            return
+        self._sections.append((self._current["name"], self._current["count"]))
+        self._current = None
+def _format_value(v: Any) -> str:
+    if v is None:
+        return "-"
+    if isinstance(v, bool):
+        return "true" if v else "false"
+    if isinstance(v, int):
+        return str(v)
+    if isinstance(v, float):
+        # Match Go's %g formatting
+        s = f"{v:g}"
+        return s
+    if isinstance(v, str):
+        if v == "":
+            return '""'
+        if "|" in v or "\n" in v:
+            return '"' + v.replace('"', '\\"') + '"'
+        return v
+    return str(v)

{gcf_python-0.4.0.dist-info → gcf_python-0.5.0.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: gcf-python
-Version: 0.4.0
+Version: 0.5.0
 Summary: Python implementation of GCF (Graph Compact Format): token-optimized wire format for LLM tool responses
 Project-URL: Homepage, https://github.com/blackwell-systems/gcf-python
 Project-URL: Documentation, https://blackwell-systems.github.io/gcf/
@@ -30,7 +30,7 @@ Description-Content-Type: text/markdown
 # gcf-python
-Python implementation of [GCF (Graph Compact Format)](https://gcformat.com/) — the most token-efficient wire format for LLMs. A drop-in alternative to JSON and TOON for any structured data.
+Python implementation of [GCF](https://gcformat.com/) — the most token-efficient wire format for LLMs. A drop-in alternative to JSON and TOON for any structured data.
 **79% fewer input tokens than JSON. 75% fewer output tokens. 52% smaller than TOON. 100% LLM comprehension at 500 symbols, where JSON scores 76.9% and TOON scores 92.3%.**
@@ -66,33 +66,21 @@ Payload: 50 symbols, 20 edges
 ### Quick Start
 ```python
-from gcf import encode, Payload, Symbol, Edge
+from gcf import encode_generic
-p = Payload(
-    tool="context_for_task",
-    token_budget=5000,
-    tokens_used=1847,
-    symbols=[
-        Symbol(qualified_name="pkg.AuthMiddleware", kind="function", score=0.78, provenance="lsp_resolved", distance=0),
-        Symbol(qualified_name="pkg.NewServer", kind="function", score=0.54, provenance="lsp_resolved", distance=1),
-    ],
-    edges=[
-        Edge(source="pkg.NewServer", target="pkg.AuthMiddleware", edge_type="calls"),
+output = encode_generic({
+    "employees": [
+        {"id": 1, "name": "Alice", "department": "Engineering", "salary": 95000},
+        {"id": 2, "name": "Bob", "department": "Sales", "salary": 72000},
     ],
-)
-output = encode(p)
+})
 ```
 Output:
 ```
-GCF tool=context_for_task budget=5000 tokens=1847 symbols=2 edges=1
-## targets
-@0 fn pkg.AuthMiddleware 0.78 lsp_resolved
-## related
-@1 fn pkg.NewServer 0.54 lsp_resolved
-## edges [1]
-@0<@1 calls
+## employees [2]{id,name,department,salary}
+1|Alice|Engineering|95000
+2|Bob|Sales|72000
 ```
 ## Decode

{gcf_python-0.4.0.dist-info → gcf_python-0.5.0.dist-info}/RECORD RENAMED Viewed

@@ -1,15 +1,17 @@
-gcf/__init__.py,sha256=K4n34s5a0cd0MnYng5UvoTaxT1wIjidv7KgUThELmP4,1596
+gcf/__init__.py,sha256=ihKGNwTM0cYDi3t2o4PJjcRjaRW-rE6LYZKPg_KAldE,1738
 gcf/cli.py,sha256=2hSTBqiYcn1_EgGXuO65MHiEGh0C4DRMvspTd2zUaso,4258
 gcf/constants.py,sha256=cmZ8YJSOB0im_eyfN8v4UvrLpBC6Fuf4cfcKZGbutxY,638
 gcf/decode.py,sha256=48G6XmBilGYl0-c_Xy7MX0iTwOxGW9bn3wC4UyNApc4,5465
+gcf/decode_generic.py,sha256=NWRhOPWHypCDw6BbnDq78J7QA7EmfuBhvRyDKxBLwXg,7292
 gcf/delta.py,sha256=xU0ujtSq1iF7yU8yk_WNQKh8iove-WUV_nKSuvW1XVk,1656
 gcf/encode.py,sha256=Oljb1r5b7SHmng1XYvcvuJMpaRfJVJ81VOyocPf_kAs,2915
 gcf/generic.py,sha256=Nf1Ii0pYS0dgZ4o2ghl-3Qhnms-kCKY2D3q-3-oGpe8,5454
 gcf/session.py,sha256=4_ARRL06Tg2CI8D2eyi0V5nFphFAFMfOKBXYnAbI6Nk,4690
 gcf/stream.py,sha256=DBzZrb9t5ldVEsvcRX90SY59Fm0PM4aPt4XBIrJ1Gro,5186
+gcf/stream_generic.py,sha256=udKtvj-YJXl_eG_KzMZ3g9_EBMS3BTcAmAnsczPJ90M,3826
 gcf/types.py,sha256=AWm-LQoSqLHAYtEjcAxWQZqJ4JXqNreLUKO2mJFgNMA,1465
-gcf_python-0.4.0.dist-info/METADATA,sha256=pucirOGE46EL70gW8PjeRe1uY4WyzSihRZrn-zryNqk,9074
-gcf_python-0.4.0.dist-info/WHEEL,sha256=mffPy8wBnZQn2VnJUU5jE99KsxaSfiyMHV9Yt0aLVxs,87
-gcf_python-0.4.0.dist-info/entry_points.txt,sha256=aFT6gqlkh8iGfM8cblE-LUMxHH08_v71IIoZtDdRIVA,37
-gcf_python-0.4.0.dist-info/licenses/LICENSE,sha256=txSvg3E4LugiB7MOOTci6WKd6wMOrOJTvaITeFJ2SgU,1074
-gcf_python-0.4.0.dist-info/RECORD,,
+gcf_python-0.5.0.dist-info/METADATA,sha256=M399fPoVeSL4AvQqm7HaR92rkVCilg5MC1jzqWHwSSg,8667
+gcf_python-0.5.0.dist-info/WHEEL,sha256=mffPy8wBnZQn2VnJUU5jE99KsxaSfiyMHV9Yt0aLVxs,87
+gcf_python-0.5.0.dist-info/entry_points.txt,sha256=aFT6gqlkh8iGfM8cblE-LUMxHH08_v71IIoZtDdRIVA,37
+gcf_python-0.5.0.dist-info/licenses/LICENSE,sha256=txSvg3E4LugiB7MOOTci6WKd6wMOrOJTvaITeFJ2SgU,1074
+gcf_python-0.5.0.dist-info/RECORD,,

{gcf_python-0.4.0.dist-info → gcf_python-0.5.0.dist-info}/WHEEL RENAMED Viewed

File without changes

{gcf_python-0.4.0.dist-info → gcf_python-0.5.0.dist-info}/entry_points.txt RENAMED Viewed

File without changes

{gcf_python-0.4.0.dist-info → gcf_python-0.5.0.dist-info}/licenses/LICENSE RENAMED Viewed

File without changes

gcf-python 0.4.0__py3-none-any.whl → 0.5.0__py3-none-any.whl

gcf-python 0.4.0__py3-none-any.whl → 0.5.0__py3-none-any.whl