PyPI - python-jsonpath - Versions diffs - 1.3.2__py3-none-any.whl → 2.0.1__py3-none-any.whl - Mend

python-jsonpath 1.3.2__py3-none-any.whl → 2.0.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (31)

jsonpath/__about__.py +1 -1
jsonpath/__init__.py +290 -8
jsonpath/_types.py +31 -0
jsonpath/cli.py +11 -1
jsonpath/env.py +100 -47
jsonpath/exceptions.py +78 -7
jsonpath/filter.py +78 -84
jsonpath/function_extensions/__init__.py +4 -2
jsonpath/function_extensions/_pattern.py +112 -0
jsonpath/function_extensions/keys.py +27 -8
jsonpath/function_extensions/match.py +11 -13
jsonpath/function_extensions/search.py +11 -13
jsonpath/function_extensions/starts_with.py +21 -0
jsonpath/lex.py +113 -64
jsonpath/lru_cache.py +130 -0
jsonpath/match.py +13 -0
jsonpath/parse.py +448 -302
jsonpath/patch.py +8 -3
jsonpath/path.py +48 -84
jsonpath/pointer.py +52 -55
jsonpath/segments.py +131 -0
jsonpath/selectors.py +448 -482
jsonpath/stream.py +68 -70
jsonpath/token.py +59 -61
jsonpath/unescape.py +134 -0
{python_jsonpath-1.3.2.dist-info → python_jsonpath-2.0.1.dist-info}/METADATA +7 -3
python_jsonpath-2.0.1.dist-info/RECORD +42 -0
python_jsonpath-1.3.2.dist-info/RECORD +0 -36
{python_jsonpath-1.3.2.dist-info → python_jsonpath-2.0.1.dist-info}/WHEEL +0 -0
{python_jsonpath-1.3.2.dist-info → python_jsonpath-2.0.1.dist-info}/entry_points.txt +0 -0
{python_jsonpath-1.3.2.dist-info → python_jsonpath-2.0.1.dist-info}/licenses/LICENSE.txt +0 -0

jsonpath/function_extensions/search.py CHANGED Viewed

@@ -1,21 +1,19 @@
 """The standard `search` function extension."""
-import re
+from ._pattern import AbstractRegexFilterFunction
-from jsonpath.function_extensions import ExpressionType
-from jsonpath.function_extensions import FilterFunction
+class Search(AbstractRegexFilterFunction):
+    """The standard `search` function."""
-class Search(FilterFunction):
-    """A type-aware implementation of the standard `search` function."""
+    def __call__(self, value: object, pattern: object) -> bool:
+        """Return `True` if _value_ matches _pattern_, or `False` otherwise."""
+        if not isinstance(value, str) or not isinstance(pattern, str):
+            return False
-    arg_types = [ExpressionType.VALUE, ExpressionType.VALUE]
-    return_type = ExpressionType.LOGICAL
+        _pattern = self.check_cache(pattern)
-    def __call__(self, string: str, pattern: str) -> bool:
-        """Return `True` if _string_ contains _pattern_, or `False` otherwise."""
-        try:
-            # re.search caches compiled patterns internally
-            return bool(re.search(pattern, string))
-        except (TypeError, re.error):
+        if _pattern is None:
             return False
+        return bool(_pattern.search(value))

jsonpath/function_extensions/starts_with.py ADDED Viewed

@@ -0,0 +1,21 @@
+"""The `startswith` function extension."""
+from jsonpath.function_extensions import ExpressionType
+from jsonpath.function_extensions import FilterFunction
+class StartsWith(FilterFunction):
+    """The `startswith` function extension."""
+    arg_types = [ExpressionType.VALUE, ExpressionType.VALUE]
+    return_type = ExpressionType.LOGICAL
+    def __call__(self, value: object, prefix: object) -> bool:
+        """Return `True` if `value` starts with `prefix`."""
+        if not isinstance(value, str) or not isinstance(prefix, str):
+            return False
+        try:
+            return value.startswith(prefix)
+        except AttributeError:
+            return False

jsonpath/lex.py CHANGED Viewed

@@ -10,14 +10,16 @@ from typing import Pattern
 from .exceptions import JSONPathSyntaxError
 from .token import TOKEN_AND
-from .token import TOKEN_BARE_PROPERTY
+from .token import TOKEN_COLON
 from .token import TOKEN_COMMA
 from .token import TOKEN_CONTAINS
 from .token import TOKEN_DDOT
+from .token import TOKEN_DOT
+from .token import TOKEN_DOT_KEY_PROPERTY
 from .token import TOKEN_DOT_PROPERTY
 from .token import TOKEN_DOUBLE_QUOTE_STRING
 from .token import TOKEN_EQ
-from .token import TOKEN_FAKE_ROOT
+from .token import TOKEN_ERROR
 from .token import TOKEN_FALSE
 from .token import TOKEN_FILTER
 from .token import TOKEN_FILTER_CONTEXT
@@ -25,26 +27,27 @@ from .token import TOKEN_FLOAT
 from .token import TOKEN_FUNCTION
 from .token import TOKEN_GE
 from .token import TOKEN_GT
-from .token import TOKEN_ILLEGAL
 from .token import TOKEN_IN
 from .token import TOKEN_INT
 from .token import TOKEN_INTERSECTION
 from .token import TOKEN_KEY
+from .token import TOKEN_KEY_NAME
 from .token import TOKEN_KEYS
+from .token import TOKEN_KEYS_FILTER
+from .token import TOKEN_LBRACKET
 from .token import TOKEN_LE
 from .token import TOKEN_LG
-from .token import TOKEN_LIST_SLICE
-from .token import TOKEN_LIST_START
 from .token import TOKEN_LPAREN
 from .token import TOKEN_LT
 from .token import TOKEN_MISSING
+from .token import TOKEN_NAME
 from .token import TOKEN_NE
 from .token import TOKEN_NIL
 from .token import TOKEN_NONE
 from .token import TOKEN_NOT
 from .token import TOKEN_NULL
 from .token import TOKEN_OR
-from .token import TOKEN_PROPERTY
+from .token import TOKEN_PSEUDO_ROOT
 from .token import TOKEN_RBRACKET
 from .token import TOKEN_RE
 from .token import TOKEN_RE_FLAGS
@@ -53,13 +56,10 @@ from .token import TOKEN_ROOT
 from .token import TOKEN_RPAREN
 from .token import TOKEN_SELF
 from .token import TOKEN_SINGLE_QUOTE_STRING
-from .token import TOKEN_SKIP
-from .token import TOKEN_SLICE_START
-from .token import TOKEN_SLICE_STEP
-from .token import TOKEN_SLICE_STOP
 from .token import TOKEN_TRUE
 from .token import TOKEN_UNDEFINED
 from .token import TOKEN_UNION
+from .token import TOKEN_WHITESPACE
 from .token import TOKEN_WILD
 from .token import Token
@@ -87,7 +87,7 @@ class Lexer:
     key_pattern = r"[\u0080-\uFFFFa-zA-Z_][\u0080-\uFFFFa-zA-Z0-9_-]*"
-    # `not` or !
+    # ! or `not`
     logical_not_pattern = r"(?:not\b)|!"
     # && or `and`
@@ -103,45 +103,50 @@ class Lexer:
         self.single_quote_pattern = r"'(?P<G_SQUOTE>(?:(?!(?<!\\)').)*)'"
         # .thing
-        self.dot_property_pattern = rf"\.(?P<G_PROP>{self.key_pattern})"
+        self.dot_property_pattern = rf"(?P<G_DOT>\.)(?P<G_PROP>{self.key_pattern})"
-        self.slice_list_pattern = (
-            r"(?P<G_LSLICE_START>\-?\d*)\s*"
-            r":\s*(?P<G_LSLICE_STOP>\-?\d*)\s*"
-            r"(?::\s*(?P<G_LSLICE_STEP>\-?\d*))?"
+        # .~thing
+        self.dot_key_pattern = (
+            r"(?P<G_DOT_KEY>\.)"
+            rf"(?P<G_KEY>{re.escape(env.keys_selector_token)})"
+            rf"(?P<G_PROP_KEY>{self.key_pattern})"
         )
         # /pattern/ or /pattern/flags
         self.re_pattern = r"/(?P<G_RE>.+?)/(?P<G_RE_FLAGS>[aims]*)"
         # func(
-        self.function_pattern = r"(?P<G_FUNC>[a-z][a-z_0-9]+)\(\s*"
+        self.function_pattern = r"(?P<G_FUNC>[a-z][a-z_0-9]+)(?P<G_FUNC_PAREN>\()"
-        self.rules = self.compile_rules()
+        self.rules = self.compile_strict_rules() if env.strict else self.compile_rules()
     def compile_rules(self) -> Pattern[str]:
         """Prepare regular expression rules."""
         env_tokens = [
             (TOKEN_ROOT, self.env.root_token),
-            (TOKEN_FAKE_ROOT, self.env.fake_root_token),
+            (TOKEN_PSEUDO_ROOT, self.env.pseudo_root_token),
             (TOKEN_SELF, self.env.self_token),
             (TOKEN_KEY, self.env.key_token),
             (TOKEN_UNION, self.env.union_token),
             (TOKEN_INTERSECTION, self.env.intersection_token),
             (TOKEN_FILTER_CONTEXT, self.env.filter_context_token),
             (TOKEN_KEYS, self.env.keys_selector_token),
+            (TOKEN_KEYS_FILTER, self.env.keys_filter_token),
         ]
         rules = [
             (TOKEN_DOUBLE_QUOTE_STRING, self.double_quote_pattern),
             (TOKEN_SINGLE_QUOTE_STRING, self.single_quote_pattern),
             (TOKEN_RE_PATTERN, self.re_pattern),
-            (TOKEN_LIST_SLICE, self.slice_list_pattern),
-            (TOKEN_FUNCTION, self.function_pattern),
+            (TOKEN_DOT_KEY_PROPERTY, self.dot_key_pattern),
             (TOKEN_DOT_PROPERTY, self.dot_property_pattern),
-            (TOKEN_FLOAT, r"-?\d+\.\d*(?:[eE][+-]?\d+)?"),
-            (TOKEN_INT, r"-?\d+(?P<G_EXP>[eE][+\-]?\d+)?\b"),
+            (
+                TOKEN_FLOAT,
+                r"(:?-?[0-9]+\.[0-9]+(?:[eE][+-]?[0-9]+)?)|(-?[0-9]+[eE]-[0-9]+)",
+            ),
+            (TOKEN_INT, r"-?[0-9]+(?:[eE]\+?[0-9]+)?"),
             (TOKEN_DDOT, r"\.\."),
+            (TOKEN_DOT, r"\."),
             (TOKEN_AND, self.logical_and_pattern),
             (TOKEN_OR, self.logical_or_pattern),
             *[
@@ -162,9 +167,10 @@ class Lexer:
             (TOKEN_CONTAINS, r"contains\b"),
             (TOKEN_UNDEFINED, r"undefined\b"),
             (TOKEN_MISSING, r"missing\b"),
-            (TOKEN_LIST_START, r"\["),
+            (TOKEN_LBRACKET, r"\["),
             (TOKEN_RBRACKET, r"]"),
             (TOKEN_COMMA, r","),
+            (TOKEN_COLON, r":"),
             (TOKEN_EQ, r"=="),
             (TOKEN_NE, r"!="),
             (TOKEN_LG, r"<>"),
@@ -173,12 +179,70 @@ class Lexer:
             (TOKEN_RE, r"=~"),
             (TOKEN_LT, r"<"),
             (TOKEN_GT, r">"),
-            (TOKEN_NOT, self.logical_not_pattern),
-            (TOKEN_BARE_PROPERTY, self.key_pattern),
+            (TOKEN_NOT, self.logical_not_pattern),  # Must go after "!="
+            (TOKEN_FUNCTION, self.function_pattern),
+            (TOKEN_NAME, self.key_pattern),  # Must go after reserved words
             (TOKEN_LPAREN, r"\("),
             (TOKEN_RPAREN, r"\)"),
-            (TOKEN_SKIP, r"[ \n\t\r\.]+"),
-            (TOKEN_ILLEGAL, r"."),
+            (TOKEN_WHITESPACE, r"[ \n\t\r]+"),
+            (TOKEN_ERROR, r"."),
+        ]
+        return re.compile(
+            "|".join(f"(?P<{token}>{pattern})" for token, pattern in rules),
+            re.DOTALL,
+        )
+    def compile_strict_rules(self) -> Pattern[str]:
+        """Prepare regular expression rules in strict mode."""
+        env_tokens = [
+            (TOKEN_ROOT, self.env.root_token),
+            (TOKEN_SELF, self.env.self_token),
+        ]
+        rules = [
+            (TOKEN_DOUBLE_QUOTE_STRING, self.double_quote_pattern),
+            (TOKEN_SINGLE_QUOTE_STRING, self.single_quote_pattern),
+            (TOKEN_DOT_PROPERTY, self.dot_property_pattern),
+            (
+                TOKEN_FLOAT,
+                r"(:?-?[0-9]+\.[0-9]+(?:[eE][+-]?[0-9]+)?)|(-?[0-9]+[eE]-[0-9]+)",
+            ),
+            (TOKEN_INT, r"-?[0-9]+(?:[eE]\+?[0-9]+)?"),
+            (TOKEN_DDOT, r"\.\."),
+            (TOKEN_DOT, r"\."),
+            (TOKEN_AND, r"&&"),
+            (TOKEN_OR, r"\|\|"),
+            *[
+                (token, re.escape(pattern))
+                for token, pattern in sorted(
+                    env_tokens, key=lambda x: len(x[1]), reverse=True
+                )
+                if pattern
+            ],
+            (TOKEN_WILD, r"\*"),
+            (TOKEN_FILTER, r"\?"),
+            (TOKEN_TRUE, r"true\b"),
+            (TOKEN_FALSE, r"false\b"),
+            (TOKEN_NULL, r"null\b"),
+            (TOKEN_LBRACKET, r"\["),
+            (TOKEN_RBRACKET, r"]"),
+            (TOKEN_COMMA, r","),
+            (TOKEN_COLON, r":"),
+            (TOKEN_EQ, r"=="),
+            (TOKEN_NE, r"!="),
+            (TOKEN_LG, r"<>"),
+            (TOKEN_LE, r"<="),
+            (TOKEN_GE, r">="),
+            (TOKEN_LT, r"<"),
+            (TOKEN_GT, r">"),
+            (TOKEN_NOT, r"!"),  # Must go after "!="
+            (TOKEN_FUNCTION, self.function_pattern),
+            (TOKEN_NAME, self.key_pattern),  # Must go after reserved words
+            (TOKEN_LPAREN, r"\("),
+            (TOKEN_RPAREN, r"\)"),
+            (TOKEN_WHITESPACE, r"[ \n\t\r]+"),
+            (TOKEN_ERROR, r"."),
         ]
         return re.compile(
@@ -196,31 +260,25 @@ class Lexer:
             if kind == TOKEN_DOT_PROPERTY:
                 yield _token(
-                    kind=TOKEN_PROPERTY,
-                    value=match.group("G_PROP"),
-                    index=match.start("G_PROP"),
+                    kind=TOKEN_DOT,
+                    value=match.group("G_DOT"),
+                    index=match.start("G_DOT"),
                 )
-            elif kind == TOKEN_BARE_PROPERTY:
                 yield _token(
-                    kind=TOKEN_BARE_PROPERTY,
-                    value=match.group(),
-                    index=match.start(),
-                )
-            elif kind == TOKEN_LIST_SLICE:
-                yield _token(
-                    kind=TOKEN_SLICE_START,
-                    value=match.group("G_LSLICE_START"),
-                    index=match.start("G_LSLICE_START"),
+                    kind=TOKEN_NAME,
+                    value=match.group("G_PROP"),
+                    index=match.start("G_PROP"),
                 )
+            elif kind == TOKEN_DOT_KEY_PROPERTY:
                 yield _token(
-                    kind=TOKEN_SLICE_STOP,
-                    value=match.group("G_LSLICE_STOP"),
-                    index=match.start("G_LSLICE_STOP"),
+                    kind=TOKEN_DOT,
+                    value=match.group("G_DOT_KEY"),
+                    index=match.start("G_DOT_KEY"),
                 )
                 yield _token(
-                    kind=TOKEN_SLICE_STEP,
-                    value=match.group("G_LSLICE_STEP") or "",
-                    index=match.start("G_LSLICE_STEP"),
+                    kind=TOKEN_KEY_NAME,
+                    value=match.group("G_PROP_KEY"),
+                    index=match.start("G_PROP_KEY"),
                 )
             elif kind == TOKEN_DOUBLE_QUOTE_STRING:
                 yield _token(
@@ -234,19 +292,6 @@ class Lexer:
                     value=match.group("G_SQUOTE"),
                     index=match.start("G_SQUOTE"),
                 )
-            elif kind == TOKEN_INT:
-                if match.group("G_EXP") and match.group("G_EXP")[1] == "-":
-                    yield _token(
-                        kind=TOKEN_FLOAT,
-                        value=match.group(),
-                        index=match.start(),
-                    )
-                else:
-                    yield _token(
-                        kind=TOKEN_INT,
-                        value=match.group(),
-                        index=match.start(),
-                    )
             elif kind == TOKEN_RE_PATTERN:
                 yield _token(
                     kind=TOKEN_RE_PATTERN,
@@ -270,13 +315,17 @@ class Lexer:
                     value=match.group("G_FUNC"),
                     index=match.start("G_FUNC"),
                 )
-            elif kind == TOKEN_SKIP:
-                continue
-            elif kind == TOKEN_ILLEGAL:
+                yield _token(
+                    kind=TOKEN_LPAREN,
+                    value=match.group("G_FUNC_PAREN"),
+                    index=match.start("G_FUNC_PAREN"),
+                )
+            elif kind == TOKEN_ERROR:
                 raise JSONPathSyntaxError(
                     f"unexpected token {match.group()!r}",
                     token=_token(
-                        TOKEN_ILLEGAL,
+                        TOKEN_ERROR,
                         value=match.group(),
                         index=match.start(),
                     ),

jsonpath/lru_cache.py ADDED Viewed

@@ -0,0 +1,130 @@
+"""An LRU cache with a mapping interface implemented using an ordered dict."""
+from collections import OrderedDict
+from threading import Lock
+from typing import Generic
+from typing import Iterator
+from typing import Optional
+from typing import Tuple
+from typing import TypeVar
+from typing import Union
+from typing import overload
+_KT = TypeVar("_KT")
+_VT = TypeVar("_VT")
+_T = TypeVar("_T")
+class LRUCache(Generic[_KT, _VT]):
+    """An LRU cache with a mapping interface."""
+    def __init__(self, capacity: int):
+        if capacity < 1:
+            raise ValueError("cache capacity must be greater than zero")
+        self.capacity = capacity
+        self._cache: OrderedDict[_KT, _VT] = OrderedDict()
+    def __getitem__(self, key: _KT) -> _VT:
+        value = self._cache[key]  # This will raise a KeyError if key is not cached
+        self._cache.move_to_end(key)
+        return value
+    def __setitem__(self, key: _KT, value: _VT) -> None:
+        try:
+            self._cache.move_to_end(key)
+        except KeyError:
+            if len(self._cache) >= self.capacity:
+                self._cache.popitem(last=False)
+        self._cache[key] = value
+    def __delitem__(self, key: _KT) -> None:
+        del self._cache[key]
+    def __len__(self) -> int:
+        return len(self._cache)
+    def __iter__(self) -> Iterator[_KT]:
+        return reversed(self._cache)
+    def __contains__(self, key: _KT) -> bool:
+        return key in self._cache
+    @overload
+    def get(self, key: _KT) -> Optional[_VT]: ...
+    @overload
+    def get(self, key: _KT, default: _VT) -> _VT: ...
+    @overload
+    def get(self, key: _KT, default: _T) -> Union[_VT, _T]: ...
+    def get(self, key: _KT, default: object = None) -> object:
+        """Return the cached value for _key_ if _key_ is in the cache, else default."""
+        try:
+            return self[key]
+        except KeyError:
+            return default
+    def keys(self) -> Iterator[_KT]:
+        """Return an iterator over this cache's keys."""
+        return reversed(self._cache.keys())
+    def values(self) -> Iterator[_VT]:
+        """Return an iterator over this cache's values."""
+        return reversed(self._cache.values())
+    def items(self) -> Iterator[Tuple[_KT, _VT]]:
+        """Return an iterator over this cache's key/value pairs."""
+        return reversed(self._cache.items())
+class ThreadSafeLRUCache(LRUCache[_KT, _VT]):
+    """A thread safe LRU cache."""
+    def __init__(self, capacity: int):
+        super().__init__(capacity)
+        self._lock = Lock()
+    def __getitem__(self, key: _KT) -> _VT:
+        with self._lock:
+            return super().__getitem__(key)
+    def __setitem__(self, key: _KT, value: _VT) -> None:
+        with self._lock:
+            return super().__setitem__(key, value)
+    def __delitem__(self, key: _KT) -> None:
+        with self._lock:
+            return super().__delitem__(key)
+    def __contains__(self, key: _KT) -> bool:
+        with self._lock:
+            return super().__contains__(key)
+    @overload
+    def get(self, key: _KT) -> Optional[_VT]: ...
+    @overload
+    def get(self, key: _KT, default: _VT) -> _VT: ...
+    @overload
+    def get(self, key: _KT, default: _T) -> Union[_VT, _T]: ...
+    def get(self, key: _KT, default: object = None) -> object:
+        """Return the cached value for _key_ if _key_ is in the cache, else default."""
+        # NOTE: self.__getitem__ is already acquiring the lock.
+        try:
+            return self[key]
+        except KeyError:
+            return default
+    def keys(self) -> Iterator[_KT]:
+        """Return an iterator over this cache's keys."""
+        with self._lock:
+            return super().keys()
+    def values(self) -> Iterator[_VT]:
+        """Return an iterator over this cache's values."""
+        with self._lock:
+            return super().values()
+    def items(self) -> Iterator[Tuple[_KT, _VT]]:
+        """Return an iterator over this cache's key/value pairs."""
+        with self._lock:
+            return super().items()

jsonpath/match.py CHANGED Viewed

@@ -11,6 +11,7 @@ from typing import Tuple
 from typing import Union
 from .pointer import JSONPointer
+from .serialize import canonical_string
 FilterContextVars = Mapping[str, Any]
 PathPart = Union[int, str]
@@ -69,6 +70,18 @@ class JSONPathMatch:
         """Append one or more children to this match."""
         self.children.extend(children)
+    def new_child(self, obj: object, key: Union[int, str]) -> JSONPathMatch:
+        """Return a new JSONPathMatch instance with this instance as its parent."""
+        return self.__class__(
+            filter_context=self.filter_context(),
+            obj=obj,
+            parent=self,
+            parts=self.parts + (key,),
+            path=self.path
+            + f"[{canonical_string(key) if isinstance(key, str) else key}]",
+            root=self.root,
+        )
     def filter_context(self) -> FilterContextVars:
         """Return filter context data for this match."""
         return self._filter_context

python-jsonpath 1.3.2__py3-none-any.whl → 2.0.1__py3-none-any.whl

python-jsonpath 1.3.2__py3-none-any.whl → 2.0.1__py3-none-any.whl