PyPI - vastdb - Versions diffs - 0.1.1__py3-none-any.whl → 0.1.3__py3-none-any.whl - Mend

vastdb 0.1.1__py3-none-any.whl → 0.1.3__py3-none-any.whl

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (23) hide show

vastdb/__init__.py +6 -2
vastdb/bench/test_perf.py +3 -3
vastdb/bucket.py +29 -15
vastdb/errors.py +40 -7
vastdb/internal_commands.py +194 -233
vastdb/schema.py +11 -6
vastdb/session.py +16 -1
vastdb/table.py +181 -77
vastdb/tests/test_duckdb.py +61 -0
vastdb/tests/test_imports.py +13 -1
vastdb/tests/test_projections.py +1 -0
vastdb/tests/test_sanity.py +2 -2
vastdb/tests/test_schemas.py +3 -3
vastdb/tests/test_tables.py +60 -50
vastdb/tests/test_util.py +39 -0
vastdb/tests/util.py +1 -4
vastdb/transaction.py +32 -6
vastdb/util.py +42 -6
{vastdb-0.1.1.dist-info → vastdb-0.1.3.dist-info}/METADATA +2 -5
{vastdb-0.1.1.dist-info → vastdb-0.1.3.dist-info}/RECORD +23 -21
{vastdb-0.1.1.dist-info → vastdb-0.1.3.dist-info}/WHEEL +1 -1
{vastdb-0.1.1.dist-info → vastdb-0.1.3.dist-info}/LICENSE +0 -0
{vastdb-0.1.1.dist-info → vastdb-0.1.3.dist-info}/top_level.txt +0 -0

vastdb/__init__.py CHANGED Viewed

@@ -1,7 +1,11 @@
 """VAST Database Python SDK."""
+import functools
 from . import session
 # A helper function, useful as a short-hand for Session c-tor: `session = vastdb.connect(...)`
-connect = session.Session
-connect.__name__ = 'connect'
+@functools.wraps(session.Session)
+def connect(*args, **kwargs):  # noqa: D103
+    return session.Session(*args, **kwargs)

vastdb/bench/test_perf.py CHANGED Viewed

@@ -12,7 +12,7 @@ log = logging.getLogger(__name__)
 @pytest.mark.benchmark
 def test_bench(session, clean_bucket_name, parquets_path, crater_path):
-    files = [str(parquets_path/f) for f in (parquets_path.glob('**/*.pq'))]
+    files = [str(parquets_path / f) for f in (parquets_path.glob('**/*.pq'))]
     with session.transaction() as tx:
         b = tx.bucket(clean_bucket_name)
@@ -22,8 +22,8 @@ def test_bench(session, clean_bucket_name, parquets_path, crater_path):
         s = time.time()
         pa_table = pa.Table.from_batches(t.select(columns=['sid'], predicate=t['sid'] == 10033007, config=config))
         e = time.time()
-        log.info("'SELECT sid from TABLE WHERE sid = 10033007' returned in %s seconds.", e-s)
+        log.info("'SELECT sid from TABLE WHERE sid = 10033007' returned in %s seconds.", e - s)
         if crater_path:
             with open(f'{crater_path}/bench_results', 'a') as f:
-                f.write(f"'SELECT sid FROM TABLE WHERE sid = 10033007' returned in {e-s} seconds")
+                f.write(f"'SELECT sid FROM TABLE WHERE sid = 10033007' returned in {e - s} seconds")
         assert pa_table.num_rows == 255_075

vastdb/bucket.py CHANGED Viewed

@@ -6,18 +6,14 @@ It is possible to list and access VAST snapshots generated over a bucket.
 import logging
 from dataclasses import dataclass
+from typing import TYPE_CHECKING, List, Optional
 from . import errors, schema, transaction
-log = logging.getLogger(__name__)
-@dataclass
-class Snapshot:
-    """VAST bucket-level snapshot."""
+if TYPE_CHECKING:
+    from .schema import Schema
-    name: str
-    bucket: "Bucket"
+log = logging.getLogger(__name__)
 @dataclass
@@ -27,7 +23,7 @@ class Bucket:
     name: str
     tx: "transaction.Transaction"
-    def create_schema(self, path: str, fail_if_exists=True) -> "schema.Schema":
+    def create_schema(self, path: str, fail_if_exists=True) -> "Schema":
         """Create a new schema (a container of tables) under this bucket."""
         if current := self.schema(path, fail_if_missing=False):
             if fail_if_exists:
@@ -36,9 +32,9 @@ class Bucket:
                 return current
         self.tx._rpc.api.create_schema(self.name, path, txid=self.tx.txid)
         log.info("Created schema: %s", path)
-        return self.schema(path)
+        return self.schema(path)  # type: ignore[return-value]
-    def schema(self, path: str, fail_if_missing=True) -> "schema.Schema":
+    def schema(self, path: str, fail_if_missing=True) -> Optional["Schema"]:
         """Get a specific schema (a container of tables) under this bucket."""
         s = self.schemas(path)
         log.debug("schema: %s", s)
@@ -51,14 +47,14 @@ class Bucket:
         log.debug("Found schema: %s", s[0].name)
         return s[0]
-    def schemas(self, name: str = None) -> ["schema.Schema"]:
+    def schemas(self, name: Optional[str] = None) -> List["Schema"]:
         """List bucket's schemas."""
         schemas = []
         next_key = 0
         exact_match = bool(name)
         log.debug("list schemas param: schema=%s, exact_match=%s", name, exact_match)
         while True:
-            bucket_name, curr_schemas, next_key, is_truncated, _ = \
+            _bucket_name, curr_schemas, next_key, is_truncated, _ = \
                 self.tx._rpc.api.list_schemas(bucket=self.name, next_key=next_key, txid=self.tx.txid,
                                                name_prefix=name, exact_match=exact_match)
             if not curr_schemas:
@@ -69,7 +65,22 @@ class Bucket:
         return [schema.Schema(name=name, bucket=self) for name, *_ in schemas]
-    def snapshots(self) -> [Snapshot]:
+    def snapshot(self, name, fail_if_missing=True) -> Optional["Bucket"]:
+        """Get snapshot by name (if exists)."""
+        snapshots, _is_truncated, _next_key = \
+            self.tx._rpc.api.list_snapshots(bucket=self.name, name_prefix=name, max_keys=1)
+        expected_name = f".snapshot/{name}"
+        exists = snapshots and snapshots[0] == expected_name + "/"
+        if not exists:
+            if fail_if_missing:
+                raise errors.MissingSnapshot(self.name, expected_name)
+            else:
+                return None
+        return Bucket(name=f'{self.name}/{expected_name}', tx=self.tx)
+    def snapshots(self) -> List["Bucket"]:
         """List bucket's snapshots."""
         snapshots = []
         next_key = 0
@@ -82,4 +93,7 @@ class Bucket:
             if not is_truncated:
                 break
-        return [Snapshot(name=snapshot, bucket=self) for snapshot in snapshots]
+        return [
+            Bucket(name=f'{self.name}/{snapshot.strip("/")}', tx=self.tx)
+            for snapshot in snapshots
+        ]

vastdb/errors.py CHANGED Viewed

@@ -26,6 +26,7 @@ log = logging.getLogger(__name__)
 class HttpError(Exception):
     code: str
     message: str
+    method: str
     url: str
     status: int  # HTTP status
     headers: requests.structures.CaseInsensitiveDict  # HTTP response headers
@@ -84,15 +85,33 @@ class InvalidArgument(Exception):
     pass
+class TooWideRow(InvalidArgument):
+    pass
 class Missing(Exception):
     pass
+class MissingTransaction(Missing):
+    pass
+class NotSupported(Exception):
+    pass
 @dataclass
 class MissingBucket(Missing):
     bucket: str
+@dataclass
+class MissingSnapshot(Missing):
+    bucket: str
+    snapshot: str
 @dataclass
 class MissingSchema(Missing):
     bucket: str
@@ -131,6 +150,19 @@ class TableExists(Exists):
     table: str
+@dataclass
+class NotSupportedCommand(NotSupported):
+    bucket: str
+    schema: str
+    table: str
+@dataclass
+class NotSupportedVersion(NotSupported):
+    err_msg: str
+    version: str
 ERROR_TYPES_MAP = {
     HttpStatus.BAD_REQUEST: BadRequest,
     HttpStatus.FOBIDDEN: Forbidden,
@@ -150,21 +182,22 @@ def from_response(res: requests.Response):
     log.debug("response: url='%s', code=%s, headers=%s, body='%s'", res.request.url, res.status_code, res.headers, res.text)
     # try to parse S3 XML response for the error details:
-    code = None
-    message = None
+    code_str = None
+    message_str = None
     if res.text:
         try:
             root = xml.etree.ElementTree.fromstring(res.text)
             code = root.find('Code')
-            code = code.text if code is not None else None
+            code_str = code.text if code is not None else None
             message = root.find('Message')
-            message = message.text if message is not None else None
+            message_str = message.text if message is not None else None
         except xml.etree.ElementTree.ParseError:
             log.debug("invalid XML: %r", res.text)
     kwargs = dict(
-        code=code,
-        message=message,
+        code=code_str,
+        message=message_str,
+        method=res.request.method,
         url=res.request.url,
         status=res.status_code,
         headers=res.headers,
@@ -172,4 +205,4 @@ def from_response(res: requests.Response):
     log.warning("RPC failed: %s", kwargs)
     status = HttpStatus(res.status_code)
     error_type = ERROR_TYPES_MAP.get(status, UnexpectedError)
-    raise error_type(**kwargs)
+    return error_type(**kwargs)

vastdb 0.1.1__py3-none-any.whl → 0.1.3__py3-none-any.whl

vastdb 0.1.1__py3-none-any.whl → 0.1.3__py3-none-any.whl