PyPI - quasardb - Versions diffs - 3.14.2.dev4__cp311-cp311-macosx_11_0_arm64.whl → 3.14.2.dev6__cp311-cp311-macosx_11_0_arm64.whl - Mend

quasardb 3.14.2.dev4__cp311-cp311-macosx_11_0_arm64.whl → 3.14.2.dev6__cp311-cp311-macosx_11_0_arm64.whl

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of quasardb might be problematic. Click here for more details.

Files changed (33) hide show

quasardb/CMakeFiles/CMakeDirectoryInformation.cmake +2 -2
quasardb/Makefile +20 -20
quasardb/__init__.py +21 -7
quasardb/cmake_install.cmake +5 -5
quasardb/date/CMakeFiles/CMakeDirectoryInformation.cmake +2 -2
quasardb/date/CMakeFiles/Export/a52b05f964b070ee926bcad51d3288af/dateTargets.cmake +1 -1
quasardb/date/Makefile +20 -20
quasardb/date/cmake_install.cmake +5 -5
quasardb/date/dateTargets.cmake +1 -1
quasardb/extensions/writer.py +59 -61
quasardb/firehose.py +24 -22
quasardb/libqdb_api.dylib +0 -0
quasardb/numpy/__init__.py +262 -128
quasardb/pandas/__init__.py +145 -91
quasardb/pool.py +13 -2
quasardb/pybind11/CMakeFiles/CMakeDirectoryInformation.cmake +2 -2
quasardb/pybind11/Makefile +20 -20
quasardb/pybind11/cmake_install.cmake +2 -2
quasardb/quasardb.cpython-311-darwin.so +0 -0
quasardb/range-v3/CMakeFiles/CMakeDirectoryInformation.cmake +2 -2
quasardb/range-v3/CMakeFiles/Export/d94ef200eca10a819b5858b33e808f5b/range-v3-targets.cmake +1 -1
quasardb/range-v3/CMakeFiles/range.v3.headers.dir/build.make +17 -17
quasardb/range-v3/Makefile +25 -25
quasardb/range-v3/cmake_install.cmake +8 -8
quasardb/range-v3/range-v3-config.cmake +1 -1
quasardb/stats.py +245 -120
quasardb/table_cache.py +5 -1
{quasardb-3.14.2.dev4.dist-info → quasardb-3.14.2.dev6.dist-info}/METADATA +3 -2
quasardb-3.14.2.dev6.dist-info/RECORD +45 -0
{quasardb-3.14.2.dev4.dist-info → quasardb-3.14.2.dev6.dist-info}/WHEEL +1 -1
quasardb-3.14.2.dev4.dist-info/RECORD +0 -45
{quasardb-3.14.2.dev4.dist-info → quasardb-3.14.2.dev6.dist-info/licenses}/LICENSE.md +0 -0
{quasardb-3.14.2.dev4.dist-info → quasardb-3.14.2.dev6.dist-info}/top_level.txt +0 -0

quasardb/extensions/writer.py CHANGED Viewed

@@ -5,9 +5,10 @@ import numpy.ma as ma
 __all__ = []
 def _ensure_ctype(self, idx, ctype):
-    assert 'table' in self._legacy_state
-    infos = self._legacy_state['table'].list_columns()
+    assert "table" in self._legacy_state
+    infos = self._legacy_state["table"].list_columns()
     cinfo = infos[idx]
     ctype_data = copy.copy(ctype)
@@ -24,80 +25,81 @@ def _ensure_ctype(self, idx, ctype):
 def _legacy_next_row(self, table):
-    if 'pending' not in self._legacy_state:
-        self._legacy_state['pending'] = []
+    if "pending" not in self._legacy_state:
+        self._legacy_state["pending"] = []
-    if 'table' not in self._legacy_state:
-        self._legacy_state['table'] = table
+    if "table" not in self._legacy_state:
+        self._legacy_state["table"] = table
-    self._legacy_state['pending'].append({'by_index': {}})
+    self._legacy_state["pending"].append({"by_index": {}})
     # Return reference to the row inside the buffer
-    return self._legacy_state['pending'][-1]
+    return self._legacy_state["pending"][-1]
 def _legacy_current_row(self):
-    return self._legacy_state['pending'][-1]
+    return self._legacy_state["pending"][-1]
 def _legacy_start_row(self, table, x):
     row = _legacy_next_row(self, table)
-    assert '$timestamp' not in row
-    row['$timestamp'] = x
+    assert "$timestamp" not in row
+    row["$timestamp"] = x
 def _legacy_set_double(self, idx, x):
     _ensure_ctype(self, idx, quasardb.ColumnType.Double)
     assert isinstance(x, float)
-    assert idx not in _legacy_current_row(self)['by_index']
-    _legacy_current_row(self)['by_index'][idx] = x
+    assert idx not in _legacy_current_row(self)["by_index"]
+    _legacy_current_row(self)["by_index"][idx] = x
 def _legacy_set_int64(self, idx, x):
     _ensure_ctype(self, idx, quasardb.ColumnType.Int64)
     assert isinstance(x, int)
-    assert idx not in _legacy_current_row(self)['by_index']
-    _legacy_current_row(self)['by_index'][idx] = x
+    assert idx not in _legacy_current_row(self)["by_index"]
+    _legacy_current_row(self)["by_index"][idx] = x
 def _legacy_set_timestamp(self, idx, x):
     _ensure_ctype(self, idx, quasardb.ColumnType.Timestamp)
-    assert idx not in _legacy_current_row(self)['by_index']
-    _legacy_current_row(self)['by_index'][idx] = x
+    assert idx not in _legacy_current_row(self)["by_index"]
+    _legacy_current_row(self)["by_index"][idx] = x
 def _legacy_set_string(self, idx, x):
     _ensure_ctype(self, idx, quasardb.ColumnType.String)
     assert isinstance(x, str)
-    assert idx not in _legacy_current_row(self)['by_index']
+    assert idx not in _legacy_current_row(self)["by_index"]
-    _legacy_current_row(self)['by_index'][idx] = x
+    _legacy_current_row(self)["by_index"][idx] = x
 def _legacy_set_blob(self, idx, x):
     _ensure_ctype(self, idx, quasardb.ColumnType.Blob)
     assert isinstance(x, bytes)
-    assert idx not in _legacy_current_row(self)['by_index']
+    assert idx not in _legacy_current_row(self)["by_index"]
-    _legacy_current_row(self)['by_index'][idx] = x
+    _legacy_current_row(self)["by_index"][idx] = x
 def _legacy_push(self):
-    if 'pending' not in self._legacy_state:
+    if "pending" not in self._legacy_state:
         # Extremely likely default case, no "old" rows
         return
-    assert 'table' in self._legacy_state
-    table = self._legacy_state['table']
+    assert "table" in self._legacy_state
+    table = self._legacy_state["table"]
     # Some useful constants
-    dtype_by_ctype = {quasardb.ColumnType.Double: np.dtype('float64'),
-                      quasardb.ColumnType.Int64: np.dtype('int64'),
-                      quasardb.ColumnType.Timestamp: np.dtype('datetime64[ns]'),
-                      quasardb.ColumnType.String: np.dtype('unicode'),
-                      quasardb.ColumnType.Symbol: np.dtype('unicode'),
-                      quasardb.ColumnType.Blob: np.dtype('bytes')
-                    }
+    dtype_by_ctype = {
+        quasardb.ColumnType.Double: np.dtype("float64"),
+        quasardb.ColumnType.Int64: np.dtype("int64"),
+        quasardb.ColumnType.Timestamp: np.dtype("datetime64[ns]"),
+        quasardb.ColumnType.String: np.dtype("unicode"),
+        quasardb.ColumnType.Symbol: np.dtype("unicode"),
+        quasardb.ColumnType.Blob: np.dtype("bytes"),
+    }
     ctype_by_idx = {}
     cinfos = table.list_columns()
@@ -107,31 +109,30 @@ def _legacy_push(self):
     all_idx = set(ctype_by_idx.keys())
     # Prepare data structure
-    pivoted = {'$timestamp': [],
-               'by_index': {}}
+    pivoted = {"$timestamp": [], "by_index": {}}
     for i in all_idx:
-        pivoted['by_index'][i] = []
+        pivoted["by_index"][i] = []
     # Do the actual pivot
-    for row in self._legacy_state['pending']:
-        assert '$timestamp' in row
-        assert 'by_index' in row
+    for row in self._legacy_state["pending"]:
+        assert "$timestamp" in row
+        assert "by_index" in row
-        pivoted['$timestamp'].append(row['$timestamp'])
+        pivoted["$timestamp"].append(row["$timestamp"])
-        for idx in pivoted['by_index'].keys():
-            val = row['by_index'].get(idx, None)
-            pivoted['by_index'][idx].append(val)
+        for idx in pivoted["by_index"].keys():
+            val = row["by_index"].get(idx, None)
+            pivoted["by_index"][idx].append(val)
     # Validation / verification, not strictly necessary. Effectively
     # ensures that we have the exact same amount of values for every
     # column
-    for xs in pivoted['by_index'].values():
-        assert len(xs) == len(pivoted['$timestamp'])
+    for xs in pivoted["by_index"].values():
+        assert len(xs) == len(pivoted["$timestamp"])
     column_data = []
-    for idx,xs in pivoted['by_index'].items():
+    for idx, xs in pivoted["by_index"].items():
         ctype = ctype_by_idx[idx]
         dtype = dtype_by_ctype[ctype]
@@ -141,22 +142,19 @@ def _legacy_push(self):
         xs_ = []
         if all(mask):
-            xs_ = ma.masked_all(len(xs),
-                                dtype=dtype)
+            xs_ = ma.masked_all(len(xs), dtype=dtype)
         else:
             xs_ = ma.masked_array(data=np.array(xs, dtype), mask=mask)
-        assert len(xs_) == len(pivoted['$timestamp'])
+        assert len(xs_) == len(pivoted["$timestamp"])
         column_data.append(xs_)
     push_data = quasardb.WriterData()
-    index = np.array(pivoted['$timestamp'], np.dtype('datetime64[ns]'))
+    index = np.array(pivoted["$timestamp"], np.dtype("datetime64[ns]"))
     push_data.append(table, index, column_data)
     self._legacy_state = {}
     return push_data
@@ -180,14 +178,14 @@ def extend_writer(x):
     in C++ with few benefits.
     """
-    x.start_row      = _legacy_start_row
-    x.set_double     = _legacy_set_double
-    x.set_int64      = _legacy_set_int64
-    x.set_string     = _legacy_set_string
-    x.set_blob       = _legacy_set_blob
-    x.set_timestamp  = _legacy_set_timestamp
-    x.push           = _wrap_fn(x.push, _legacy_push)
-    x.push_fast      = _wrap_fn(x.push_fast, _legacy_push)
-    x.push_async     = _wrap_fn(x.push_async, _legacy_push)
-    x.push_truncate  = _wrap_fn(x.push_truncate, _legacy_push)
+    x.start_row = _legacy_start_row
+    x.set_double = _legacy_set_double
+    x.set_int64 = _legacy_set_int64
+    x.set_string = _legacy_set_string
+    x.set_blob = _legacy_set_blob
+    x.set_timestamp = _legacy_set_timestamp
+    x.push = _wrap_fn(x.push, _legacy_push)
+    x.push_fast = _wrap_fn(x.push_fast, _legacy_push)
+    x.push_async = _wrap_fn(x.push_async, _legacy_push)
+    x.push_truncate = _wrap_fn(x.push_truncate, _legacy_push)

quasardb/firehose.py CHANGED Viewed

@@ -6,15 +6,14 @@ import numpy as np
 FIREHOSE_TABLE = "$qdb.firehose"
 POLL_INTERVAL = 0.1
-logger = logging.getLogger('quasardb.firehose')
+logger = logging.getLogger("quasardb.firehose")
 def _init():
     """
     Initialize our internal state.
     """
-    return {'last': None,
-            'seen': set()}
+    return {"last": None, "seen": set()}
 def _get_transactions_since(conn, table_name, last):
@@ -24,10 +23,12 @@ def _get_transactions_since(conn, table_name, last):
     """
     if last is None:
         q = "SELECT $timestamp, transaction_id, begin, end FROM \"{}\" WHERE table = '{}' ORDER BY $timestamp".format(
-            FIREHOSE_TABLE, table_name)
+            FIREHOSE_TABLE, table_name
+        )
     else:
         q = "SELECT $timestamp, transaction_id, begin, end FROM \"{}\" IN RANGE ({}, +1y) WHERE table = '{}' ORDER BY $timestamp".format(
-            FIREHOSE_TABLE, last['$timestamp'], table_name)
+            FIREHOSE_TABLE, last["$timestamp"], table_name
+        )
     return conn.query(q)
@@ -36,8 +37,7 @@ def _get_transaction_data(conn, table_name, begin, end):
     """
     Gets all data from a certain table.
     """
-    q = "SELECT * FROM \"{}\" IN RANGE ({}, {}) ".format(
-        table_name, begin, end)
+    q = 'SELECT * FROM "{}" IN RANGE ({}, {}) '.format(table_name, begin, end)
     return conn.query(q)
@@ -50,33 +50,35 @@ def _get_next(conn, table_name, state):
     # 3. For each of the transactions, pull in all data
     # 4. Concatenate all this data (in order of quasardb transaction)
-    txs = _get_transactions_since(conn, table_name, state['last'])
+    txs = _get_transactions_since(conn, table_name, state["last"])
     xs = list()
     for tx in txs:
-        txid = tx['transaction_id']
+        txid = tx["transaction_id"]
-        if state['last'] is not None and tx['$timestamp'] > state['last']['$timestamp']:
+        if state["last"] is not None and tx["$timestamp"] > state["last"]["$timestamp"]:
             # At this point we are guaranteed that the transaction we encounter is
             # 'new', will not conflict with any other transaction ids. It is thus
             # safe to reset the txid set.
-            state['seen'] = set()
-        if txid not in state['seen']:
-            xs = xs + _get_transaction_data(conn,
-                                            table_name,
-                                            tx['begin'],
-                                            # The firehose logs transaction `end` span as
-                                            # end inclusive, while our bulk reader and/or query
-                                            # language are end exclusive.
-                                            tx['end'] + np.timedelta64(1, 'ns'))
+            state["seen"] = set()
+        if txid not in state["seen"]:
+            xs = xs + _get_transaction_data(
+                conn,
+                table_name,
+                tx["begin"],
+                # The firehose logs transaction `end` span as
+                # end inclusive, while our bulk reader and/or query
+                # language are end exclusive.
+                tx["end"] + np.timedelta64(1, "ns"),
+            )
             # Because it is possible that multiple firehose changes are stored with the
             # exact same $timestamp, we also keep track of the actually seen
             # transaction ids.
-            state['seen'].add(txid)
+            state["seen"].add(txid)
-        state['last'] = tx
+        state["last"] = tx
     return (state, xs)

quasardb/libqdb_api.dylib CHANGED Viewed

Binary file