clickhouse-driver 0.2.1-cp39-cp39-win_amd64.whl → 0.2.8-cp39-cp39-win_amd64.whl

This diff shows the content of publicly available package versions as released to one of the supported registries. It is provided for informational purposes only and reflects the changes between the two versions as they appear in their public registries.
Files changed (85)
  1. clickhouse_driver/__init__.py +9 -9
  2. clickhouse_driver/block.py +227 -195
  3. clickhouse_driver/blockstreamprofileinfo.py +22 -22
  4. clickhouse_driver/bufferedreader.cp39-win_amd64.pyd +0 -0
  5. clickhouse_driver/bufferedwriter.cp39-win_amd64.pyd +0 -0
  6. clickhouse_driver/client.py +896 -666
  7. clickhouse_driver/clientinfo.py +119 -80
  8. clickhouse_driver/columns/arraycolumn.py +161 -150
  9. clickhouse_driver/columns/base.py +221 -147
  10. clickhouse_driver/columns/boolcolumn.py +7 -0
  11. clickhouse_driver/columns/datecolumn.py +108 -49
  12. clickhouse_driver/columns/datetimecolumn.py +202 -207
  13. clickhouse_driver/columns/decimalcolumn.py +116 -118
  14. clickhouse_driver/columns/enumcolumn.py +119 -119
  15. clickhouse_driver/columns/exceptions.py +12 -12
  16. clickhouse_driver/columns/floatcolumn.py +34 -34
  17. clickhouse_driver/columns/intcolumn.py +157 -157
  18. clickhouse_driver/columns/intervalcolumn.py +33 -33
  19. clickhouse_driver/columns/ipcolumn.py +118 -118
  20. clickhouse_driver/columns/jsoncolumn.py +37 -0
  21. clickhouse_driver/columns/largeint.cp39-win_amd64.pyd +0 -0
  22. clickhouse_driver/columns/lowcardinalitycolumn.py +142 -123
  23. clickhouse_driver/columns/mapcolumn.py +73 -58
  24. clickhouse_driver/columns/nestedcolumn.py +10 -0
  25. clickhouse_driver/columns/nothingcolumn.py +13 -13
  26. clickhouse_driver/columns/nullablecolumn.py +7 -7
  27. clickhouse_driver/columns/nullcolumn.py +15 -15
  28. clickhouse_driver/columns/numpy/base.py +47 -14
  29. clickhouse_driver/columns/numpy/boolcolumn.py +8 -0
  30. clickhouse_driver/columns/numpy/datecolumn.py +19 -12
  31. clickhouse_driver/columns/numpy/datetimecolumn.py +143 -145
  32. clickhouse_driver/columns/numpy/floatcolumn.py +24 -13
  33. clickhouse_driver/columns/numpy/intcolumn.py +43 -43
  34. clickhouse_driver/columns/numpy/lowcardinalitycolumn.py +96 -83
  35. clickhouse_driver/columns/numpy/service.py +58 -80
  36. clickhouse_driver/columns/numpy/stringcolumn.py +78 -76
  37. clickhouse_driver/columns/numpy/tuplecolumn.py +37 -0
  38. clickhouse_driver/columns/service.py +185 -131
  39. clickhouse_driver/columns/simpleaggregatefunctioncolumn.py +7 -7
  40. clickhouse_driver/columns/stringcolumn.py +73 -73
  41. clickhouse_driver/columns/tuplecolumn.py +63 -65
  42. clickhouse_driver/columns/util.py +60 -0
  43. clickhouse_driver/columns/uuidcolumn.py +64 -64
  44. clickhouse_driver/compression/__init__.py +28 -28
  45. clickhouse_driver/compression/base.py +87 -52
  46. clickhouse_driver/compression/lz4.py +21 -55
  47. clickhouse_driver/compression/lz4hc.py +9 -9
  48. clickhouse_driver/compression/zstd.py +20 -51
  49. clickhouse_driver/connection.py +784 -632
  50. clickhouse_driver/context.py +36 -36
  51. clickhouse_driver/dbapi/__init__.py +62 -62
  52. clickhouse_driver/dbapi/connection.py +99 -96
  53. clickhouse_driver/dbapi/cursor.py +370 -368
  54. clickhouse_driver/dbapi/errors.py +40 -40
  55. clickhouse_driver/dbapi/extras.py +73 -0
  56. clickhouse_driver/defines.py +55 -42
  57. clickhouse_driver/errors.py +453 -446
  58. clickhouse_driver/log.py +48 -44
  59. clickhouse_driver/numpy/block.py +8 -8
  60. clickhouse_driver/numpy/helpers.py +25 -25
  61. clickhouse_driver/numpy/result.py +123 -123
  62. clickhouse_driver/opentelemetry.py +43 -0
  63. clickhouse_driver/progress.py +38 -32
  64. clickhouse_driver/protocol.py +114 -105
  65. clickhouse_driver/queryprocessingstage.py +8 -8
  66. clickhouse_driver/reader.py +69 -69
  67. clickhouse_driver/readhelpers.py +26 -26
  68. clickhouse_driver/result.py +144 -144
  69. clickhouse_driver/settings/available.py +405 -405
  70. clickhouse_driver/settings/types.py +50 -50
  71. clickhouse_driver/settings/writer.py +34 -29
  72. clickhouse_driver/streams/compressed.py +88 -88
  73. clickhouse_driver/streams/native.py +102 -90
  74. clickhouse_driver/util/compat.py +39 -0
  75. clickhouse_driver/util/escape.py +94 -55
  76. clickhouse_driver/util/helpers.py +57 -57
  77. clickhouse_driver/varint.cp39-win_amd64.pyd +0 -0
  78. clickhouse_driver/writer.py +67 -67
  79. {clickhouse_driver-0.2.1.dist-info → clickhouse_driver-0.2.8.dist-info}/LICENSE +21 -21
  80. clickhouse_driver-0.2.8.dist-info/METADATA +201 -0
  81. clickhouse_driver-0.2.8.dist-info/RECORD +89 -0
  82. {clickhouse_driver-0.2.1.dist-info → clickhouse_driver-0.2.8.dist-info}/WHEEL +1 -1
  83. clickhouse_driver-0.2.1.dist-info/METADATA +0 -24
  84. clickhouse_driver-0.2.1.dist-info/RECORD +0 -80
  85. {clickhouse_driver-0.2.1.dist-info → clickhouse_driver-0.2.8.dist-info}/top_level.txt +0 -0
clickhouse_driver/log.py CHANGED
@@ -1,44 +1,48 @@
- import logging
-
- logger = logging.getLogger(__name__)
-
-
- log_priorities = (
-     'Unknown',
-     'Fatal',
-     'Critical',
-     'Error',
-     'Warning',
-     'Notice',
-     'Information',
-     'Debug',
-     'Trace'
- )
-
-
- def log_block(block):
-     if block is None:
-         return
-
-     column_names = [x[0] for x in block.columns_with_types]
-
-     for row in block.get_rows():
-         row = dict(zip(column_names, row))
-
-         if 1 <= row['priority'] <= 8:
-             priority = log_priorities[row['priority']]
-         else:
-             priority = row[0]
-
-         # thread_number in servers prior 20.x
-         thread_id = row.get('thread_id') or row['thread_number']
-
-         logger.info(
-             '[ %s ] [ %s ] {%s} <%s> %s: %s',
-             row['host_name'],
-             thread_id,
-             row['query_id'],
-             priority,
-             row['source'],
-             row['text']
-         )
+ import logging
+
+ logger = logging.getLogger(__name__)
+
+ # Keep in sync with ClickHouse priorities
+ # https://github.com/ClickHouse/ClickHouse/blob/master/src/Interpreters/InternalTextLogsQueue.cpp
+ log_priorities = (
+     'Unknown',
+     'Fatal',
+     'Critical',
+     'Error',
+     'Warning',
+     'Notice',
+     'Information',
+     'Debug',
+     'Trace',
+     'Test',
+ )
+
+ num_priorities = len(log_priorities)
+
+
+ def log_block(block):
+     if block is None:
+         return
+
+     column_names = [x[0] for x in block.columns_with_types]
+
+     for row in block.get_rows():
+         row = dict(zip(column_names, row))
+
+         if 1 <= row['priority'] <= num_priorities:
+             priority = log_priorities[row['priority']]
+         else:
+             priority = row[0]
+
+         # thread_number in servers prior 20.x
+         thread_id = row.get('thread_id') or row['thread_number']
+
+         logger.info(
+             '[ %s ] [ %s ] {%s} <%s> %s: %s',
+             row['host_name'],
+             thread_id,
+             row['query_id'],
+             priority,
+             row['source'],
+             row['text']
+         )
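In 0.2.8 the priority table gains a 'Test' level and the bounds check derives from len(log_priorities) instead of a hard-coded 8. To see what log_block emits, it can be fed a stand-in block; the FakeLogBlock class below is purely hypothetical (the real driver passes a native-protocol Block from the server's log stream):

```python
import logging

from clickhouse_driver.log import log_block

logging.basicConfig(level=logging.INFO)


class FakeLogBlock:
    # Hypothetical stand-in; column names match the fields
    # log_block() actually reads from server log blocks.
    columns_with_types = [
        ('host_name', 'String'), ('priority', 'Int8'),
        ('query_id', 'String'), ('thread_id', 'UInt64'),
        ('source', 'String'), ('text', 'String'),
    ]

    def get_rows(self):
        return [('ch1', 6, 'query-1', 42, 'executeQuery', 'Read 100 rows')]


log_block(FakeLogBlock())
# INFO:clickhouse_driver.log:[ ch1 ] [ 42 ] {query-1} <Information> executeQuery: Read 100 rows
```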
clickhouse_driver/numpy/block.py CHANGED
@@ -1,8 +1,8 @@
- import numpy as np
-
- from ..block import ColumnOrientedBlock
-
-
- class NumpyColumnOrientedBlock(ColumnOrientedBlock):
-     def transposed(self):
-         return np.transpose(self.data)
+ import numpy as np
+
+ from ..block import ColumnOrientedBlock
+
+
+ class NumpyColumnOrientedBlock(ColumnOrientedBlock):
+     def transposed(self):
+         return np.transpose(self.data)
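This file is textually identical on both sides; the churn is likely byte-level (e.g., line endings in the wheel). For reference, transposed() simply flips column-oriented data into row order:

```python
import numpy as np

# Two columns of three rows each, as ColumnOrientedBlock stores them.
data = [np.array([1, 2, 3]), np.array([4, 5, 6])]

print(np.transpose(data))
# [[1 4]
#  [2 5]
#  [3 6]]
```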
clickhouse_driver/numpy/helpers.py CHANGED
@@ -1,25 +1,25 @@
- import numpy as np
- import pandas as pd
-
-
- def column_chunks(columns, n):
-     for column in columns:
-         if not isinstance(column, (np.ndarray, pd.DatetimeIndex)):
-             raise TypeError(
-                 'Unsupported column type: {}. '
-                 'ndarray/DatetimeIndex is expected.'
-                 .format(type(column))
-             )
-
-     # create chunk generator for every column
-     chunked = [
-         iter(np.array_split(c, range(0, len(c), n)) if len(c) > n else [c])
-         for c in columns
-     ]
-
-     while True:
-         # get next chunk for every column
-         item = [next(column, []) for column in chunked]
-         if not any(len(x) for x in item):
-             break
-         yield item
+ import numpy as np
+ import pandas as pd
+
+
+ def column_chunks(columns, n):
+     for column in columns:
+         if not isinstance(column, (np.ndarray, pd.DatetimeIndex)):
+             raise TypeError(
+                 'Unsupported column type: {}. '
+                 'ndarray/DatetimeIndex is expected.'
+                 .format(type(column))
+             )
+
+     # create chunk generator for every column
+     chunked = [
+         iter(np.array_split(c, len(c) // n) if len(c) > n else [c])
+         for c in columns
+     ]
+
+     while True:
+         # get next chunk for every column
+         item = [next(column, []) for column in chunked]
+         if not any(len(x) for x in item):
+             break
+         yield item
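The only functional change here is the second argument to np.array_split. In 0.2.1 each column was split at explicit indices, which yields a leading empty chunk followed by chunks of at most n rows; in 0.2.8 it is split into len(c) // n nearly equal sections, so individual chunks may now exceed n rows. A quick comparison of the two calls:

```python
import numpy as np

c = np.arange(10)
n = 3

# 0.2.1 behaviour: split points at indices 0, 3, 6, 9.
old = np.array_split(c, range(0, len(c), n))
print([len(chunk) for chunk in old])  # [0, 3, 3, 3, 1]

# 0.2.8 behaviour: 10 // 3 == 3 nearly equal sections.
new = np.array_split(c, len(c) // n)
print([len(chunk) for chunk in new])  # [4, 3, 3]
```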
clickhouse_driver/numpy/result.py CHANGED
@@ -1,123 +1,123 @@
- from itertools import chain
-
- import numpy as np
- import pandas as pd
- from pandas.api.types import union_categoricals
-
- from ..progress import Progress
- from ..result import QueryResult
-
-
- class NumpyQueryResult(QueryResult):
-     """
-     Stores query result from multiple blocks as numpy arrays.
-     """
-
-     def store(self, packet):
-         block = getattr(packet, 'block', None)
-         if block is None:
-             return
-
-         # Header block contains no rows. Pick columns from it.
-         if block.num_rows:
-             if self.columnar:
-                 self.data.append(block.get_columns())
-             else:
-                 self.data.extend(block.get_rows())
-
-         elif not self.columns_with_types:
-             self.columns_with_types = block.columns_with_types
-
-     def get_result(self):
-         """
-         :return: stored query result.
-         """
-
-         for packet in self.packet_generator:
-             self.store(packet)
-
-         if self.columnar:
-             data = []
-             # Transpose to a list of columns, each column is list of chunks
-             for column_chunks in zip(*self.data):
-                 # Concatenate chunks for each column
-                 if isinstance(column_chunks[0], np.ndarray):
-                     column = np.concatenate(column_chunks)
-                 elif isinstance(column_chunks[0], pd.Categorical):
-                     column = union_categoricals(column_chunks)
-                 else:
-                     column = tuple(chain.from_iterable(column_chunks))
-                 data.append(column)
-         else:
-             data = self.data
-
-         if self.with_column_types:
-             return data, self.columns_with_types
-         else:
-             return data
-
-
- class NumpyProgressQueryResult(NumpyQueryResult):
-     """
-     Stores query result and progress information from multiple blocks.
-     Provides iteration over query progress.
-     """
-
-     def __init__(self, *args, **kwargs):
-         self.progress_totals = Progress()
-
-         super(NumpyProgressQueryResult, self).__init__(*args, **kwargs)
-
-     def __iter__(self):
-         return self
-
-     def __next__(self):
-         while True:
-             packet = next(self.packet_generator)
-             progress_packet = getattr(packet, 'progress', None)
-             if progress_packet:
-                 self.progress_totals.increment(progress_packet)
-                 return (
-                     self.progress_totals.rows, self.progress_totals.total_rows
-                 )
-             else:
-                 self.store(packet)
-
-     def get_result(self):
-         # Read all progress packets.
-         for _ in self:
-             pass
-
-         return super(NumpyProgressQueryResult, self).get_result()
-
-
- class NumpyIterQueryResult(object):
-     """
-     Provides iteration over returned data by chunks (streaming by chunks).
-     """
-
-     def __init__(
-             self, packet_generator,
-             with_column_types=False):
-         self.packet_generator = packet_generator
-         self.with_column_types = with_column_types
-
-         self.first_block = True
-         super(NumpyIterQueryResult, self).__init__()
-
-     def __iter__(self):
-         return self
-
-     def __next__(self):
-         packet = next(self.packet_generator)
-         block = getattr(packet, 'block', None)
-         if block is None:
-             return []
-
-         if self.first_block and self.with_column_types:
-             self.first_block = False
-             rv = [block.columns_with_types]
-             rv.extend(block.get_rows())
-             return rv
-         else:
-             return block.get_rows()
+ from itertools import chain
+
+ import numpy as np
+ import pandas as pd
+ from pandas.api.types import union_categoricals
+
+ from ..progress import Progress
+ from ..result import QueryResult
+
+
+ class NumpyQueryResult(QueryResult):
+     """
+     Stores query result from multiple blocks as numpy arrays.
+     """
+
+     def store(self, packet):
+         block = getattr(packet, 'block', None)
+         if block is None:
+             return
+
+         # Header block contains no rows. Pick columns from it.
+         if block.num_rows:
+             if self.columnar:
+                 self.data.append(block.get_columns())
+             else:
+                 self.data.extend(block.get_rows())
+
+         elif not self.columns_with_types:
+             self.columns_with_types = block.columns_with_types
+
+     def get_result(self):
+         """
+         :return: stored query result.
+         """
+
+         for packet in self.packet_generator:
+             self.store(packet)
+
+         if self.columnar:
+             data = []
+             # Transpose to a list of columns, each column is list of chunks
+             for column_chunks in zip(*self.data):
+                 # Concatenate chunks for each column
+                 if isinstance(column_chunks[0], np.ndarray):
+                     column = np.concatenate(column_chunks)
+                 elif isinstance(column_chunks[0], pd.Categorical):
+                     column = union_categoricals(column_chunks)
+                 else:
+                     column = tuple(chain.from_iterable(column_chunks))
+                 data.append(column)
+         else:
+             data = self.data
+
+         if self.with_column_types:
+             return data, self.columns_with_types
+         else:
+             return data
+
+
+ class NumpyProgressQueryResult(NumpyQueryResult):
+     """
+     Stores query result and progress information from multiple blocks.
+     Provides iteration over query progress.
+     """
+
+     def __init__(self, *args, **kwargs):
+         self.progress_totals = Progress()
+
+         super(NumpyProgressQueryResult, self).__init__(*args, **kwargs)
+
+     def __iter__(self):
+         return self
+
+     def __next__(self):
+         while True:
+             packet = next(self.packet_generator)
+             progress_packet = getattr(packet, 'progress', None)
+             if progress_packet:
+                 self.progress_totals.increment(progress_packet)
+                 return (
+                     self.progress_totals.rows, self.progress_totals.total_rows
+                 )
+             else:
+                 self.store(packet)
+
+     def get_result(self):
+         # Read all progress packets.
+         for _ in self:
+             pass
+
+         return super(NumpyProgressQueryResult, self).get_result()
+
+
+ class NumpyIterQueryResult(object):
+     """
+     Provides iteration over returned data by chunks (streaming by chunks).
+     """
+
+     def __init__(
+             self, packet_generator,
+             with_column_types=False):
+         self.packet_generator = packet_generator
+         self.with_column_types = with_column_types
+
+         self.first_block = True
+         super(NumpyIterQueryResult, self).__init__()
+
+     def __iter__(self):
+         return self
+
+     def __next__(self):
+         packet = next(self.packet_generator)
+         block = getattr(packet, 'block', None)
+         if block is None:
+             return []
+
+         if self.first_block and self.with_column_types:
+             self.first_block = False
+             rv = [block.columns_with_types]
+             rv.extend(block.get_rows())
+             return rv
+         else:
+             return block.get_rows()
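Like numpy/block.py, this file is textually unchanged between versions. Functionally, get_result() in columnar mode stitches per-block chunks back into whole columns, picking the concatenation strategy by chunk type: np.concatenate for plain arrays, union_categoricals for columns that arrive as pandas Categoricals (each chunk carries its own category-to-code mapping, so naive concatenation would misalign the codes). The two branches in isolation:

```python
import numpy as np
import pandas as pd
from pandas.api.types import union_categoricals

# Chunks of one numeric column from two blocks.
print(np.concatenate([np.array([1, 2]), np.array([3])]))
# [1 2 3]

# Chunks of one categorical (e.g., LowCardinality) column: merge the
# category mappings rather than concatenating raw codes.
merged = union_categoricals(
    [pd.Categorical(['a', 'b']), pd.Categorical(['b', 'c'])]
)
print(list(merged))  # ['a', 'b', 'b', 'c']
```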
clickhouse_driver/opentelemetry.py ADDED
@@ -0,0 +1,43 @@
+
+ class OpenTelemetryTraceContext(object):
+     traceparent_tpl = 'xx-xxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxx-xxxxxxxxxxxxxxxx-xx'
+     translation = str.maketrans('1234567890abcdef', 'xxxxxxxxxxxxxxxx')
+
+     def __init__(self, traceparent, tracestate):
+         # xx-xxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxx-xxxxxxxxxxxxxxxx-xx
+         # ^  ^                                ^                ^
+         # version  trace_id                   span_id          flags
+
+         self.trace_id = None  # UUID
+         self.span_id = None  # UInt64
+         self.tracestate = tracestate  # String
+         self.trace_flags = None  # UInt8
+
+         if traceparent is not None:
+             self.parse_traceparent(traceparent)
+
+         super(OpenTelemetryTraceContext, self).__init__()
+
+     def parse_traceparent(self, traceparent):
+         traceparent = traceparent.lower()
+
+         if len(traceparent) != len(self.traceparent_tpl):
+             raise ValueError('unexpected length {}, expected {}'.format(
+                 len(traceparent), len(self.traceparent_tpl)
+             ))
+
+         if traceparent.translate(self.translation) != self.traceparent_tpl:
+             raise ValueError(
+                 'Malformed traceparant header: {}'.format(traceparent)
+             )
+
+         parts = traceparent.split('-')
+         version = int(parts[0], 16)
+         if version != 0:
+             raise ValueError(
+                 'unexpected version {}, expected 00'.format(parts[0])
+             )
+
+         self.trace_id = (int(parts[1][16:], 16) << 64) + int(parts[1][:16], 16)
+         self.span_id = int(parts[2], 16)
+         self.trace_flags = int(parts[3], 16)
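The new class parses a W3C Trace Context traceparent header, validating its shape with a translation trick: every hex digit maps to 'x', so a well-formed header collapses to the template string. Note the trace_id assembly, which packs the two 64-bit halves low-half-first to match ClickHouse's UUID wire layout. Using the example header from the W3C specification:

```python
from clickhouse_driver.opentelemetry import OpenTelemetryTraceContext

ctx = OpenTelemetryTraceContext(
    '00-0af7651916cd43dd8448eb211c80319c-b7ad6b7169203331-01',
    'congo=t61rcWkgMzE',
)

print(format(ctx.span_id, 'x'))  # b7ad6b7169203331
print(ctx.trace_flags)           # 1 (sampled)
print(ctx.tracestate)            # congo=t61rcWkgMzE
```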
clickhouse_driver/progress.py CHANGED
@@ -1,32 +1,38 @@
- from . import defines
- from .varint import read_varint
-
-
- class Progress(object):
-     def __init__(self):
-         self.rows = 0
-         self.bytes = 0
-         self.total_rows = 0
-         self.written_rows = 0
-         self.written_bytes = 0
-
-         super(Progress, self).__init__()
-
-     def read(self, server_revision, fin):
-         self.rows = read_varint(fin)
-         self.bytes = read_varint(fin)
-
-         revision = server_revision
-         if revision >= defines.DBMS_MIN_REVISION_WITH_TOTAL_ROWS_IN_PROGRESS:
-             self.total_rows = read_varint(fin)
-
-         if revision >= defines.DBMS_MIN_REVISION_WITH_CLIENT_WRITE_INFO:
-             self.written_rows = read_varint(fin)
-             self.written_bytes = read_varint(fin)
-
-     def increment(self, another_progress):
-         self.rows += another_progress.rows
-         self.bytes += another_progress.bytes
-         self.total_rows += another_progress.total_rows
-         self.written_rows += another_progress.written_rows
-         self.written_bytes += another_progress.written_bytes
+ from . import defines
+ from .varint import read_varint
+
+
+ class Progress(object):
+     def __init__(self):
+         self.rows = 0
+         self.bytes = 0
+         self.total_rows = 0
+         self.written_rows = 0
+         self.written_bytes = 0
+         self.elapsed_ns = 0
+
+         super(Progress, self).__init__()
+
+     def read(self, server_info, fin):
+         self.rows = read_varint(fin)
+         self.bytes = read_varint(fin)
+
+         revision = server_info.used_revision
+         if revision >= defines.DBMS_MIN_REVISION_WITH_TOTAL_ROWS_IN_PROGRESS:
+             self.total_rows = read_varint(fin)
+
+         if revision >= defines.DBMS_MIN_REVISION_WITH_CLIENT_WRITE_INFO:
+             self.written_rows = read_varint(fin)
+             self.written_bytes = read_varint(fin)
+
+         if revision >= defines. \
+                 DBMS_MIN_PROTOCOL_VERSION_WITH_SERVER_QUERY_TIME_IN_PROGRESS:
+             self.elapsed_ns = read_varint(fin)
+
+     def increment(self, another_progress):
+         self.rows += another_progress.rows
+         self.bytes += another_progress.bytes
+         self.total_rows += another_progress.total_rows
+         self.written_rows += another_progress.written_rows
+         self.written_bytes += another_progress.written_bytes
+         self.elapsed_ns += another_progress.elapsed_ns
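read() now takes the whole server_info object (the negotiated revision lives on its used_revision attribute) and, for new enough servers, also consumes an elapsed_ns field. All progress fields travel as ClickHouse varints; the snippet below is a minimal sketch of the unsigned LEB128 decoding that read_varint performs on the wire (the driver's real implementation is the compiled varint extension module):

```python
import io


def read_varint_sketch(fin):
    # Unsigned LEB128: 7 payload bits per byte, least significant
    # group first; the high bit is set on every byte except the last.
    shift = 0
    result = 0
    while True:
        byte = fin.read(1)[0]
        result |= (byte & 0x7f) << shift
        if not byte & 0x80:
            return result
        shift += 7


assert read_varint_sketch(io.BytesIO(b'\xac\x02')) == 300
```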