chdb 3.6.0__cp38-abi3-macosx_10_15_x86_64.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of chdb might be problematic. Click here for more details.
- chdb/__init__.py +134 -0
- chdb/__main__.py +38 -0
- chdb/_chdb.abi3.so +0 -0
- chdb/dataframe/__init__.py +19 -0
- chdb/dataframe/query.py +356 -0
- chdb/dbapi/__init__.py +79 -0
- chdb/dbapi/connections.py +100 -0
- chdb/dbapi/constants/FIELD_TYPE.py +31 -0
- chdb/dbapi/constants/__init__.py +0 -0
- chdb/dbapi/converters.py +293 -0
- chdb/dbapi/cursors.py +351 -0
- chdb/dbapi/err.py +61 -0
- chdb/dbapi/times.py +20 -0
- chdb/libpybind11nonlimitedapi_chdb_3.10.dylib +0 -0
- chdb/libpybind11nonlimitedapi_chdb_3.11.dylib +0 -0
- chdb/libpybind11nonlimitedapi_chdb_3.12.dylib +0 -0
- chdb/libpybind11nonlimitedapi_chdb_3.13.dylib +0 -0
- chdb/libpybind11nonlimitedapi_chdb_3.8.dylib +0 -0
- chdb/libpybind11nonlimitedapi_chdb_3.9.dylib +0 -0
- chdb/libpybind11nonlimitedapi_stubs.dylib +0 -0
- chdb/rwabc.py +65 -0
- chdb/session/__init__.py +3 -0
- chdb/session/state.py +124 -0
- chdb/state/__init__.py +3 -0
- chdb/state/sqlitelike.py +505 -0
- chdb/udf/__init__.py +3 -0
- chdb/udf/udf.py +106 -0
- chdb/utils/__init__.py +9 -0
- chdb/utils/trace.py +74 -0
- chdb/utils/types.py +234 -0
- chdb-3.6.0.dist-info/LICENSE.txt +203 -0
- chdb-3.6.0.dist-info/METADATA +554 -0
- chdb-3.6.0.dist-info/RECORD +35 -0
- chdb-3.6.0.dist-info/WHEEL +5 -0
- chdb-3.6.0.dist-info/top_level.txt +2 -0
|
@@ -0,0 +1,100 @@
|
|
|
1
|
+
from . import err
|
|
2
|
+
from .cursors import Cursor
|
|
3
|
+
from . import converters
|
|
4
|
+
from ..state import sqlitelike as chdb_stateful
|
|
5
|
+
|
|
6
|
+
# Module-level switches; both are disabled by default.
DEBUG, VERBOSE = False, False
|
|
8
|
+
|
|
9
|
+
|
|
10
|
+
class Connection(object):
    """
    Representation of a connection with chdb.

    Wraps a ``chdb_stateful.Connection`` and exposes a DB-API style surface
    (``cursor``, ``commit``, ``rollback``, ``close``) plus escaping helpers.
    The instance can be used as a context manager; entering yields a cursor
    and leaving closes the connection.
    """

    def __init__(self, path=None):
        """Open a chdb connection and verify it with ``SELECT 1``.

        :param path: Database location. ``None`` opens ``":memory:"``; any
            other value is passed on as ``f"file:{path}"``.
        """
        self._closed = False
        self.encoding = "utf8"
        self._affected_rows = 0
        self._resp = None

        # Initialize sqlitelike connection
        connection_string = ":memory:" if path is None else f"file:{path}"
        self._conn = chdb_stateful.Connection(connection_string)

        # Test connection with a simple query; always release the probe
        # cursor, even when the query itself fails.
        probe = self._conn.cursor()
        try:
            probe.execute("SELECT 1")
        finally:
            probe.close()

    def close(self):
        """Close the underlying chdb connection.

        :raises err.Error: if the connection has already been closed.
        """
        if self._closed:
            raise err.Error("Already closed")
        self._closed = True
        self._conn.close()

    @property
    def open(self):
        """Return True if the connection is open"""
        return not self._closed

    def commit(self):
        """Commit changes to stable storage."""
        # No-op for ClickHouse

    def rollback(self):
        """Roll back the current transaction."""
        # No-op for ClickHouse

    def cursor(self, cursor=None):
        """Create a new cursor to execute queries with.

        :param cursor: Accepted for call compatibility; the value is not
            used and a ``Cursor`` bound to this connection is always returned.
        :raises err.Error: if the connection is closed.
        """
        if self._closed:
            raise err.Error("Connection closed")
        return Cursor(self)

    def query(self, sql, fmt="CSV"):
        """Execute a query and return the raw result.

        The result is also remembered and exposed through :attr:`resp`.

        :param sql: Query text as ``str`` or ``bytes``.
        :param fmt: Output format name handed to the underlying connection.
        :raises err.InterfaceError: if the connection is closed or the
            underlying query raises; the original exception is chained.
        """
        if self._closed:
            raise err.InterfaceError("Connection closed")

        if isinstance(sql, str):
            sql = sql.encode(self.encoding, "surrogateescape")

        try:
            result = self._conn.query(sql.decode(), fmt)
            self._resp = result
            return result
        except Exception as error:
            # Chain explicitly so the root cause stays attached to the
            # DB-API level exception.
            raise err.InterfaceError(f"Query error: {error}") from error

    def escape(self, obj, mapping=None):
        """Escape whatever value you pass to it."""
        return converters.escape_item(obj, mapping)

    def escape_string(self, s):
        """Escape the special characters of *s* via ``converters.escape_string``."""
        return converters.escape_string(s)

    def _quote_bytes(self, s):
        """Return *s* (bytes) as a quoted literal via ``converters.escape_bytes``."""
        return converters.escape_bytes(s)

    def __enter__(self):
        """Context manager that returns a Cursor"""
        return self.cursor()

    def __exit__(self, exc, value, traceback):
        """On successful exit, commit. On exception, rollback.

        The connection is closed afterwards unless the body already closed
        it, so leaving the block never raises "Already closed" (which would
        otherwise mask an exception propagating out of the block).
        """
        if exc:
            self.rollback()
        else:
            self.commit()
        if not self._closed:
            self.close()

    @property
    def resp(self):
        """Return the last query response"""
        return self._resp
|
|
@@ -0,0 +1,31 @@
|
|
|
1
|
+
# Column type codes.

# Numeric, temporal and short string types (contiguous codes 0-16).
DECIMAL = 0
TINY = 1
SHORT = 2
LONG = 3
FLOAT = 4
DOUBLE = 5
NULL = 6
TIMESTAMP = 7
LONGLONG = 8
INT24 = 9
DATE = 10
TIME = 11
DATETIME = 12
YEAR = 13
NEWDATE = 14
VARCHAR = 15
BIT = 16

# Extended types (contiguous codes 245-255).
JSON = 245
NEWDECIMAL = 246
ENUM = 247
SET = 248
TINY_BLOB = 249
MEDIUM_BLOB = 250
LONG_BLOB = 251
BLOB = 252
VAR_STRING = 253
STRING = 254
GEOMETRY = 255

# Aliases that share the code of an existing type.
CHAR = TINY
INTERVAL = ENUM
|
|
File without changes
|
chdb/dbapi/converters.py
ADDED
|
@@ -0,0 +1,293 @@
|
|
|
1
|
+
import datetime
|
|
2
|
+
from decimal import Decimal
|
|
3
|
+
from .err import DataError
|
|
4
|
+
import re
|
|
5
|
+
import time
|
|
6
|
+
|
|
7
|
+
|
|
8
|
+
def escape_item(val, mapping=None):
    """Escape *val* with the encoder registered for its exact type.

    :param val: Value to escape.
    :param mapping: ``{type: encoder}`` table; the module-level ``encoders``
        table is used when omitted. Encoders are called as
        ``encoder(val, mapping)``.
    :raises TypeError: if no encoder matches ``type(val)`` and the table has
        no ``str`` entry to fall back on.
    """
    table = encoders if mapping is None else mapping
    convert = table.get(type(val))

    if not convert:
        # No encoder for this exact type: fall back to the string encoder.
        try:
            convert = table[str]
        except KeyError:
            raise TypeError("no default type converter defined")

    return convert(val, table)
|
|
22
|
+
|
|
23
|
+
|
|
24
|
+
def escape_dict(val, mapping=None):
    """Return a new dict with the same keys and every value escaped.

    Keys are copied untouched; each value goes through ``escape_item`` with
    the given *mapping*.
    """
    return {key: escape_item(item, mapping) for key, item in val.items()}
|
|
30
|
+
|
|
31
|
+
|
|
32
|
+
def escape_sequence(val, mapping=None):
    """Escape every element of *val* and render them as ``(a,b,c)``.

    Elements are escaped with ``escape_item`` and joined with commas inside
    a pair of parentheses; an empty iterable yields ``"()"``.
    """
    rendered = ",".join(escape_item(element, mapping) for element in val)
    return "(%s)" % rendered
|
|
38
|
+
|
|
39
|
+
|
|
40
|
+
def escape_set(val, mapping=None):
    """Escape every element of *val* and join them with commas.

    Unlike ``escape_sequence`` the result is not wrapped in parentheses.
    """
    escaped_members = (escape_item(member, mapping) for member in val)
    return ','.join(escaped_members)
|
|
42
|
+
|
|
43
|
+
|
|
44
|
+
def escape_bool(value, mapping=None):
    """Render *value* as the decimal text of ``int(value)`` (``True`` -> ``"1"``).

    *mapping* is accepted for the common encoder signature and is not used.
    """
    as_integer = int(value)
    return "%d" % as_integer
|
|
46
|
+
|
|
47
|
+
|
|
48
|
+
def escape_object(value, mapping=None):
    """Return the plain ``str()`` text of *value*, unquoted and unescaped.

    *mapping* is accepted for the common encoder signature and is not used.
    """
    return "%s" % (value,)
|
|
50
|
+
|
|
51
|
+
|
|
52
|
+
def escape_int(value, mapping=None):
    """Return the ``str()`` text of the integer *value*.

    *mapping* is accepted for the common encoder signature and is not used.
    """
    text = str(value)
    return text
|
|
54
|
+
|
|
55
|
+
|
|
56
|
+
def escape_float(value, mapping=None):
    """Render *value* as a decimal literal that parses back to the same float.

    The 15 significant digit form is used whenever it round-trips (so
    ``1.0`` stays ``"1"`` and ``0.1`` stays ``"0.1"``). Values that need
    more digits, such as ``0.1 + 0.2``, are rendered with 17 significant
    digits instead of being silently rounded.

    *mapping* is accepted for the common encoder signature and is not used.
    """
    text = '%.15g' % value
    # 15 digits are not always enough to identify a double; 17 always are.
    # NaN never compares equal, but both formats render it as "nan".
    if float(text) != float(value):
        text = '%.17g' % value
    return text
|
|
58
|
+
|
|
59
|
+
|
|
60
|
+
# Translation table for the 7-bit ASCII range: every character maps to
# itself except the backslash and the single quote, which are doubled.
_escape_table = list(map(chr, range(128)))
_escape_table[ord("\\")] = "\\\\"
_escape_table[ord("'")] = u"''"


def _escape_unicode(value, mapping=None):
    """Escape the special characters of *value* without adding quotes.

    Single quotes and backslashes are doubled; all other characters are
    left as they are. *value* must be a ``str``; *mapping* is not used.
    """
    escaped = value.translate(_escape_table)
    return escaped


# Public name for the quote-less string escaper.
escape_string = _escape_unicode
|
|
74
|
+
|
|
75
|
+
# On Python ~3.5, str.decode('ascii', 'surrogateescape') is slow.
# (fixed in Python 3.6, http://bugs.python.org/issue24870)
# The workaround is to decode as latin1 and then translate the code points
# 0x80-0xff into the surrogates U+DC80-U+DCFF.
# Special characters and the surrogate mapping are handled in one pass.
_escape_bytes_table = _escape_table + list(map(chr, range(0xdc80, 0xdd00)))


def escape_bytes(value, mapping=None):
    """Return the bytes *value* as a single-quoted, escaped ``str`` literal.

    The bytes are decoded as latin1 and translated through
    ``_escape_bytes_table``. *mapping* is not used.
    """
    decoded = value.decode('latin1')
    return "'" + decoded.translate(_escape_bytes_table) + "'"
|
|
84
|
+
|
|
85
|
+
|
|
86
|
+
def escape_unicode(value, mapping=None):
    """Return *value* escaped and wrapped in single quotes.

    *value* must be a ``str``; *mapping* is not used.
    """
    body = _escape_unicode(value)
    return u"'" + body + u"'"
|
|
88
|
+
|
|
89
|
+
|
|
90
|
+
def escape_str(value, mapping=None):
    """Convert *value* with ``str()``, escape it and wrap it in single quotes."""
    body = escape_string(str(value), mapping)
    return "'" + body + "'"
|
|
92
|
+
|
|
93
|
+
|
|
94
|
+
def escape_None(value, mapping=None):
    """Return the SQL ``NULL`` keyword; both arguments are ignored."""
    return "NULL"
|
|
96
|
+
|
|
97
|
+
|
|
98
|
+
def escape_timedelta(obj, mapping=None):
    """Render a ``datetime.timedelta`` as a quoted ``[-]HH:MM:SS[.ffffff]`` literal.

    Whole days are folded into the hour field, so hours may exceed 23. The
    fractional part is emitted only when the microseconds are non-zero.
    Negative durations are rendered as a leading ``-`` followed by the
    magnitude (for example minus thirty minutes becomes ``'-00:30:00'``).

    *mapping* is accepted for the common encoder signature and is not used.
    """
    # timedelta stores negative values as days < 0 with non-negative
    # seconds/microseconds, so the fields of a negative value cannot be
    # formatted directly; format the magnitude and prepend the sign instead.
    negative = obj.days < 0
    if negative:
        obj = -obj

    hours, remainder = divmod(obj.seconds, 3600)
    hours += obj.days * 24
    minutes, seconds = divmod(remainder, 60)
    sign = "-" if negative else ""

    if obj.microseconds:
        fmt = "'{0}{1:02d}:{2:02d}:{3:02d}.{4:06d}'"
    else:
        fmt = "'{0}{1:02d}:{2:02d}:{3:02d}'"
    return fmt.format(sign, hours, minutes, seconds, obj.microseconds)
|
|
107
|
+
|
|
108
|
+
|
|
109
|
+
def escape_time(obj, mapping=None):
    """Return *obj* as a quoted ISO time with microsecond precision.

    *mapping* is accepted for the common encoder signature and is not used.
    """
    stamp = obj.isoformat(timespec='microseconds')
    return "'" + stamp + "'"
|
|
111
|
+
|
|
112
|
+
|
|
113
|
+
def escape_datetime(obj, mapping=None):
    """Return *obj* as a quoted ``YYYY-MM-DD HH:MM:SS.ffffff`` literal.

    The date and time parts are separated by a space and microseconds are
    always included. *mapping* is not used.
    """
    stamp = obj.isoformat(sep=' ', timespec='microseconds')
    return "'" + stamp + "'"
|
|
120
|
+
|
|
121
|
+
|
|
122
|
+
def escape_date(obj, mapping=None):
    """Return *obj* as a quoted ISO date; *mapping* is not used."""
    iso_text = obj.isoformat()
    return "'" + iso_text + "'"
|
|
124
|
+
|
|
125
|
+
|
|
126
|
+
def escape_struct_time(obj, mapping=None):
    """Escape a ``time.struct_time`` as a datetime literal.

    The first six fields of *obj* are used to build a ``datetime.datetime``,
    which is then rendered by ``escape_datetime``. *mapping* is not used.
    """
    leading_fields = obj[:6]
    moment = datetime.datetime(*leading_fields)
    return escape_datetime(moment)
|
|
128
|
+
|
|
129
|
+
|
|
130
|
+
def _convert_second_fraction(s):
    """Convert the digits after the decimal point of a seconds value to microseconds.

    The digits are right-padded with zeros to six places and anything
    beyond six digits is dropped. A false value (``None`` or ``""``)
    yields ``0``.
    """
    # Pad on the right so that e.g. "5" means 500000 microseconds.
    return int(s.ljust(6, '0')[:6]) if s else 0
|
|
136
|
+
|
|
137
|
+
|
|
138
|
+
def convert_datetime(obj):
    """Return a DATETIME or TIMESTAMP column value as a datetime object:

      >>> convert_datetime('2007-02-25 23:06:20')
      datetime.datetime(2007, 2, 25, 23, 6, 20)
      >>> convert_datetime('2007-02-25 23:06:20.5')
      datetime.datetime(2007, 2, 25, 23, 6, 20, 500000)

    ``bytes`` and ``bytearray`` input is decoded as ASCII first. An optional
    fractional part of up to six digits is accepted.

    :raises DataError: if the value cannot be parsed; the parsing error is
        chained as the cause.
    """
    if isinstance(obj, (bytes, bytearray)):
        obj = obj.decode('ascii')

    try:
        # Values carrying fractional seconds need the %f directive; plain
        # second-precision values keep using the original format.
        fmt = '%Y-%m-%d %H:%M:%S.%f' if '.' in obj else '%Y-%m-%d %H:%M:%S'
        return datetime.datetime.strptime(obj, fmt)
    except Exception as err:
        raise DataError("Not valid datetime struct: %s" % err) from err
|
|
155
|
+
|
|
156
|
+
|
|
157
|
+
# [-]H:M:S with an optional ".ffffff" fraction. The dot is escaped so that
# only a literal decimal point introduces the fractional part.
TIMEDELTA_RE = re.compile(r"(-)?(\d{1,3}):(\d{1,2}):(\d{1,2})(?:\.(\d{1,6}))?")
|
|
158
|
+
|
|
159
|
+
|
|
160
|
+
def convert_timedelta(obj):
    """Return a TIME column value as a timedelta object:

      >>> convert_timedelta('25:06:17')
      datetime.timedelta(days=1, seconds=3977)
      >>> convert_timedelta('-25:06:17')
      datetime.timedelta(days=-2, seconds=82423)

    ``bytes`` and ``bytearray`` input is decoded as ASCII first. Values that
    do not match ``TIMEDELTA_RE`` are returned unchanged:

      >>> convert_timedelta('random crap')
      'random crap'

    Note that MySQL always returns TIME columns as (+|-)HH:MM:SS, but
    can accept values as (+|-)DD HH:MM:SS. The latter format will not
    be parsed correctly by this function.

    :raises DataError: if a matched field cannot be converted.
    """
    if isinstance(obj, (bytes, bytearray)):
        obj = obj.decode('ascii')

    match = TIMEDELTA_RE.match(obj)
    if match is None:
        return obj

    try:
        sign, hours, minutes, seconds, fraction = match.groups()
        magnitude = datetime.timedelta(
            hours=int(hours),
            minutes=int(minutes),
            seconds=int(seconds),
            microseconds=int(_convert_second_fraction(fraction)),
        )
        # A captured "-" negates the whole duration.
        return -magnitude if sign else magnitude
    except ValueError as err:
        raise DataError("Not valid time or timedelta struct: %s" % err)
|
|
199
|
+
|
|
200
|
+
|
|
201
|
+
def convert_time(obj):
    """Return a TIME column value as a time object:

      >>> convert_time('15:06:17')
      datetime.time(15, 6, 17)

    ``bytes`` and ``bytearray`` input is decoded as ASCII first. Values that
    cannot be parsed as ``HH:MM:SS`` are handed to ``convert_timedelta``
    and its result is returned instead.
    """
    if isinstance(obj, (bytes, bytearray)):
        obj = obj.decode('ascii')

    try:
        parsed = datetime.datetime.strptime(obj, '%H:%M:%S')
    except Exception:
        # Not a plain time of day (for example more than 23 hours).
        return convert_timedelta(obj)
    return parsed.time()
|
|
218
|
+
|
|
219
|
+
|
|
220
|
+
def convert_date(obj):
    """Return a DATE column value as a date object:

      >>> convert_date('2007-02-26')
      datetime.date(2007, 2, 26)

    ``bytes`` and ``bytearray`` input is decoded as ASCII first.

    :raises DataError: for values that cannot be parsed as ``YYYY-MM-DD``,
        such as ``'2007-02-31'`` or ``'0000-00-00'``.
    """
    text = obj.decode('ascii') if isinstance(obj, (bytes, bytearray)) else obj
    try:
        return datetime.datetime.strptime(text, '%Y-%m-%d').date()
    except Exception as err:
        raise DataError("Not valid date struct: %s" % err)
|
|
241
|
+
|
|
242
|
+
|
|
243
|
+
def convert_set(s):
    """Split a comma-separated value into a ``set`` of its members.

    ``bytes``/``bytearray`` input is split on ``b","``; anything else is
    split on ``","``.
    """
    separator = b"," if isinstance(s, (bytes, bytearray)) else ","
    return set(s.split(separator))
|
|
247
|
+
|
|
248
|
+
|
|
249
|
+
def convert_characters(connection, data):
    """Decode *data* as UTF-8 when ``connection.use_unicode`` is true.

    Otherwise *data* is returned unchanged.
    """
    return data.decode("utf8") if connection.use_unicode else data
|
|
253
|
+
|
|
254
|
+
|
|
255
|
+
def convert_column_data(column_type, column_data):
    """Convert a raw column value according to its declared type name.

    ``None`` data and non-string *column_type* values pass through
    untouched. The type name is compared case-insensitively with
    surrounding whitespace removed; only ``time``, ``date`` and
    ``datetime`` are converted, every other type is returned as is.
    """
    # Null values and unknown type descriptors are passed through.
    if column_data is None or not isinstance(column_type, str):
        return column_data

    kind = column_type.lower().strip()
    if kind == 'time':
        return convert_time(column_data)
    if kind == 'date':
        return convert_date(column_data)
    if kind == 'datetime':
        return convert_datetime(column_data)
    return column_data
|
|
274
|
+
|
|
275
|
+
|
|
276
|
+
# Default ``{type: encoder}`` table used by ``escape_item``. Lookup is by
# exact type, so ``bool`` and ``datetime.datetime`` need their own entries
# even though they subclass ``int`` and ``datetime.date``.
encoders = {
    # Scalars
    bool: escape_bool,
    int: escape_int,
    float: escape_float,
    str: escape_unicode,
    # Containers
    tuple: escape_sequence,
    list: escape_sequence,
    set: escape_sequence,
    frozenset: escape_sequence,
    dict: escape_dict,
    # NULL
    type(None): escape_None,
    # Dates and times
    datetime.date: escape_date,
    datetime.datetime: escape_datetime,
    datetime.timedelta: escape_timedelta,
    datetime.time: escape_time,
    time.struct_time: escape_struct_time,
    # Arbitrary precision numbers are emitted via str()
    Decimal: escape_object,
}
|