pg 1.3.0.rc2-x64-mingw-ucrt
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +7 -0
- checksums.yaml.gz.sig +3 -0
- data/.appveyor.yml +36 -0
- data/.gems +6 -0
- data/.gemtest +0 -0
- data/.github/workflows/binary-gems.yml +85 -0
- data/.github/workflows/source-gem.yml +130 -0
- data/.gitignore +13 -0
- data/.hgsigs +34 -0
- data/.hgtags +41 -0
- data/.irbrc +23 -0
- data/.pryrc +23 -0
- data/.tm_properties +21 -0
- data/.travis.yml +49 -0
- data/BSDL +22 -0
- data/Contributors.rdoc +46 -0
- data/Gemfile +14 -0
- data/History.rdoc +648 -0
- data/LICENSE +56 -0
- data/Manifest.txt +72 -0
- data/POSTGRES +23 -0
- data/README-OS_X.rdoc +68 -0
- data/README-Windows.rdoc +56 -0
- data/README.ja.rdoc +13 -0
- data/README.rdoc +214 -0
- data/Rakefile +106 -0
- data/Rakefile.cross +300 -0
- data/certs/ged.pem +24 -0
- data/ext/errorcodes.def +1040 -0
- data/ext/errorcodes.rb +45 -0
- data/ext/errorcodes.txt +496 -0
- data/ext/extconf.rb +165 -0
- data/ext/gvl_wrappers.c +21 -0
- data/ext/gvl_wrappers.h +264 -0
- data/ext/pg.c +732 -0
- data/ext/pg.h +385 -0
- data/ext/pg_binary_decoder.c +229 -0
- data/ext/pg_binary_encoder.c +163 -0
- data/ext/pg_coder.c +615 -0
- data/ext/pg_connection.c +4415 -0
- data/ext/pg_copy_coder.c +628 -0
- data/ext/pg_errors.c +95 -0
- data/ext/pg_record_coder.c +519 -0
- data/ext/pg_result.c +1683 -0
- data/ext/pg_text_decoder.c +987 -0
- data/ext/pg_text_encoder.c +814 -0
- data/ext/pg_tuple.c +575 -0
- data/ext/pg_type_map.c +199 -0
- data/ext/pg_type_map_all_strings.c +129 -0
- data/ext/pg_type_map_by_class.c +269 -0
- data/ext/pg_type_map_by_column.c +349 -0
- data/ext/pg_type_map_by_mri_type.c +313 -0
- data/ext/pg_type_map_by_oid.c +385 -0
- data/ext/pg_type_map_in_ruby.c +330 -0
- data/ext/pg_util.c +149 -0
- data/ext/pg_util.h +65 -0
- data/ext/vc/pg.sln +26 -0
- data/ext/vc/pg_18/pg.vcproj +216 -0
- data/ext/vc/pg_19/pg_19.vcproj +209 -0
- data/lib/3.1/pg_ext.so +0 -0
- data/lib/pg/basic_type_map_based_on_result.rb +47 -0
- data/lib/pg/basic_type_map_for_queries.rb +193 -0
- data/lib/pg/basic_type_map_for_results.rb +81 -0
- data/lib/pg/basic_type_registry.rb +296 -0
- data/lib/pg/binary_decoder.rb +23 -0
- data/lib/pg/coder.rb +104 -0
- data/lib/pg/connection.rb +813 -0
- data/lib/pg/constants.rb +12 -0
- data/lib/pg/exceptions.rb +12 -0
- data/lib/pg/result.rb +43 -0
- data/lib/pg/text_decoder.rb +46 -0
- data/lib/pg/text_encoder.rb +59 -0
- data/lib/pg/tuple.rb +30 -0
- data/lib/pg/type_map_by_column.rb +16 -0
- data/lib/pg/version.rb +4 -0
- data/lib/pg.rb +87 -0
- data/lib/x64-mingw-ucrt/libpq.dll +0 -0
- data/misc/openssl-pg-segfault.rb +31 -0
- data/misc/postgres/History.txt +9 -0
- data/misc/postgres/Manifest.txt +5 -0
- data/misc/postgres/README.txt +21 -0
- data/misc/postgres/Rakefile +21 -0
- data/misc/postgres/lib/postgres.rb +16 -0
- data/misc/ruby-pg/History.txt +9 -0
- data/misc/ruby-pg/Manifest.txt +5 -0
- data/misc/ruby-pg/README.txt +21 -0
- data/misc/ruby-pg/Rakefile +21 -0
- data/misc/ruby-pg/lib/ruby/pg.rb +16 -0
- data/pg.gemspec +32 -0
- data/sample/array_insert.rb +20 -0
- data/sample/async_api.rb +106 -0
- data/sample/async_copyto.rb +39 -0
- data/sample/async_mixed.rb +56 -0
- data/sample/check_conn.rb +21 -0
- data/sample/copydata.rb +71 -0
- data/sample/copyfrom.rb +81 -0
- data/sample/copyto.rb +19 -0
- data/sample/cursor.rb +21 -0
- data/sample/disk_usage_report.rb +177 -0
- data/sample/issue-119.rb +94 -0
- data/sample/losample.rb +69 -0
- data/sample/minimal-testcase.rb +17 -0
- data/sample/notify_wait.rb +72 -0
- data/sample/pg_statistics.rb +285 -0
- data/sample/replication_monitor.rb +222 -0
- data/sample/test_binary_values.rb +33 -0
- data/sample/wal_shipper.rb +434 -0
- data/sample/warehouse_partitions.rb +311 -0
- data.tar.gz.sig +0 -0
- metadata +188 -0
- metadata.gz.sig +0 -0
@@ -0,0 +1,814 @@
|
|
1
|
+
/*
|
2
|
+
* pg_text_encoder.c - PG::TextEncoder module
|
3
|
+
* $Id$
|
4
|
+
*
|
5
|
+
*/
|
6
|
+
|
7
|
+
/*
|
8
|
+
*
|
9
|
+
* Type casts for encoding Ruby objects to PostgreSQL string representations.
|
10
|
+
*
|
11
|
+
* Encoder classes are defined with pg_define_coder(). This creates a new coder class and
|
12
|
+
* assigns an encoder function. The encoder function can decide between two different options
|
13
|
+
* to return the encoded data. It can either return it as a Ruby String object or write the
|
14
|
+
* encoded data to a memory space provided by the caller. In the second case, the encoder
|
15
|
+
* function is called twice, once for deciding the encoding option and returning the expected
|
16
|
+
* data length, and a second time when the requested memory space was made available by the
|
17
|
+
* calling function, to do the actual conversion and writing. Parameter intermediate can be
|
18
|
+
* used to store data between these two calls.
|
19
|
+
*
|
20
|
+
* Signature of all type cast encoders is:
|
21
|
+
* int encoder_function(t_pg_coder *this, VALUE value, char *out, VALUE *intermediate, int enc_idx)
|
22
|
+
*
|
23
|
+
* Params:
|
24
|
+
* this - The data part of the coder object that belongs to the encoder function.
|
25
|
+
* value - The Ruby object to cast.
|
26
|
+
* out - NULL for the first call,
|
27
|
+
* pointer to a buffer with the requested size for the second call.
|
28
|
+
* intermediate - Pointer to a VALUE that might be set by the encoding function to some
|
29
|
+
* value in the first call that can be retrieved later in the second call.
|
30
|
+
* This VALUE is not yet initialized by the caller.
|
31
|
+
* enc_idx - Index of the output Encoding that strings should be converted to.
|
32
|
+
*
|
33
|
+
* Returns:
|
34
|
+
* >= 0 - If out==NULL the encoder function must return the expected output buffer size.
|
35
|
+
* This can be larger than the size of the second call, but may not be smaller.
|
36
|
+
* If out!=NULL the encoder function must return the actually used output buffer size
|
37
|
+
* without a termination character.
|
38
|
+
* -1 - The encoder function can alternatively return -1 to indicate that no second call
|
39
|
+
* is required, but the String value in *intermediate should be used instead.
|
40
|
+
*/
|
41
|
+
|
42
|
+
|
43
|
+
#include "pg.h"
|
44
|
+
#include "pg_util.h"
|
45
|
+
#ifdef HAVE_INTTYPES_H
|
46
|
+
#include <inttypes.h>
|
47
|
+
#endif
|
48
|
+
#include <math.h>
|
49
|
+
|
50
|
+
VALUE rb_mPG_TextEncoder;
|
51
|
+
static ID s_id_encode;
|
52
|
+
static ID s_id_to_i;
|
53
|
+
static ID s_id_to_s;
|
54
|
+
static ID s_cBigDecimal;
|
55
|
+
static VALUE s_str_F;
|
56
|
+
|
57
|
+
static int pg_text_enc_integer(t_pg_coder *this, VALUE value, char *out, VALUE *intermediate, int enc_idx);
|
58
|
+
|
59
|
+
VALUE
|
60
|
+
pg_obj_to_i( VALUE value )
|
61
|
+
{
|
62
|
+
switch (TYPE(value)) {
|
63
|
+
case T_FIXNUM:
|
64
|
+
case T_FLOAT:
|
65
|
+
case T_BIGNUM:
|
66
|
+
return value;
|
67
|
+
default:
|
68
|
+
return rb_funcall(value, s_id_to_i, 0);
|
69
|
+
}
|
70
|
+
}
|
71
|
+
|
72
|
+
/*
|
73
|
+
* Document-class: PG::TextEncoder::Boolean < PG::SimpleEncoder
|
74
|
+
*
|
75
|
+
* This is the encoder class for the PostgreSQL bool type.
|
76
|
+
*
|
77
|
+
* Ruby value false is encoded as SQL +FALSE+ value.
|
78
|
+
* Ruby value true is encoded as SQL +TRUE+ value.
|
79
|
+
* Any other value is sent as its string representation.
|
80
|
+
*
|
81
|
+
*/
|
82
|
+
static int
|
83
|
+
pg_text_enc_boolean(t_pg_coder *this, VALUE value, char *out, VALUE *intermediate, int enc_idx)
|
84
|
+
{
|
85
|
+
switch( TYPE(value) ){
|
86
|
+
case T_FALSE:
|
87
|
+
if(out) *out = 'f';
|
88
|
+
return 1;
|
89
|
+
case T_TRUE:
|
90
|
+
if(out) *out = 't';
|
91
|
+
return 1;
|
92
|
+
case T_FIXNUM:
|
93
|
+
case T_BIGNUM:
|
94
|
+
if( NUM2LONG(value) == 0 ){
|
95
|
+
if(out) *out = '0';
|
96
|
+
return 1;
|
97
|
+
} else if( NUM2LONG(value) == 1 ){
|
98
|
+
if(out) *out = '1';
|
99
|
+
return 1;
|
100
|
+
} else {
|
101
|
+
return pg_text_enc_integer(this, value, out, intermediate, enc_idx);
|
102
|
+
}
|
103
|
+
default:
|
104
|
+
return pg_coder_enc_to_s(this, value, out, intermediate, enc_idx);
|
105
|
+
}
|
106
|
+
/* never reached */
|
107
|
+
return 0;
|
108
|
+
}
|
109
|
+
|
110
|
+
|
111
|
+
/*
|
112
|
+
* Document-class: PG::TextEncoder::String < PG::SimpleEncoder
|
113
|
+
*
|
114
|
+
* This is the encoder class for the PostgreSQL text types.
|
115
|
+
*
|
116
|
+
* Non-String values are expected to have method +to_s+ defined.
|
117
|
+
*
|
118
|
+
*/
|
119
|
+
int
|
120
|
+
pg_coder_enc_to_s(t_pg_coder *this, VALUE value, char *out, VALUE *intermediate, int enc_idx)
|
121
|
+
{
|
122
|
+
VALUE str = rb_obj_as_string(value);
|
123
|
+
if( ENCODING_GET(str) == enc_idx ){
|
124
|
+
*intermediate = str;
|
125
|
+
}else{
|
126
|
+
*intermediate = rb_str_export_to_enc(str, rb_enc_from_index(enc_idx));
|
127
|
+
}
|
128
|
+
return -1;
|
129
|
+
}
|
130
|
+
|
131
|
+
/*
 * Count the number of zero bits above the most significant set bit of +x+.
 *
 * Returns the bit width of unsigned long long if x is 0.
 */
static int
count_leading_zero_bits(unsigned long long x)
{
	const int nbits = (int)(sizeof(unsigned long long) * 8);

	/* The compiler intrinsics below are undefined for 0. */
	if( x == 0 ) return nbits;

#if defined(__GNUC__) || defined(__clang__)
	return __builtin_clzll(x);
#elif defined(_MSC_VER)
	{
		unsigned long r = 0;
		/* _BitScanReverse64 yields the index of the highest set bit,
		 * counted from bit 0, so convert it to a count of leading zeros. */
		_BitScanReverse64(&r, x);
		return nbits - 1 - (int)r;
	}
#else
	{
		/* The mask must be built from an unsigned long long constant;
		 * shifting a plain int by 63 bits is undefined. */
		const unsigned long long top_bit = 1ULL << (nbits - 1);
		int a;

		for(a=0; a < nbits; a++){
			if( x & top_bit ) return a;
			x <<= 1;
		}
		return a;
	}
#endif
}
|
149
|
+
|
150
|
+
/*
|
151
|
+
* Document-class: PG::TextEncoder::Integer < PG::SimpleEncoder
|
152
|
+
*
|
153
|
+
* This is the encoder class for the PostgreSQL integer types.
|
154
|
+
*
|
155
|
+
* Non-Integer values are expected to have method +to_i+ defined.
|
156
|
+
*
|
157
|
+
*/
|
158
|
+
static int
|
159
|
+
pg_text_enc_integer(t_pg_coder *this, VALUE value, char *out, VALUE *intermediate, int enc_idx)
|
160
|
+
{
|
161
|
+
if(out){
|
162
|
+
if(TYPE(*intermediate) == T_STRING){
|
163
|
+
return pg_coder_enc_to_s(this, value, out, intermediate, enc_idx);
|
164
|
+
}else{
|
165
|
+
char *start = out;
|
166
|
+
int len;
|
167
|
+
int neg = 0;
|
168
|
+
long long sll = NUM2LL(*intermediate);
|
169
|
+
unsigned long long ll;
|
170
|
+
|
171
|
+
if (sll < 0) {
|
172
|
+
/* Avoid problems with the most negative integer not being representable
|
173
|
+
* as a positive integer, by using unsigned long long for encoding.
|
174
|
+
*/
|
175
|
+
ll = -sll;
|
176
|
+
neg = 1;
|
177
|
+
} else {
|
178
|
+
ll = sll;
|
179
|
+
}
|
180
|
+
|
181
|
+
/* Compute the result string backwards. */
|
182
|
+
do {
|
183
|
+
unsigned long long remainder;
|
184
|
+
unsigned long long oldval = ll;
|
185
|
+
|
186
|
+
ll /= 10;
|
187
|
+
remainder = oldval - ll * 10;
|
188
|
+
*out++ = '0' + remainder;
|
189
|
+
} while (ll != 0);
|
190
|
+
|
191
|
+
if (neg)
|
192
|
+
*out++ = '-';
|
193
|
+
|
194
|
+
len = (int)(out - start);
|
195
|
+
|
196
|
+
/* Reverse string. */
|
197
|
+
out--;
|
198
|
+
while (start < out)
|
199
|
+
{
|
200
|
+
char swap = *start;
|
201
|
+
|
202
|
+
*start++ = *out;
|
203
|
+
*out-- = swap;
|
204
|
+
}
|
205
|
+
|
206
|
+
return len;
|
207
|
+
}
|
208
|
+
}else{
|
209
|
+
*intermediate = pg_obj_to_i(value);
|
210
|
+
if(TYPE(*intermediate) == T_FIXNUM){
|
211
|
+
long long sll = NUM2LL(*intermediate);
|
212
|
+
unsigned long long ll = sll < 0 ? -sll : sll;
|
213
|
+
int len = (sizeof(unsigned long long) * 8 - count_leading_zero_bits(ll)) / 3;
|
214
|
+
return sll < 0 ? len+2 : len+1;
|
215
|
+
}else{
|
216
|
+
return pg_coder_enc_to_s(this, *intermediate, NULL, intermediate, enc_idx);
|
217
|
+
}
|
218
|
+
}
|
219
|
+
}
|
220
|
+
|
221
|
+
#define MAX_DOUBLE_DIGITS 16
|
222
|
+
|
223
|
+
/*
|
224
|
+
* Document-class: PG::TextEncoder::Float < PG::SimpleEncoder
|
225
|
+
*
|
226
|
+
* This is the encoder class for the PostgreSQL float types.
|
227
|
+
*
|
228
|
+
*/
|
229
|
+
static int
|
230
|
+
pg_text_enc_float(t_pg_coder *conv, VALUE value, char *out, VALUE *intermediate, int enc_idx)
|
231
|
+
{
|
232
|
+
if(out){
|
233
|
+
double dvalue = NUM2DBL(value);
|
234
|
+
int len = 0;
|
235
|
+
int neg = 0;
|
236
|
+
int exp2i, exp10i, i;
|
237
|
+
unsigned long long ll, remainder, oldval;
|
238
|
+
VALUE intermediate;
|
239
|
+
|
240
|
+
/* Cast to the same strings as value.to_s . */
|
241
|
+
if( isinf(dvalue) ){
|
242
|
+
if( dvalue < 0 ){
|
243
|
+
memcpy( out, "-Infinity", 9);
|
244
|
+
return 9;
|
245
|
+
} else {
|
246
|
+
memcpy( out, "Infinity", 8);
|
247
|
+
return 8;
|
248
|
+
}
|
249
|
+
} else if (isnan(dvalue)) {
|
250
|
+
memcpy( out, "NaN", 3);
|
251
|
+
return 3;
|
252
|
+
}
|
253
|
+
|
254
|
+
/*
|
255
|
+
* The following computation is roughly a conversion kind of
|
256
|
+
* sprintf( out, "%.16E", dvalue);
|
257
|
+
*/
|
258
|
+
|
259
|
+
/* write the algebraic sign */
|
260
|
+
if( dvalue < 0 ) {
|
261
|
+
dvalue = -dvalue;
|
262
|
+
*out++ = '-';
|
263
|
+
neg++;
|
264
|
+
}
|
265
|
+
|
266
|
+
/* retrieve the power of 2 exponent */
|
267
|
+
frexp(dvalue, &exp2i);
|
268
|
+
/* compute the power of 10 exponent */
|
269
|
+
exp10i = (int)floor(exp2i * 0.30102999566398114); /* Math.log(2)/Math.log(10) */
|
270
|
+
/* move the decimal point, so that we get an integer of MAX_DOUBLE_DIGITS decimal digits */
|
271
|
+
ll = (unsigned long long)(dvalue * pow(10, MAX_DOUBLE_DIGITS - 1 - exp10i) + 0.5);
|
272
|
+
|
273
|
+
/* avoid leading zeros due to inaccuracy of deriving exp10i from exp2i */
|
274
|
+
/* otherwise we would print "09.0" instead of "9.0" */
|
275
|
+
if( ll < 1000000000000000 ){ /* pow(10, MAX_DOUBLE_DIGITS-1) */
|
276
|
+
exp10i--;
|
277
|
+
ll *= 10;
|
278
|
+
}
|
279
|
+
|
280
|
+
if( exp10i <= -5 || exp10i >= 15 ) {
|
281
|
+
/* Write the float in exponent format (1.23e45) */
|
282
|
+
|
283
|
+
/* write fraction digits from right to left */
|
284
|
+
for( i = MAX_DOUBLE_DIGITS; i > 1; i--){
|
285
|
+
oldval = ll;
|
286
|
+
ll /= 10;
|
287
|
+
remainder = oldval - ll * 10;
|
288
|
+
/* omit trailing zeros */
|
289
|
+
if(remainder != 0 || len ) {
|
290
|
+
out[i] = '0' + remainder;
|
291
|
+
len++;
|
292
|
+
}
|
293
|
+
}
|
294
|
+
|
295
|
+
/* write decimal point */
|
296
|
+
if( len ){
|
297
|
+
out[1] = '.';
|
298
|
+
len++;
|
299
|
+
}
|
300
|
+
|
301
|
+
/* write remaining single digit left to the decimal point */
|
302
|
+
oldval = ll;
|
303
|
+
ll /= 10;
|
304
|
+
remainder = oldval - ll * 10;
|
305
|
+
out[0] = '0' + remainder;
|
306
|
+
len++;
|
307
|
+
|
308
|
+
/* write exponent */
|
309
|
+
out[len++] = 'e';
|
310
|
+
intermediate = INT2NUM(exp10i);
|
311
|
+
|
312
|
+
return neg + len + pg_text_enc_integer(conv, Qnil, out + len, &intermediate, enc_idx);
|
313
|
+
} else {
|
314
|
+
/* write the float in non exponent format (0.001234 or 123450.0) */
|
315
|
+
|
316
|
+
/* write digits from right to left */
|
317
|
+
int lz = exp10i < 0 ? 0 : exp10i;
|
318
|
+
for( i = MAX_DOUBLE_DIGITS - (exp10i < 0 ? exp10i : 0); i >= 0; i-- ){
|
319
|
+
oldval = ll;
|
320
|
+
ll /= 10;
|
321
|
+
remainder = oldval - ll * 10;
|
322
|
+
/* write decimal point */
|
323
|
+
if( i - 1 == lz ){
|
324
|
+
out[i--] = '.';
|
325
|
+
len++;
|
326
|
+
}
|
327
|
+
/* if possible then omit trailing zeros */
|
328
|
+
if(remainder != 0 || len || i - 2 == lz) {
|
329
|
+
out[i] = '0' + remainder;
|
330
|
+
len++;
|
331
|
+
}
|
332
|
+
}
|
333
|
+
return neg + len;
|
334
|
+
}
|
335
|
+
}else{
|
336
|
+
return 1 /*sign*/ + MAX_DOUBLE_DIGITS + 1 /*dot*/ + 1 /*e*/ + 1 /*exp sign*/ + 3 /*exp digits*/;
|
337
|
+
}
|
338
|
+
}
|
339
|
+
|
340
|
+
|
341
|
+
/*
|
342
|
+
* Document-class: PG::TextEncoder::Numeric < PG::SimpleEncoder
|
343
|
+
*
|
344
|
+
* This is the encoder class for the PostgreSQL numeric types.
|
345
|
+
*
|
346
|
+
* It converts Integer, Float and BigDecimal objects.
|
347
|
+
* All other objects are expected to respond to +to_s+.
|
348
|
+
*/
|
349
|
+
static int
|
350
|
+
pg_text_enc_numeric(t_pg_coder *this, VALUE value, char *out, VALUE *intermediate, int enc_idx)
|
351
|
+
{
|
352
|
+
switch(TYPE(value)){
|
353
|
+
case T_FIXNUM:
|
354
|
+
case T_BIGNUM:
|
355
|
+
return pg_text_enc_integer(this, value, out, intermediate, enc_idx);
|
356
|
+
case T_FLOAT:
|
357
|
+
return pg_text_enc_float(this, value, out, intermediate, enc_idx);
|
358
|
+
default:
|
359
|
+
if(out){ /* second pass */
|
360
|
+
rb_bug("unexpected value type: %d", TYPE(value));
|
361
|
+
} else { /* first pass */
|
362
|
+
if( rb_obj_is_kind_of(value, s_cBigDecimal) ){
|
363
|
+
/* value.to_s('F') */
|
364
|
+
*intermediate = rb_funcall(value, s_id_to_s, 1, s_str_F);
|
365
|
+
return -1; /* no second pass */
|
366
|
+
} else {
|
367
|
+
return pg_coder_enc_to_s(this, value, NULL, intermediate, enc_idx);
|
368
|
+
/* no second pass */
|
369
|
+
}
|
370
|
+
}
|
371
|
+
}
|
372
|
+
}
|
373
|
+
|
374
|
+
|
375
|
+
/* Lookup table of the lower case hex digit for each 4 bit value. */
static const char hextab[] = "0123456789abcdef";
|
378
|
+
|
379
|
+
/*
|
380
|
+
* Document-class: PG::TextEncoder::Bytea < PG::SimpleEncoder
|
381
|
+
*
|
382
|
+
* This is an encoder class for the PostgreSQL +bytea+ type.
|
383
|
+
*
|
384
|
+
* The binary String is converted to hexadecimal representation for transmission
|
385
|
+
* in text format. For query bind parameters it is recommended to use
|
386
|
+
* PG::BinaryEncoder::Bytea instead, in order to decrease network traffic and
|
387
|
+
* CPU usage.
|
388
|
+
*
|
389
|
+
*/
|
390
|
+
static int
|
391
|
+
pg_text_enc_bytea(t_pg_coder *conv, VALUE value, char *out, VALUE *intermediate, int enc_idx)
|
392
|
+
{
|
393
|
+
if(out){
|
394
|
+
size_t strlen = RSTRING_LEN(*intermediate);
|
395
|
+
char *iptr = RSTRING_PTR(*intermediate);
|
396
|
+
char *eptr = iptr + strlen;
|
397
|
+
char *optr = out;
|
398
|
+
*optr++ = '\\';
|
399
|
+
*optr++ = 'x';
|
400
|
+
|
401
|
+
for( ; iptr < eptr; iptr++ ){
|
402
|
+
unsigned char c = *iptr;
|
403
|
+
*optr++ = hextab[c >> 4];
|
404
|
+
*optr++ = hextab[c & 0xf];
|
405
|
+
}
|
406
|
+
return (int)(optr - out);
|
407
|
+
}else{
|
408
|
+
*intermediate = rb_obj_as_string(value);
|
409
|
+
/* The output starts with "\x" and each character is converted to hex. */
|
410
|
+
return 2 + RSTRING_LENINT(*intermediate) * 2;
|
411
|
+
}
|
412
|
+
}
|
413
|
+
|
414
|
+
/*
 * Signature of the quoting callbacks used by quote_string().
 *
 * A callback gets a pointer to callback specific data, the input bytes with
 * their length and the output position. It returns the number of bytes
 * written to the output.
 */
typedef int (*t_quote_func)( void *func_data, char *src, int src_len, char *dst );
|
415
|
+
|
416
|
+
static int
|
417
|
+
quote_array_buffer( void *_this, char *p_in, int strlen, char *p_out ){
|
418
|
+
t_pg_composite_coder *this = _this;
|
419
|
+
char *ptr1;
|
420
|
+
char *ptr2;
|
421
|
+
int backslashs = 0;
|
422
|
+
int needquote;
|
423
|
+
|
424
|
+
/* count data plus backslashes; detect chars needing quotes */
|
425
|
+
if (strlen == 0)
|
426
|
+
needquote = 1; /* force quotes for empty string */
|
427
|
+
else if (strlen == 4 && rbpg_strncasecmp(p_in, "NULL", strlen) == 0)
|
428
|
+
needquote = 1; /* force quotes for literal NULL */
|
429
|
+
else
|
430
|
+
needquote = 0;
|
431
|
+
|
432
|
+
/* count required backlashs */
|
433
|
+
for(ptr1 = p_in; ptr1 != p_in + strlen; ptr1++) {
|
434
|
+
char ch = *ptr1;
|
435
|
+
|
436
|
+
if (ch == '"' || ch == '\\'){
|
437
|
+
needquote = 1;
|
438
|
+
backslashs++;
|
439
|
+
} else if (ch == '{' || ch == '}' || ch == this->delimiter ||
|
440
|
+
ch == ' ' || ch == '\t' || ch == '\n' || ch == '\r' || ch == '\v' || ch == '\f'){
|
441
|
+
needquote = 1;
|
442
|
+
}
|
443
|
+
}
|
444
|
+
|
445
|
+
if( needquote ){
|
446
|
+
ptr1 = p_in + strlen;
|
447
|
+
ptr2 = p_out + strlen + backslashs + 2;
|
448
|
+
/* Write end quote */
|
449
|
+
*--ptr2 = '"';
|
450
|
+
|
451
|
+
/* Then store the escaped string on the final position, walking
|
452
|
+
* right to left, until all backslashs are placed. */
|
453
|
+
while( ptr1 != p_in ) {
|
454
|
+
*--ptr2 = *--ptr1;
|
455
|
+
if(*ptr2 == '"' || *ptr2 == '\\'){
|
456
|
+
*--ptr2 = '\\';
|
457
|
+
}
|
458
|
+
}
|
459
|
+
/* Write start quote */
|
460
|
+
*p_out = '"';
|
461
|
+
return strlen + backslashs + 2;
|
462
|
+
} else {
|
463
|
+
if( p_in != p_out )
|
464
|
+
memcpy( p_out, p_in, strlen );
|
465
|
+
return strlen;
|
466
|
+
}
|
467
|
+
}
|
468
|
+
|
469
|
+
static char *
|
470
|
+
quote_string(t_pg_coder *this, VALUE value, VALUE string, char *current_out, int with_quote, t_quote_func quote_buffer, void *func_data, int enc_idx)
|
471
|
+
{
|
472
|
+
int strlen;
|
473
|
+
VALUE subint;
|
474
|
+
t_pg_coder_enc_func enc_func = pg_coder_enc_func(this);
|
475
|
+
|
476
|
+
strlen = enc_func(this, value, NULL, &subint, enc_idx);
|
477
|
+
|
478
|
+
if( strlen == -1 ){
|
479
|
+
/* we can directly use String value in subint */
|
480
|
+
strlen = RSTRING_LENINT(subint);
|
481
|
+
|
482
|
+
if(with_quote){
|
483
|
+
/* size of string assuming the worst case, that every character must be escaped. */
|
484
|
+
current_out = pg_rb_str_ensure_capa( string, strlen * 2 + 2, current_out, NULL );
|
485
|
+
|
486
|
+
current_out += quote_buffer( func_data, RSTRING_PTR(subint), strlen, current_out );
|
487
|
+
} else {
|
488
|
+
current_out = pg_rb_str_ensure_capa( string, strlen, current_out, NULL );
|
489
|
+
memcpy( current_out, RSTRING_PTR(subint), strlen );
|
490
|
+
current_out += strlen;
|
491
|
+
}
|
492
|
+
|
493
|
+
} else {
|
494
|
+
|
495
|
+
if(with_quote){
|
496
|
+
/* size of string assuming the worst case, that every character must be escaped
|
497
|
+
* plus two bytes for quotation.
|
498
|
+
*/
|
499
|
+
current_out = pg_rb_str_ensure_capa( string, 2 * strlen + 2, current_out, NULL );
|
500
|
+
|
501
|
+
/* Place the unescaped string at current output position. */
|
502
|
+
strlen = enc_func(this, value, current_out, &subint, enc_idx);
|
503
|
+
|
504
|
+
current_out += quote_buffer( func_data, current_out, strlen, current_out );
|
505
|
+
}else{
|
506
|
+
/* size of the unquoted string */
|
507
|
+
current_out = pg_rb_str_ensure_capa( string, strlen, current_out, NULL );
|
508
|
+
current_out += enc_func(this, value, current_out, &subint, enc_idx);
|
509
|
+
}
|
510
|
+
}
|
511
|
+
return current_out;
|
512
|
+
}
|
513
|
+
|
514
|
+
static char *
|
515
|
+
write_array(t_pg_composite_coder *this, VALUE value, char *current_out, VALUE string, int quote, int enc_idx)
|
516
|
+
{
|
517
|
+
int i;
|
518
|
+
|
519
|
+
/* size of "{}" */
|
520
|
+
current_out = pg_rb_str_ensure_capa( string, 2, current_out, NULL );
|
521
|
+
*current_out++ = '{';
|
522
|
+
|
523
|
+
for( i=0; i<RARRAY_LEN(value); i++){
|
524
|
+
VALUE entry = rb_ary_entry(value, i);
|
525
|
+
|
526
|
+
if( i > 0 ){
|
527
|
+
current_out = pg_rb_str_ensure_capa( string, 1, current_out, NULL );
|
528
|
+
*current_out++ = this->delimiter;
|
529
|
+
}
|
530
|
+
|
531
|
+
switch(TYPE(entry)){
|
532
|
+
case T_ARRAY:
|
533
|
+
current_out = write_array(this, entry, current_out, string, quote, enc_idx);
|
534
|
+
break;
|
535
|
+
case T_NIL:
|
536
|
+
current_out = pg_rb_str_ensure_capa( string, 4, current_out, NULL );
|
537
|
+
*current_out++ = 'N';
|
538
|
+
*current_out++ = 'U';
|
539
|
+
*current_out++ = 'L';
|
540
|
+
*current_out++ = 'L';
|
541
|
+
break;
|
542
|
+
default:
|
543
|
+
current_out = quote_string( this->elem, entry, string, current_out, quote, quote_array_buffer, this, enc_idx );
|
544
|
+
}
|
545
|
+
}
|
546
|
+
current_out = pg_rb_str_ensure_capa( string, 1, current_out, NULL );
|
547
|
+
*current_out++ = '}';
|
548
|
+
return current_out;
|
549
|
+
}
|
550
|
+
|
551
|
+
|
552
|
+
/*
|
553
|
+
* Document-class: PG::TextEncoder::Array < PG::CompositeEncoder
|
554
|
+
*
|
555
|
+
* This is the encoder class for PostgreSQL array types.
|
556
|
+
*
|
557
|
+
* All values are encoded according to the #elements_type
|
558
|
+
* accessor. Sub-arrays are encoded recursively.
|
559
|
+
*
|
560
|
+
* This encoder expects an Array of values or sub-arrays as input.
|
561
|
+
* Other values are passed through as text without interpretation.
|
562
|
+
*
|
563
|
+
*/
|
564
|
+
static int
|
565
|
+
pg_text_enc_array(t_pg_coder *conv, VALUE value, char *out, VALUE *intermediate, int enc_idx)
|
566
|
+
{
|
567
|
+
char *end_ptr;
|
568
|
+
t_pg_composite_coder *this = (t_pg_composite_coder *)conv;
|
569
|
+
|
570
|
+
if( TYPE(value) == T_ARRAY){
|
571
|
+
VALUE out_str = rb_str_new(NULL, 0);
|
572
|
+
PG_ENCODING_SET_NOCHECK(out_str, enc_idx);
|
573
|
+
|
574
|
+
end_ptr = write_array(this, value, RSTRING_PTR(out_str), out_str, this->needs_quotation, enc_idx);
|
575
|
+
|
576
|
+
rb_str_set_len( out_str, end_ptr - RSTRING_PTR(out_str) );
|
577
|
+
*intermediate = out_str;
|
578
|
+
|
579
|
+
return -1;
|
580
|
+
} else {
|
581
|
+
return pg_coder_enc_to_s( conv, value, out, intermediate, enc_idx );
|
582
|
+
}
|
583
|
+
}
|
584
|
+
|
585
|
+
static char *
|
586
|
+
quote_identifier( VALUE value, VALUE out_string, char *current_out ){
|
587
|
+
char *p_in = RSTRING_PTR(value);
|
588
|
+
size_t strlen = RSTRING_LEN(value);
|
589
|
+
char *p_inend = p_in + strlen;
|
590
|
+
char *end_capa = current_out;
|
591
|
+
|
592
|
+
PG_RB_STR_ENSURE_CAPA( out_string, strlen + 2, current_out, end_capa );
|
593
|
+
*current_out++ = '"';
|
594
|
+
for(; p_in != p_inend; p_in++) {
|
595
|
+
char c = *p_in;
|
596
|
+
if (c == '"'){
|
597
|
+
PG_RB_STR_ENSURE_CAPA( out_string, p_inend - p_in + 2, current_out, end_capa );
|
598
|
+
*current_out++ = '"';
|
599
|
+
} else if (c == 0){
|
600
|
+
rb_raise(rb_eArgError, "string contains null byte");
|
601
|
+
}
|
602
|
+
*current_out++ = c;
|
603
|
+
}
|
604
|
+
PG_RB_STR_ENSURE_CAPA( out_string, 1, current_out, end_capa );
|
605
|
+
*current_out++ = '"';
|
606
|
+
|
607
|
+
return current_out;
|
608
|
+
}
|
609
|
+
|
610
|
+
static char *
|
611
|
+
pg_text_enc_array_identifier(VALUE value, VALUE string, char *out, int enc_idx)
|
612
|
+
{
|
613
|
+
long i;
|
614
|
+
long nr_elems;
|
615
|
+
|
616
|
+
Check_Type(value, T_ARRAY);
|
617
|
+
nr_elems = RARRAY_LEN(value);
|
618
|
+
|
619
|
+
for( i=0; i<nr_elems; i++){
|
620
|
+
VALUE entry = rb_ary_entry(value, i);
|
621
|
+
|
622
|
+
StringValue(entry);
|
623
|
+
if( ENCODING_GET(entry) != enc_idx ){
|
624
|
+
entry = rb_str_export_to_enc(entry, rb_enc_from_index(enc_idx));
|
625
|
+
}
|
626
|
+
out = quote_identifier(entry, string, out);
|
627
|
+
if( i < nr_elems-1 ){
|
628
|
+
out = pg_rb_str_ensure_capa( string, 1, out, NULL );
|
629
|
+
*out++ = '.';
|
630
|
+
}
|
631
|
+
}
|
632
|
+
return out;
|
633
|
+
}
|
634
|
+
|
635
|
+
/*
|
636
|
+
* Document-class: PG::TextEncoder::Identifier < PG::SimpleEncoder
|
637
|
+
*
|
638
|
+
* This is the encoder class for PostgreSQL identifiers.
|
639
|
+
*
|
640
|
+
* An Array value can be used for identifiers of the kind "schema.table.column".
|
641
|
+
* This ensures that each element is properly quoted:
|
642
|
+
* PG::TextEncoder::Identifier.new.encode(['schema', 'table', 'column'])
|
643
|
+
* => '"schema"."table"."column"'
|
644
|
+
*
|
645
|
+
* This encoder can also be used per PG::Connection#quote_ident .
|
646
|
+
*/
|
647
|
+
int
|
648
|
+
pg_text_enc_identifier(t_pg_coder *this, VALUE value, char *out, VALUE *intermediate, int enc_idx)
|
649
|
+
{
|
650
|
+
VALUE out_str;
|
651
|
+
UNUSED( this );
|
652
|
+
if( TYPE(value) == T_ARRAY){
|
653
|
+
out_str = rb_str_new(NULL, 0);
|
654
|
+
out = RSTRING_PTR(out_str);
|
655
|
+
out = pg_text_enc_array_identifier(value, out_str, out, enc_idx);
|
656
|
+
} else {
|
657
|
+
StringValue(value);
|
658
|
+
if( ENCODING_GET(value) != enc_idx ){
|
659
|
+
value = rb_str_export_to_enc(value, rb_enc_from_index(enc_idx));
|
660
|
+
}
|
661
|
+
out_str = rb_str_new(NULL, RSTRING_LEN(value) + 2);
|
662
|
+
out = RSTRING_PTR(out_str);
|
663
|
+
out = quote_identifier(value, out_str, out);
|
664
|
+
}
|
665
|
+
rb_str_set_len( out_str, out - RSTRING_PTR(out_str) );
|
666
|
+
PG_ENCODING_SET_NOCHECK(out_str, enc_idx);
|
667
|
+
*intermediate = out_str;
|
668
|
+
return -1;
|
669
|
+
}
|
670
|
+
|
671
|
+
|
672
|
+
/*
 * Quoting callback for SQL literals.
 *
 * The +strlen+ bytes at +p_in+ are written to +p_out+ enclosed in single
 * quotes, with each single quote within the text doubled.
 *
 * The output is written from right to left, so that +p_in+ and +p_out+ may
 * point to the same buffer. +_this+ is not used.
 * Returns the number of bytes of the output.
 */
static int
quote_literal_buffer( void *_this, char *p_in, int strlen, char *p_out ){
	char *src;
	char *dst;
	int n_quotes = 0;

	/* count the single quotes that have to be doubled */
	src = p_in;
	while( src != p_in + strlen ){
		if( *src == '\'' ) n_quotes++;
		src++;
	}

	/* src now points behind the input, dst behind the final output */
	dst = p_out + strlen + n_quotes + 2;

	/* closing quote */
	*--dst = '\'';

	/* Copy the text to its final position, walking from the end to the
	 * start and doubling the quotes on the way. */
	while( src != p_in ){
		char ch = *--src;

		*--dst = ch;
		if( ch == '\'' ){
			*--dst = '\'';
		}
	}

	/* opening quote */
	*p_out = '\'';
	return strlen + n_quotes + 2;
}
|
702
|
+
|
703
|
+
|
704
|
+
/*
|
705
|
+
* Document-class: PG::TextEncoder::QuotedLiteral < PG::CompositeEncoder
|
706
|
+
*
|
707
|
+
* This is the encoder class for PostgreSQL literals.
|
708
|
+
*
|
709
|
+
* A literal is quoted and escaped by the <tt>'</tt> character, so that it can be inserted into SQL queries.
|
710
|
+
* It works equal to PG::Connection#escape_literal, but integrates into the type cast system of ruby-pg.
|
711
|
+
*
|
712
|
+
* Both expressions have the same result:
|
713
|
+
* conn.escape_literal(PG::TextEncoder::Array.new.encode(["v1","v2"])) # => "'{v1,v2}'"
|
714
|
+
* PG::TextEncoder::QuotedLiteral.new(elements_type: PG::TextEncoder::Array.new).encode(["v1","v2"]) # => "'{v1,v2}'"
|
715
|
+
* While escape_literal requires an intermediate Ruby string allocation, QuotedLiteral encodes the values directly to the result string.
|
716
|
+
*
|
717
|
+
*/
|
718
|
+
static int
|
719
|
+
pg_text_enc_quoted_literal(t_pg_coder *conv, VALUE value, char *out, VALUE *intermediate, int enc_idx)
|
720
|
+
{
|
721
|
+
t_pg_composite_coder *this = (t_pg_composite_coder *)conv;
|
722
|
+
VALUE out_str = rb_str_new(NULL, 0);
|
723
|
+
PG_ENCODING_SET_NOCHECK(out_str, enc_idx);
|
724
|
+
|
725
|
+
out = RSTRING_PTR(out_str);
|
726
|
+
out = quote_string(this->elem, value, out_str, out, this->needs_quotation, quote_literal_buffer, this, enc_idx);
|
727
|
+
rb_str_set_len( out_str, out - RSTRING_PTR(out_str) );
|
728
|
+
*intermediate = out_str;
|
729
|
+
return -1;
|
730
|
+
}
|
731
|
+
|
732
|
+
/*
|
733
|
+
* Document-class: PG::TextEncoder::ToBase64 < PG::CompositeEncoder
|
734
|
+
*
|
735
|
+
* This is an encoder class for conversion of binary to base64 data.
|
736
|
+
*
|
737
|
+
*/
|
738
|
+
static int
|
739
|
+
pg_text_enc_to_base64(t_pg_coder *conv, VALUE value, char *out, VALUE *intermediate, int enc_idx)
|
740
|
+
{
|
741
|
+
int strlen;
|
742
|
+
VALUE subint;
|
743
|
+
t_pg_composite_coder *this = (t_pg_composite_coder *)conv;
|
744
|
+
t_pg_coder_enc_func enc_func = pg_coder_enc_func(this->elem);
|
745
|
+
|
746
|
+
if(out){
|
747
|
+
/* Second encoder pass, if required */
|
748
|
+
strlen = enc_func(this->elem, value, out, intermediate, enc_idx);
|
749
|
+
base64_encode( out, out, strlen );
|
750
|
+
|
751
|
+
return BASE64_ENCODED_SIZE(strlen);
|
752
|
+
} else {
|
753
|
+
/* First encoder pass */
|
754
|
+
strlen = enc_func(this->elem, value, NULL, &subint, enc_idx);
|
755
|
+
|
756
|
+
if( strlen == -1 ){
|
757
|
+
/* Encoded string is returned in subint */
|
758
|
+
VALUE out_str;
|
759
|
+
|
760
|
+
strlen = RSTRING_LENINT(subint);
|
761
|
+
out_str = rb_str_new(NULL, BASE64_ENCODED_SIZE(strlen));
|
762
|
+
PG_ENCODING_SET_NOCHECK(out_str, enc_idx);
|
763
|
+
|
764
|
+
base64_encode( RSTRING_PTR(out_str), RSTRING_PTR(subint), strlen);
|
765
|
+
*intermediate = out_str;
|
766
|
+
|
767
|
+
return -1;
|
768
|
+
} else {
|
769
|
+
*intermediate = subint;
|
770
|
+
|
771
|
+
return BASE64_ENCODED_SIZE(strlen);
|
772
|
+
}
|
773
|
+
}
|
774
|
+
}
|
775
|
+
|
776
|
+
|
777
|
+
void
|
778
|
+
init_pg_text_encoder()
|
779
|
+
{
|
780
|
+
s_id_encode = rb_intern("encode");
|
781
|
+
s_id_to_i = rb_intern("to_i");
|
782
|
+
s_id_to_s = rb_intern("to_s");
|
783
|
+
s_str_F = rb_str_freeze(rb_str_new_cstr("F"));
|
784
|
+
rb_global_variable(&s_str_F);
|
785
|
+
rb_require("bigdecimal");
|
786
|
+
s_cBigDecimal = rb_const_get(rb_cObject, rb_intern("BigDecimal"));
|
787
|
+
|
788
|
+
|
789
|
+
/* This module encapsulates all encoder classes with text output format */
|
790
|
+
rb_mPG_TextEncoder = rb_define_module_under( rb_mPG, "TextEncoder" );
|
791
|
+
|
792
|
+
/* Make RDoc aware of the encoder classes... */
|
793
|
+
/* dummy = rb_define_class_under( rb_mPG_TextEncoder, "Boolean", rb_cPG_SimpleEncoder ); */
|
794
|
+
pg_define_coder( "Boolean", pg_text_enc_boolean, rb_cPG_SimpleEncoder, rb_mPG_TextEncoder );
|
795
|
+
/* dummy = rb_define_class_under( rb_mPG_TextEncoder, "Integer", rb_cPG_SimpleEncoder ); */
|
796
|
+
pg_define_coder( "Integer", pg_text_enc_integer, rb_cPG_SimpleEncoder, rb_mPG_TextEncoder );
|
797
|
+
/* dummy = rb_define_class_under( rb_mPG_TextEncoder, "Float", rb_cPG_SimpleEncoder ); */
|
798
|
+
pg_define_coder( "Float", pg_text_enc_float, rb_cPG_SimpleEncoder, rb_mPG_TextEncoder );
|
799
|
+
/* dummy = rb_define_class_under( rb_mPG_TextEncoder, "Numeric", rb_cPG_SimpleEncoder ); */
|
800
|
+
pg_define_coder( "Numeric", pg_text_enc_numeric, rb_cPG_SimpleEncoder, rb_mPG_TextEncoder );
|
801
|
+
/* dummy = rb_define_class_under( rb_mPG_TextEncoder, "String", rb_cPG_SimpleEncoder ); */
|
802
|
+
pg_define_coder( "String", pg_coder_enc_to_s, rb_cPG_SimpleEncoder, rb_mPG_TextEncoder );
|
803
|
+
/* dummy = rb_define_class_under( rb_mPG_TextEncoder, "Bytea", rb_cPG_SimpleEncoder ); */
|
804
|
+
pg_define_coder( "Bytea", pg_text_enc_bytea, rb_cPG_SimpleEncoder, rb_mPG_TextEncoder );
|
805
|
+
/* dummy = rb_define_class_under( rb_mPG_TextEncoder, "Identifier", rb_cPG_SimpleEncoder ); */
|
806
|
+
pg_define_coder( "Identifier", pg_text_enc_identifier, rb_cPG_SimpleEncoder, rb_mPG_TextEncoder );
|
807
|
+
|
808
|
+
/* dummy = rb_define_class_under( rb_mPG_TextEncoder, "Array", rb_cPG_CompositeEncoder ); */
|
809
|
+
pg_define_coder( "Array", pg_text_enc_array, rb_cPG_CompositeEncoder, rb_mPG_TextEncoder );
|
810
|
+
/* dummy = rb_define_class_under( rb_mPG_TextEncoder, "QuotedLiteral", rb_cPG_CompositeEncoder ); */
|
811
|
+
pg_define_coder( "QuotedLiteral", pg_text_enc_quoted_literal, rb_cPG_CompositeEncoder, rb_mPG_TextEncoder );
|
812
|
+
/* dummy = rb_define_class_under( rb_mPG_TextEncoder, "ToBase64", rb_cPG_CompositeEncoder ); */
|
813
|
+
pg_define_coder( "ToBase64", pg_text_enc_to_base64, rb_cPG_CompositeEncoder, rb_mPG_TextEncoder );
|
814
|
+
}
|