melbourne 1.0.0

Sign up to get free protection for your applications and to get access to all the features.
Files changed (113) hide show
  1. data/HISTORY +3 -0
  2. data/LICENSE +27 -0
  3. data/README.rdoc +38 -0
  4. data/Rakefile +38 -0
  5. data/VERSION.yml +4 -0
  6. data/ext/melbourne/bstring-license.txt +29 -0
  7. data/ext/melbourne/bstrlib.c +2918 -0
  8. data/ext/melbourne/bstrlib.h +302 -0
  9. data/ext/melbourne/extconf.rb +76 -0
  10. data/ext/melbourne/grammar.cpp +11885 -0
  11. data/ext/melbourne/grammar.hpp +14 -0
  12. data/ext/melbourne/grammar.y +6013 -0
  13. data/ext/melbourne/internal.hpp +137 -0
  14. data/ext/melbourne/lex.c.tab +136 -0
  15. data/ext/melbourne/local_state.hpp +41 -0
  16. data/ext/melbourne/melbourne.cpp +37 -0
  17. data/ext/melbourne/node.hpp +262 -0
  18. data/ext/melbourne/node_types.cpp +245 -0
  19. data/ext/melbourne/node_types.hpp +135 -0
  20. data/ext/melbourne/node_types.rb +190 -0
  21. data/ext/melbourne/quark.cpp +52 -0
  22. data/ext/melbourne/quark.hpp +14 -0
  23. data/ext/melbourne/symbols.cpp +219 -0
  24. data/ext/melbourne/symbols.hpp +116 -0
  25. data/ext/melbourne/var_table.cpp +113 -0
  26. data/ext/melbourne/var_table.hpp +33 -0
  27. data/ext/melbourne/visitor.cpp +1052 -0
  28. data/ext/melbourne/visitor.hpp +20 -0
  29. data/lib/melbourne/ast/constants.rb +128 -0
  30. data/lib/melbourne/ast/control_flow.rb +382 -0
  31. data/lib/melbourne/ast/data.rb +19 -0
  32. data/lib/melbourne/ast/definitions.rb +561 -0
  33. data/lib/melbourne/ast/exceptions.rb +182 -0
  34. data/lib/melbourne/ast/file.rb +15 -0
  35. data/lib/melbourne/ast/grapher.rb +75 -0
  36. data/lib/melbourne/ast/literals.rb +268 -0
  37. data/lib/melbourne/ast/node.rb +21 -0
  38. data/lib/melbourne/ast/operators.rb +117 -0
  39. data/lib/melbourne/ast/self.rb +17 -0
  40. data/lib/melbourne/ast/sends.rb +451 -0
  41. data/lib/melbourne/ast/values.rb +74 -0
  42. data/lib/melbourne/ast/variables.rb +251 -0
  43. data/lib/melbourne/ast.rb +22 -0
  44. data/lib/melbourne/parser.rb +38 -0
  45. data/lib/melbourne/processor.rb +460 -0
  46. data/lib/melbourne.rb +46 -0
  47. data/spec/helpers/ast/node.rb +15 -0
  48. data/spec/helpers/ast/reduced_graph.rb +64 -0
  49. data/spec/lib/parser/alias_spec.rb +97 -0
  50. data/spec/lib/parser/and_spec.rb +63 -0
  51. data/spec/lib/parser/array_spec.rb +157 -0
  52. data/spec/lib/parser/attrasgn_spec.rb +401 -0
  53. data/spec/lib/parser/back_ref_spec.rb +20 -0
  54. data/spec/lib/parser/call_spec.rb +958 -0
  55. data/spec/lib/parser/case_spec.rb +577 -0
  56. data/spec/lib/parser/cdecl_spec.rb +108 -0
  57. data/spec/lib/parser/class_spec.rb +221 -0
  58. data/spec/lib/parser/colon2_spec.rb +13 -0
  59. data/spec/lib/parser/colon3_spec.rb +12 -0
  60. data/spec/lib/parser/const_spec.rb +12 -0
  61. data/spec/lib/parser/cvar_spec.rb +55 -0
  62. data/spec/lib/parser/cvasgn_spec.rb +71 -0
  63. data/spec/lib/parser/cvdecl_spec.rb +31 -0
  64. data/spec/lib/parser/defined_spec.rb +353 -0
  65. data/spec/lib/parser/defn_spec.rb +1409 -0
  66. data/spec/lib/parser/defs_spec.rb +247 -0
  67. data/spec/lib/parser/dot2_spec.rb +29 -0
  68. data/spec/lib/parser/dot3_spec.rb +29 -0
  69. data/spec/lib/parser/dregx_spec.rb +127 -0
  70. data/spec/lib/parser/dstr_spec.rb +453 -0
  71. data/spec/lib/parser/dsym_spec.rb +31 -0
  72. data/spec/lib/parser/dxstr_spec.rb +31 -0
  73. data/spec/lib/parser/ensure_spec.rb +279 -0
  74. data/spec/lib/parser/false_spec.rb +12 -0
  75. data/spec/lib/parser/flip2_spec.rb +138 -0
  76. data/spec/lib/parser/flip3_spec.rb +100 -0
  77. data/spec/lib/parser/for_spec.rb +279 -0
  78. data/spec/lib/parser/gasgn_spec.rb +34 -0
  79. data/spec/lib/parser/gvar_spec.rb +33 -0
  80. data/spec/lib/parser/hash_spec.rb +77 -0
  81. data/spec/lib/parser/iasgn_spec.rb +54 -0
  82. data/spec/lib/parser/if_spec.rb +439 -0
  83. data/spec/lib/parser/iter_spec.rb +2582 -0
  84. data/spec/lib/parser/lasgn_spec.rb +1066 -0
  85. data/spec/lib/parser/lit_spec.rb +75 -0
  86. data/spec/lib/parser/masgn_spec.rb +1970 -0
  87. data/spec/lib/parser/match2_spec.rb +47 -0
  88. data/spec/lib/parser/match3_spec.rb +54 -0
  89. data/spec/lib/parser/match_spec.rb +19 -0
  90. data/spec/lib/parser/module_spec.rb +102 -0
  91. data/spec/lib/parser/nil_spec.rb +13 -0
  92. data/spec/lib/parser/not_spec.rb +39 -0
  93. data/spec/lib/parser/nth_ref_spec.rb +12 -0
  94. data/spec/lib/parser/op_asgn_spec.rb +619 -0
  95. data/spec/lib/parser/or_spec.rb +155 -0
  96. data/spec/lib/parser/postexe_spec.rb +31 -0
  97. data/spec/lib/parser/regex_spec.rb +52 -0
  98. data/spec/lib/parser/rescue_spec.rb +1028 -0
  99. data/spec/lib/parser/return_spec.rb +151 -0
  100. data/spec/lib/parser/sclass_spec.rb +172 -0
  101. data/spec/lib/parser/str_spec.rb +162 -0
  102. data/spec/lib/parser/super_spec.rb +276 -0
  103. data/spec/lib/parser/true_spec.rb +12 -0
  104. data/spec/lib/parser/undef_spec.rb +222 -0
  105. data/spec/lib/parser/until_spec.rb +286 -0
  106. data/spec/lib/parser/valias_spec.rb +12 -0
  107. data/spec/lib/parser/while_spec.rb +458 -0
  108. data/spec/lib/parser/xstr_spec.rb +12 -0
  109. data/spec/lib/parser/yield_spec.rb +202 -0
  110. data/spec/lib/parser/zsuper_spec.rb +101 -0
  111. data/spec/matchers/parse_as.rb +27 -0
  112. data/spec/spec_helper.rb +10 -0
  113. metadata +168 -0
@@ -0,0 +1,2918 @@
1
+ /*
2
+ * This source file is part of the bstring string library. This code was
3
+ * written by Paul Hsieh in 2002-2007, and is covered by the BSD open source
4
+ * license. Refer to the accompanying documentation for details on usage and
5
+ * license.
6
+ */
7
+
8
+ /*
9
+ * bstrlib.c
10
+ *
11
+ * This file is the core module for implementing the bstring functions.
12
+ */
13
+
14
+ #include <stdio.h>
15
+ #include <stddef.h>
16
+ #include <stdarg.h>
17
+ #include <stdlib.h>
18
+ #include <string.h>
19
+ #include <ctype.h>
20
+ #include "bstrlib.h"
21
+
22
+ /* Optionally include a mechanism for debugging memory */
23
+
24
+ #if defined(MEMORY_DEBUG) || defined(BSTRLIB_MEMORY_DEBUG)
25
+ #include "memdbg.h"
26
+ #endif
27
+
28
+ #ifndef bstr__alloc
29
+ #define bstr__alloc(x) malloc (x)
30
+ #endif
31
+
32
+ #ifndef bstr__free
33
+ #define bstr__free(p) free (p)
34
+ #endif
35
+
36
+ #ifndef bstr__realloc
37
+ #define bstr__realloc(p,x) realloc ((p), (x))
38
+ #endif
39
+
40
+ #ifndef bstr__memcpy
41
+ #define bstr__memcpy(d,s,l) memcpy ((d), (s), (l))
42
+ #endif
43
+
44
+ #ifndef bstr__memmove
45
+ #define bstr__memmove(d,s,l) memmove ((d), (s), (l))
46
+ #endif
47
+
48
+ #ifndef bstr__memset
49
+ #define bstr__memset(d,c,l) memset ((d), (c), (l))
50
+ #endif
51
+
52
+ #ifndef bstr__memcmp
53
+ #define bstr__memcmp(d,c,l) memcmp ((d), (c), (l))
54
+ #endif
55
+
56
+ #ifndef bstr__memchr
57
+ #define bstr__memchr(s,c,l) memchr ((s), (c), (l))
58
+ #endif
59
+
60
+ /* Just a length safe wrapper for memmove. */
61
+
62
+ #define bBlockCopy(D,S,L) { if ((L) > 0) bstr__memmove ((D),(S),(L)); }
63
+
64
+ /* Compute the snapped size for a given requested size. By snapping to powers
65
+ of 2 like this, repeated reallocations are avoided. */
66
+ static int snapUpSize (int i) {
67
+ if (i < 8) {
68
+ i = 8;
69
+ } else {
70
+ unsigned int j;
71
+ j = (unsigned int) i;
72
+
73
+ j |= (j >> 1);
74
+ j |= (j >> 2);
75
+ j |= (j >> 4);
76
+ j |= (j >> 8); /* Ok, since int >= 16 bits */
77
+ #if (UINT_MAX != 0xffff)
78
+ j |= (j >> 16); /* For 32 bit int systems */
79
+ #if (UINT_MAX > 0xffffffffUL)
80
+ j |= (j >> 32); /* For 64 bit int systems */
81
+ #endif
82
+ #endif
83
+ /* Least power of two greater than i */
84
+ j++;
85
+ if ((int) j >= i) i = (int) j;
86
+ }
87
+ return i;
88
+ }
89
+
90
+ /* int balloc (bstring b, int len)
91
+ *
92
+ * Increase the size of the memory backing the bstring b to at least len.
93
+ */
94
+ int balloc (bstring b, int olen) {
95
+ int len;
96
+ if (b == NULL || b->data == NULL || b->slen < 0 || b->mlen <= 0 ||
97
+ b->mlen < b->slen || olen <= 0) {
98
+ return BSTR_ERR;
99
+ }
100
+
101
+ if (olen >= b->mlen) {
102
+ unsigned char * x;
103
+
104
+ if ((len = snapUpSize (olen)) <= b->mlen) return BSTR_OK;
105
+
106
+ /* Assume probability of a non-moving realloc is 0.125 */
107
+ if (7 * b->mlen < 8 * b->slen) {
108
+
109
+ /* If slen is close to mlen in size then use realloc to reduce
110
+ the memory defragmentation */
111
+
112
+ reallocStrategy:;
113
+
114
+ x = (unsigned char *) bstr__realloc (b->data, (size_t) len);
115
+ if (x == NULL) {
116
+
117
+ /* Since we failed, try allocating the tighest possible
118
+ allocation */
119
+
120
+ if (NULL == (x = (unsigned char *) bstr__realloc (b->data, (size_t) (len = olen)))) {
121
+ return BSTR_ERR;
122
+ }
123
+ }
124
+ } else {
125
+
126
+ /* If slen is not close to mlen then avoid the penalty of copying
127
+ the extra bytes that are allocated, but not considered part of
128
+ the string */
129
+
130
+ if (NULL == (x = (unsigned char *) bstr__alloc ((size_t) len))) {
131
+
132
+ /* Perhaps there is no available memory for the two
133
+ allocations to be in memory at once */
134
+
135
+ goto reallocStrategy;
136
+
137
+ } else {
138
+ if (b->slen) bstr__memcpy ((char *) x, (char *) b->data, (size_t) b->slen);
139
+ bstr__free (b->data);
140
+ }
141
+ }
142
+ b->data = x;
143
+ b->mlen = len;
144
+ b->data[b->slen] = (unsigned char) '\0';
145
+ }
146
+
147
+ return BSTR_OK;
148
+ }
149
+
150
+ /* int ballocmin (bstring b, int len)
151
+ *
152
+ * Set the size of the memory backing the bstring b to len or b->slen+1,
153
+ * whichever is larger. Note that repeated use of this function can degrade
154
+ * performance.
155
+ */
156
+ int ballocmin (bstring b, int len) {
157
+ unsigned char * s;
158
+
159
+ if (b == NULL || b->data == NULL || (b->slen+1) < 0 || b->mlen <= 0 ||
160
+ b->mlen < b->slen || len <= 0) {
161
+ return BSTR_ERR;
162
+ }
163
+
164
+ if (len < b->slen + 1) len = b->slen + 1;
165
+
166
+ if (len != b->mlen) {
167
+ s = (unsigned char *) bstr__realloc (b->data, (size_t) len);
168
+ if (NULL == s) return BSTR_ERR;
169
+ s[b->slen] = (unsigned char) '\0';
170
+ b->data = s;
171
+ b->mlen = len;
172
+ }
173
+
174
+ return BSTR_OK;
175
+ }
176
+
177
+ /* bstring bfromcstr (const char * str)
178
+ *
179
+ * Create a bstring which contains the contents of the '\0' terminated char *
180
+ * buffer str.
181
+ */
182
+ bstring bfromcstr (const char * str) {
183
+ bstring b;
184
+ int i;
185
+ size_t j;
186
+
187
+ if (str == NULL) return NULL;
188
+ j = (strlen) (str);
189
+ i = snapUpSize ((int) (j + (2 - (j != 0))));
190
+ if (i <= (int) j) return NULL;
191
+
192
+ b = (bstring) bstr__alloc (sizeof (struct tagbstring));
193
+ if (NULL == b) return NULL;
194
+ b->slen = (int) j;
195
+ if (NULL == (b->data = (unsigned char *) bstr__alloc (b->mlen = i))) {
196
+ bstr__free (b);
197
+ return NULL;
198
+ }
199
+
200
+ bstr__memcpy (b->data, str, j+1);
201
+ return b;
202
+ }
203
+
204
+ /* bstring bfromcstralloc (int mlen, const char * str)
205
+ *
206
+ * Create a bstring which contains the contents of the '\0' terminated char *
207
+ * buffer str. The memory buffer backing the string is at least len
208
+ * characters in length.
209
+ */
210
+ bstring bfromcstralloc (int mlen, const char * str) {
211
+ bstring b;
212
+ int i;
213
+ size_t j;
214
+
215
+ if (str == NULL) return NULL;
216
+ j = (strlen) (str);
217
+ i = snapUpSize ((int) (j + (2 - (j != 0))));
218
+ if (i <= (int) j) return NULL;
219
+
220
+ b = (bstring) bstr__alloc (sizeof (struct tagbstring));
221
+ if (b == NULL) return NULL;
222
+ b->slen = (int) j;
223
+ if (i < mlen) i = mlen;
224
+
225
+ if (NULL == (b->data = (unsigned char *) bstr__alloc (b->mlen = i))) {
226
+ bstr__free (b);
227
+ return NULL;
228
+ }
229
+
230
+ bstr__memcpy (b->data, str, j+1);
231
+ return b;
232
+ }
233
+
234
+ /* bstring blk2bstr (const void * blk, int len)
235
+ *
236
+ * Create a bstring which contains the content of the block blk of length
237
+ * len.
238
+ */
239
+ bstring blk2bstr (const void * blk, int len) {
240
+ bstring b;
241
+ int i;
242
+
243
+ if (blk == NULL || len < 0) return NULL;
244
+ b = (bstring) bstr__alloc (sizeof (struct tagbstring));
245
+ if (b == NULL) return NULL;
246
+ b->slen = len;
247
+
248
+ i = len + (2 - (len != 0));
249
+ i = snapUpSize (i);
250
+
251
+ b->mlen = i;
252
+
253
+ b->data = (unsigned char *) bstr__alloc ((size_t) b->mlen);
254
+ if (b->data == NULL) {
255
+ bstr__free (b);
256
+ return NULL;
257
+ }
258
+
259
+ if (len > 0) bstr__memcpy (b->data, blk, (size_t) len);
260
+ b->data[len] = (unsigned char) '\0';
261
+
262
+ return b;
263
+ }
264
+
265
+ /* char * bstr2cstr (const_bstring s, char z)
266
+ *
267
+ * Create a '\0' terminated char * buffer which is equal to the contents of
268
+ * the bstring s, except that any contained '\0' characters are converted
269
+ * to the character in z. This returned value should be freed with a
270
+ * bcstrfree () call, by the calling application.
271
+ */
272
+ char * bstr2cstr (const_bstring b, char z) {
273
+ int i, l;
274
+ char * r;
275
+
276
+ if (b == NULL || b->slen < 0 || b->data == NULL) return NULL;
277
+ l = b->slen;
278
+ r = (char *) bstr__alloc ((size_t) (l + 1));
279
+ if (r == NULL) return r;
280
+
281
+ for (i=0; i < l; i ++) {
282
+ r[i] = (char) ((b->data[i] == '\0') ? z : (char) (b->data[i]));
283
+ }
284
+
285
+ r[l] = (unsigned char) '\0';
286
+
287
+ return r;
288
+ }
289
+
290
+ /* int bcstrfree (char * s)
291
+ *
292
+ * Frees a C-string generated by bstr2cstr (). This is normally unnecessary
293
+ * since it just wraps a call to bstr__free (), however, if bstr__alloc ()
294
+ * and bstr__free () have been redefined as a macros within the bstrlib
295
+ * module (via defining them in memdbg.h after defining
296
+ * BSTRLIB_MEMORY_DEBUG) with some difference in behaviour from the std
297
+ * library functions, then this allows a correct way of freeing the memory
298
+ * that allows higher level code to be independent from these macro
299
+ * redefinitions.
300
+ */
301
+ int bcstrfree (char * s) {
302
+ if (s) {
303
+ bstr__free (s);
304
+ return BSTR_OK;
305
+ }
306
+ return BSTR_ERR;
307
+ }
308
+
309
+ /* int bconcat (bstring b0, const_bstring b1)
310
+ *
311
+ * Concatenate the bstring b1 to the bstring b0.
312
+ */
313
+ int bconcat (bstring b0, const_bstring b1) {
314
+ int len, d;
315
+ bstring aux = (bstring) b1;
316
+
317
+ if (b0 == NULL || b1 == NULL || b0->data == NULL || b1->data == NULL) return BSTR_ERR;
318
+
319
+ d = b0->slen;
320
+ len = b1->slen;
321
+ if ((d | (b0->mlen - d) | len) < 0) return BSTR_ERR;
322
+
323
+ if (b0->mlen <= d + len + 1) {
324
+ ptrdiff_t pd;
325
+ if (0 <= (pd = b1->data - b0->data) && pd < b0->mlen) {
326
+ if (NULL == (aux = bstrcpy (b1))) return BSTR_ERR;
327
+ }
328
+ if (balloc (b0, d + len + 1) != BSTR_OK) {
329
+ if (aux != b1) bdestroy (aux);
330
+ return BSTR_ERR;
331
+ }
332
+ }
333
+
334
+ bBlockCopy (&b0->data[d], &aux->data[0], (size_t) len);
335
+ b0->data[d + len] = (unsigned char) '\0';
336
+ b0->slen += len;
337
+ if (aux != b1) bdestroy (aux);
338
+ return BSTR_OK;
339
+ }
340
+
341
+ /* int bconchar (bstring b, char c)
342
+ *
343
+ * Concatenate the single character c to the bstring b.
344
+ */
345
+ int bconchar (bstring b, char c) {
346
+ int d;
347
+
348
+ if (b == NULL) return BSTR_ERR;
349
+ d = b->slen;
350
+ if ((d | (b->mlen - d)) < 0 || balloc (b, d + 2) != BSTR_OK) return BSTR_ERR;
351
+ b->data[d] = (unsigned char) c;
352
+ b->data[d + 1] = (unsigned char) '\0';
353
+ b->slen++;
354
+ return BSTR_OK;
355
+ }
356
+
357
+ /* int bcatcstr (bstring b, const char * s)
358
+ *
359
+ * Concatenate a char * string to a bstring.
360
+ */
361
+ int bcatcstr (bstring b, const char * s) {
362
+ char * d;
363
+ int i, l;
364
+
365
+ if (b == NULL || b->data == NULL || b->slen < 0 || b->mlen < b->slen
366
+ || b->mlen <= 0 || s == NULL) return BSTR_ERR;
367
+
368
+ /* Optimistically concatenate directly */
369
+ l = b->mlen - b->slen;
370
+ d = (char *) &b->data[b->slen];
371
+ for (i=0; i < l; i++) {
372
+ if ((*d++ = *s++) == '\0') {
373
+ b->slen += i;
374
+ return BSTR_OK;
375
+ }
376
+ }
377
+ b->slen += i;
378
+
379
+ /* Need to explicitely resize and concatenate tail */
380
+ return bcatblk (b, (const void *) s, (int) strlen (s));
381
+ }
382
+
383
+ /* int bcatblk (bstring b, const void * s, int len)
384
+ *
385
+ * Concatenate a fixed length buffer to a bstring.
386
+ */
387
+ int bcatblk (bstring b, const void * s, int len) {
388
+ int nl;
389
+
390
+ if (b == NULL || b->data == NULL || b->slen < 0 || b->mlen < b->slen
391
+ || b->mlen <= 0 || s == NULL || len < 0) return BSTR_ERR;
392
+
393
+ if (0 > (nl = b->slen + len)) return BSTR_ERR; /* Overflow? */
394
+ if (b->mlen <= nl && 0 > balloc (b, nl + 1)) return BSTR_ERR;
395
+
396
+ bBlockCopy (&b->data[b->slen], s, (size_t) len);
397
+ b->slen = nl;
398
+ b->data[nl] = (unsigned char) '\0';
399
+ return BSTR_OK;
400
+ }
401
+
402
+ /* bstring bstrcpy (const_bstring b)
403
+ *
404
+ * Create a copy of the bstring b.
405
+ */
406
+ bstring bstrcpy (const_bstring b) {
407
+ bstring b0;
408
+ int i,j;
409
+
410
+ /* Attempted to copy an invalid string? */
411
+ if (b == NULL || b->slen < 0 || b->data == NULL) return NULL;
412
+
413
+ b0 = (bstring) bstr__alloc (sizeof (struct tagbstring));
414
+ if (b0 == NULL) {
415
+ /* Unable to allocate memory for string header */
416
+ return NULL;
417
+ }
418
+
419
+ i = b->slen;
420
+ j = snapUpSize (i + 1);
421
+
422
+ b0->data = (unsigned char *) bstr__alloc (j);
423
+ if (b0->data == NULL) {
424
+ j = i + 1;
425
+ b0->data = (unsigned char *) bstr__alloc (j);
426
+ if (b0->data == NULL) {
427
+ /* Unable to allocate memory for string data */
428
+ bstr__free (b0);
429
+ return NULL;
430
+ }
431
+ }
432
+
433
+ b0->mlen = j;
434
+ b0->slen = i;
435
+
436
+ if (i) bstr__memcpy ((char *) b0->data, (char *) b->data, i);
437
+ b0->data[b0->slen] = (unsigned char) '\0';
438
+
439
+ return b0;
440
+ }
441
+
442
+ /* int bassign (bstring a, const_bstring b)
443
+ *
444
+ * Overwrite the string a with the contents of string b.
445
+ */
446
+ int bassign (bstring a, const_bstring b) {
447
+ if (b == NULL || b->data == NULL || b->slen < 0)
448
+ return BSTR_ERR;
449
+ if (b->slen != 0) {
450
+ if (balloc (a, b->slen) != BSTR_OK) return BSTR_ERR;
451
+ bstr__memmove (a->data, b->data, b->slen);
452
+ } else {
453
+ if (a == NULL || a->data == NULL || a->mlen < a->slen ||
454
+ a->slen < 0 || a->mlen == 0)
455
+ return BSTR_ERR;
456
+ }
457
+ a->data[b->slen] = (unsigned char) '\0';
458
+ a->slen = b->slen;
459
+ return BSTR_OK;
460
+ }
461
+
462
+ /* int bassignmidstr (bstring a, const_bstring b, int left, int len)
463
+ *
464
+ * Overwrite the string a with the middle of contents of string b
465
+ * starting from position left and running for a length len. left and
466
+ * len are clamped to the ends of b as with the function bmidstr.
467
+ */
468
+ int bassignmidstr (bstring a, const_bstring b, int left, int len) {
469
+ if (b == NULL || b->data == NULL || b->slen < 0)
470
+ return BSTR_ERR;
471
+
472
+ if (left < 0) {
473
+ len += left;
474
+ left = 0;
475
+ }
476
+
477
+ if (len > b->slen - left) len = b->slen - left;
478
+
479
+ if (a == NULL || a->data == NULL || a->mlen < a->slen ||
480
+ a->slen < 0 || a->mlen == 0)
481
+ return BSTR_ERR;
482
+
483
+ if (len > 0) {
484
+ if (balloc (a, len) != BSTR_OK) return BSTR_ERR;
485
+ bstr__memmove (a->data, b->data + left, len);
486
+ a->slen = len;
487
+ } else {
488
+ a->slen = 0;
489
+ }
490
+ a->data[a->slen] = (unsigned char) '\0';
491
+ return BSTR_OK;
492
+ }
493
+
494
+ /* int bassigncstr (bstring a, const char * str)
495
+ *
496
+ * Overwrite the string a with the contents of char * string str. Note that
497
+ * the bstring a must be a well defined and writable bstring. If an error
498
+ * occurs BSTR_ERR is returned however a may be partially overwritten.
499
+ */
500
+ int bassigncstr (bstring a, const char * str) {
501
+ int i;
502
+ size_t len;
503
+ if (a == NULL || a->data == NULL || a->mlen < a->slen ||
504
+ a->slen < 0 || a->mlen == 0 || NULL == str)
505
+ return BSTR_ERR;
506
+
507
+ for (i=0; i < a->mlen; i++) {
508
+ if ('\0' == (a->data[i] = str[i])) {
509
+ a->slen = i;
510
+ return BSTR_OK;
511
+ }
512
+ }
513
+
514
+ a->slen = i;
515
+ len = strlen (str + i);
516
+ if (len > INT_MAX || i + len + 1 > INT_MAX ||
517
+ 0 > balloc (a, (int) (i + len + 1))) return BSTR_ERR;
518
+ bBlockCopy (a->data + i, str + i, (size_t) len + 1);
519
+ a->slen += (int) len;
520
+ return BSTR_OK;
521
+ }
522
+
523
+ /* int bassignblk (bstring a, const void * s, int len)
524
+ *
525
+ * Overwrite the string a with the contents of the block (s, len). Note that
526
+ * the bstring a must be a well defined and writable bstring. If an error
527
+ * occurs BSTR_ERR is returned and a is not overwritten.
528
+ */
529
+ int bassignblk (bstring a, const void * s, int len) {
530
+ if (a == NULL || a->data == NULL || a->mlen < a->slen ||
531
+ a->slen < 0 || a->mlen == 0 || NULL == s || len + 1 < 1)
532
+ return BSTR_ERR;
533
+ if (len + 1 > a->mlen && 0 > balloc (a, len + 1)) return BSTR_ERR;
534
+ bBlockCopy (a->data, s, (size_t) len);
535
+ a->data[len] = (unsigned char) '\0';
536
+ a->slen = len;
537
+ return BSTR_OK;
538
+ }
539
+
540
+ /* int btrunc (bstring b, int n)
541
+ *
542
+ * Truncate the bstring to at most n characters.
543
+ */
544
+ int btrunc (bstring b, int n) {
545
+ if (n < 0 || b == NULL || b->data == NULL || b->mlen < b->slen ||
546
+ b->slen < 0 || b->mlen <= 0) return BSTR_ERR;
547
+ if (b->slen > n) {
548
+ b->slen = n;
549
+ b->data[n] = (unsigned char) '\0';
550
+ }
551
+ return BSTR_OK;
552
+ }
553
+
554
+ #define upcase(c) (toupper ((unsigned char) c))
555
+ #define downcase(c) (tolower ((unsigned char) c))
556
+ #define wspace(c) (isspace ((unsigned char) c))
557
+
558
+ /* int btoupper (bstring b)
559
+ *
560
+ * Convert contents of bstring to upper case.
561
+ */
562
+ int btoupper (bstring b) {
563
+ int i, len;
564
+ if (b == NULL || b->data == NULL || b->mlen < b->slen ||
565
+ b->slen < 0 || b->mlen <= 0) return BSTR_ERR;
566
+ for (i=0, len = b->slen; i < len; i++) {
567
+ b->data[i] = (unsigned char) upcase (b->data[i]);
568
+ }
569
+ return BSTR_OK;
570
+ }
571
+
572
+ /* int btolower (bstring b)
573
+ *
574
+ * Convert contents of bstring to lower case.
575
+ */
576
+ int btolower (bstring b) {
577
+ int i, len;
578
+ if (b == NULL || b->data == NULL || b->mlen < b->slen ||
579
+ b->slen < 0 || b->mlen <= 0) return BSTR_ERR;
580
+ for (i=0, len = b->slen; i < len; i++) {
581
+ b->data[i] = (unsigned char) downcase (b->data[i]);
582
+ }
583
+ return BSTR_OK;
584
+ }
585
+
586
+ /* int bstricmp (const_bstring b0, const_bstring b1)
587
+ *
588
+ * Compare two strings without differentiating between case. The return
589
+ * value is the difference of the values of the characters where the two
590
+ * strings first differ after lower case transformation, otherwise 0 is
591
+ * returned indicating that the strings are equal. If the lengths are
592
+ * different, then a difference from 0 is given, but if the first extra
593
+ * character is '\0', then it is taken to be the value UCHAR_MAX+1.
594
+ */
595
+ int bstricmp (const_bstring b0, const_bstring b1) {
596
+ int i, v, n;
597
+
598
+ if (bdata (b0) == NULL || b0->slen < 0 ||
599
+ bdata (b1) == NULL || b1->slen < 0) return SHRT_MIN;
600
+ if ((n = b0->slen) > b1->slen) n = b1->slen;
601
+ else if (b0->slen == b1->slen && b0->data == b1->data) return BSTR_OK;
602
+
603
+ for (i = 0; i < n; i ++) {
604
+ v = (char) downcase (b0->data[i])
605
+ - (char) downcase (b1->data[i]);
606
+ if (0 != v) return v;
607
+ }
608
+
609
+ if (b0->slen > n) {
610
+ v = (char) downcase (b0->data[n]);
611
+ if (v) return v;
612
+ return UCHAR_MAX + 1;
613
+ }
614
+ if (b1->slen > n) {
615
+ v = - (char) downcase (b1->data[n]);
616
+ if (v) return v;
617
+ return - (int) (UCHAR_MAX + 1);
618
+ }
619
+ return BSTR_OK;
620
+ }
621
+
622
+ /* int bstrnicmp (const_bstring b0, const_bstring b1, int n)
623
+ *
624
+ * Compare two strings without differentiating between case for at most n
625
+ * characters. If the position where the two strings first differ is
626
+ * before the nth position, the return value is the difference of the values
627
+ * of the characters, otherwise 0 is returned. If the lengths are different
628
+ * and less than n characters, then a difference from 0 is given, but if the
629
+ * first extra character is '\0', then it is taken to be the value
630
+ * UCHAR_MAX+1.
631
+ */
632
+ int bstrnicmp (const_bstring b0, const_bstring b1, int n) {
633
+ int i, v, m;
634
+
635
+ if (bdata (b0) == NULL || b0->slen < 0 ||
636
+ bdata (b1) == NULL || b1->slen < 0 || n < 0) return SHRT_MIN;
637
+ m = n;
638
+ if (m > b0->slen) m = b0->slen;
639
+ if (m > b1->slen) m = b1->slen;
640
+
641
+ if (b0->data != b1->data) {
642
+ for (i = 0; i < m; i ++) {
643
+ v = (char) downcase (b0->data[i]);
644
+ v -= (char) downcase (b1->data[i]);
645
+ if (v != 0) return b0->data[i] - b1->data[i];
646
+ }
647
+ }
648
+
649
+ if (n == m || b0->slen == b1->slen) return BSTR_OK;
650
+
651
+ if (b0->slen > m) {
652
+ v = (char) downcase (b0->data[m]);
653
+ if (v) return v;
654
+ return UCHAR_MAX + 1;
655
+ }
656
+
657
+ v = - (char) downcase (b1->data[m]);
658
+ if (v) return v;
659
+ return - (int) (UCHAR_MAX + 1);
660
+ }
661
+
662
+ /* int biseqcaseless (const_bstring b0, const_bstring b1)
663
+ *
664
+ * Compare two strings for equality without differentiating between case.
665
+ * If the strings differ other than in case, 0 is returned, if the strings
666
+ * are the same, 1 is returned, if there is an error, -1 is returned. If
667
+ * the length of the strings are different, this function is O(1). '\0'
668
+ * termination characters are not treated in any special way.
669
+ */
670
+ int biseqcaseless (const_bstring b0, const_bstring b1) {
671
+ int i, n;
672
+
673
+ if (bdata (b0) == NULL || b0->slen < 0 ||
674
+ bdata (b1) == NULL || b1->slen < 0) return BSTR_ERR;
675
+ if (b0->slen != b1->slen) return BSTR_OK;
676
+ if (b0->data == b1->data || b0->slen == 0) return 1;
677
+ for (i=0, n=b0->slen; i < n; i++) {
678
+ if (b0->data[i] != b1->data[i]) {
679
+ unsigned char c = (unsigned char) downcase (b0->data[i]);
680
+ if (c != (unsigned char) downcase (b1->data[i])) return 0;
681
+ }
682
+ }
683
+ return 1;
684
+ }
685
+
686
+ /* int bisstemeqcaselessblk (const_bstring b0, const void * blk, int len)
687
+ *
688
+ * Compare beginning of string b0 with a block of memory of length len
689
+ * without differentiating between case for equality. If the beginning of b0
690
+ * differs from the memory block other than in case (or if b0 is too short),
691
+ * 0 is returned, if the strings are the same, 1 is returned, if there is an
692
+ * error, -1 is returned. '\0' characters are not treated in any special
693
+ * way.
694
+ */
695
+ int bisstemeqcaselessblk (const_bstring b0, const void * blk, int len) {
696
+ int i;
697
+
698
+ if (bdata (b0) == NULL || b0->slen < 0 || NULL == blk || len < 0)
699
+ return BSTR_ERR;
700
+ if (b0->slen < len) return BSTR_OK;
701
+ if (b0->data == (const unsigned char *) blk || len == 0) return 1;
702
+
703
+ for (i = 0; i < len; i ++) {
704
+ if (b0->data[i] != ((const unsigned char *) blk)[i]) {
705
+ if (downcase (b0->data[i]) !=
706
+ downcase (((const unsigned char *) blk)[i])) return 0;
707
+ }
708
+ }
709
+ return 1;
710
+ }
711
+
712
+ /*
713
+ * int bltrimws (bstring b)
714
+ *
715
+ * Delete whitespace contiguous from the left end of the string.
716
+ */
717
+ int bltrimws (bstring b) {
718
+ int i, len;
719
+
720
+ if (b == NULL || b->data == NULL || b->mlen < b->slen ||
721
+ b->slen < 0 || b->mlen <= 0) return BSTR_ERR;
722
+
723
+ for (len = b->slen, i = 0; i < len; i++) {
724
+ if (!wspace (b->data[i])) {
725
+ return bdelete (b, 0, i);
726
+ }
727
+ }
728
+
729
+ b->data[0] = (unsigned char) '\0';
730
+ b->slen = 0;
731
+ return BSTR_OK;
732
+ }
733
+
734
+ /*
735
+ * int brtrimws (bstring b)
736
+ *
737
+ * Delete whitespace contiguous from the right end of the string.
738
+ */
739
+ int brtrimws (bstring b) {
740
+ int i;
741
+
742
+ if (b == NULL || b->data == NULL || b->mlen < b->slen ||
743
+ b->slen < 0 || b->mlen <= 0) return BSTR_ERR;
744
+
745
+ for (i = b->slen - 1; i >= 0; i--) {
746
+ if (!wspace (b->data[i])) {
747
+ if (b->mlen > i) b->data[i+1] = (unsigned char) '\0';
748
+ b->slen = i + 1;
749
+ return BSTR_OK;
750
+ }
751
+ }
752
+
753
+ b->data[0] = (unsigned char) '\0';
754
+ b->slen = 0;
755
+ return BSTR_OK;
756
+ }
757
+
758
+ /*
759
+ * int btrimws (bstring b)
760
+ *
761
+ * Delete whitespace contiguous from both ends of the string.
762
+ */
763
+ int btrimws (bstring b) {
764
+ int i, j;
765
+
766
+ if (b == NULL || b->data == NULL || b->mlen < b->slen ||
767
+ b->slen < 0 || b->mlen <= 0) return BSTR_ERR;
768
+
769
+ for (i = b->slen - 1; i >= 0; i--) {
770
+ if (!wspace (b->data[i])) {
771
+ if (b->mlen > i) b->data[i+1] = (unsigned char) '\0';
772
+ b->slen = i + 1;
773
+ for (j = 0; wspace (b->data[j]); j++) {}
774
+ return bdelete (b, 0, j);
775
+ }
776
+ }
777
+
778
+ b->data[0] = (unsigned char) '\0';
779
+ b->slen = 0;
780
+ return BSTR_OK;
781
+ }
782
+
783
+ /* int biseq (const_bstring b0, const_bstring b1)
784
+ *
785
+ * Compare the string b0 and b1. If the strings differ, 0 is returned, if
786
+ * the strings are the same, 1 is returned, if there is an error, -1 is
787
+ * returned. If the length of the strings are different, this function is
788
+ * O(1). '\0' termination characters are not treated in any special way.
789
+ */
790
+ int biseq (const_bstring b0, const_bstring b1) {
791
+ if (b0 == NULL || b1 == NULL || b0->data == NULL || b1->data == NULL ||
792
+ b0->slen < 0 || b1->slen < 0) return BSTR_ERR;
793
+ if (b0->slen != b1->slen) return BSTR_OK;
794
+ if (b0->data == b1->data || b0->slen == 0) return 1;
795
+ return !bstr__memcmp (b0->data, b1->data, b0->slen);
796
+ }
797
+
798
+ /* int bisstemeqblk (const_bstring b0, const void * blk, int len)
799
+ *
800
+ * Compare beginning of string b0 with a block of memory of length len for
801
+ * equality. If the beginning of b0 differs from the memory block (or if b0
802
+ * is too short), 0 is returned, if the strings are the same, 1 is returned,
803
+ * if there is an error, -1 is returned. '\0' characters are not treated in
804
+ * any special way.
805
+ */
806
+ int bisstemeqblk (const_bstring b0, const void * blk, int len) {
807
+ int i;
808
+
809
+ if (bdata (b0) == NULL || b0->slen < 0 || NULL == blk || len < 0)
810
+ return BSTR_ERR;
811
+ if (b0->slen < len) return BSTR_OK;
812
+ if (b0->data == (const unsigned char *) blk || len == 0) return 1;
813
+
814
+ for (i = 0; i < len; i ++) {
815
+ if (b0->data[i] != ((const unsigned char *) blk)[i]) return BSTR_OK;
816
+ }
817
+ return 1;
818
+ }
819
+
820
+ /* int biseqcstr (const_bstring b, const char *s)
821
+ *
822
+ * Compare the bstring b and char * string s. The C string s must be '\0'
823
+ * terminated at exactly the length of the bstring b, and the contents
824
+ * between the two must be identical with the bstring b with no '\0'
825
+ * characters for the two contents to be considered equal. This is
826
+ * equivalent to the condition that their current contents will be always be
827
+ * equal when comparing them in the same format after converting one or the
828
+ * other. If the strings are equal 1 is returned, if they are unequal 0 is
829
+ * returned and if there is a detectable error BSTR_ERR is returned.
830
+ */
831
+ int biseqcstr (const_bstring b, const char * s) {
832
+ int i;
833
+ if (b == NULL || s == NULL || b->data == NULL || b->slen < 0) return BSTR_ERR;
834
+ for (i=0; i < b->slen; i++) {
835
+ if (s[i] == '\0' || b->data[i] != (unsigned char) s[i]) return BSTR_OK;
836
+ }
837
+ return s[i] == '\0';
838
+ }
839
+
840
+ /* int biseqcstrcaseless (const_bstring b, const char *s)
841
+ *
842
+ * Compare the bstring b and char * string s. The C string s must be '\0'
843
+ * terminated at exactly the length of the bstring b, and the contents
844
+ * between the two must be identical except for case with the bstring b with
845
+ * no '\0' characters for the two contents to be considered equal. This is
846
+ * equivalent to the condition that their current contents will be always be
847
+ * equal ignoring case when comparing them in the same format after
848
+ * converting one or the other. If the strings are equal, except for case,
849
+ * 1 is returned, if they are unequal regardless of case 0 is returned and
850
+ * if there is a detectable error BSTR_ERR is returned.
851
+ */
852
+ int biseqcstrcaseless (const_bstring b, const char * s) {
853
+ int i;
854
+ if (b == NULL || s == NULL || b->data == NULL || b->slen < 0) return BSTR_ERR;
855
+ for (i=0; i < b->slen; i++) {
856
+ if (s[i] == '\0' ||
857
+ (b->data[i] != (unsigned char) s[i] &&
858
+ downcase (b->data[i]) != (unsigned char) downcase (s[i])))
859
+ return BSTR_OK;
860
+ }
861
+ return s[i] == '\0';
862
+ }
863
+
864
+ /* int bstrcmp (const_bstring b0, const_bstring b1)
865
+ *
866
+ * Compare the string b0 and b1. If there is an error, SHRT_MIN is returned,
867
+ * otherwise a value less than or greater than zero, indicating that the
868
+ * string pointed to by b0 is lexicographically less than or greater than
869
+ * the string pointed to by b1 is returned. If the the string lengths are
870
+ * unequal but the characters up until the length of the shorter are equal
871
+ * then a value less than, or greater than zero, indicating that the string
872
+ * pointed to by b0 is shorter or longer than the string pointed to by b1 is
873
+ * returned. 0 is returned if and only if the two strings are the same. If
874
+ * the length of the strings are different, this function is O(n). Like its
875
+ * standard C library counter part strcmp, the comparison does not proceed
876
+ * past any '\0' termination characters encountered.
877
+ */
878
+ int bstrcmp (const_bstring b0, const_bstring b1) {
879
+ int i, v, n;
880
+
881
+ if (b0 == NULL || b1 == NULL || b0->data == NULL || b1->data == NULL ||
882
+ b0->slen < 0 || b1->slen < 0) return SHRT_MIN;
883
+ n = b0->slen; if (n > b1->slen) n = b1->slen;
884
+ if (b0->slen == b1->slen && (b0->data == b1->data || b0->slen == 0))
885
+ return BSTR_OK;
886
+
887
+ for (i = 0; i < n; i ++) {
888
+ v = ((char) b0->data[i]) - ((char) b1->data[i]);
889
+ if (v != 0) return v;
890
+ if (b0->data[i] == (unsigned char) '\0') return BSTR_OK;
891
+ }
892
+
893
+ if (b0->slen > n) return 1;
894
+ if (b1->slen > n) return -1;
895
+ return BSTR_OK;
896
+ }
897
+
898
+ /* int bstrncmp (const_bstring b0, const_bstring b1, int n)
899
+ *
900
+ * Compare the string b0 and b1 for at most n characters. If there is an
901
+ * error, SHRT_MIN is returned, otherwise a value is returned as if b0 and
902
+ * b1 were first truncated to at most n characters then bstrcmp was called
903
+ * with these new strings are paremeters. If the length of the strings are
904
+ * different, this function is O(n). Like its standard C library counter
905
+ * part strcmp, the comparison does not proceed past any '\0' termination
906
+ * characters encountered.
907
+ */
908
+ int bstrncmp (const_bstring b0, const_bstring b1, int n) {
909
+ int i, v, m;
910
+
911
+ if (b0 == NULL || b1 == NULL || b0->data == NULL || b1->data == NULL ||
912
+ b0->slen < 0 || b1->slen < 0) return SHRT_MIN;
913
+ m = n;
914
+ if (m > b0->slen) m = b0->slen;
915
+ if (m > b1->slen) m = b1->slen;
916
+
917
+ if (b0->data != b1->data) {
918
+ for (i = 0; i < m; i ++) {
919
+ v = ((char) b0->data[i]) - ((char) b1->data[i]);
920
+ if (v != 0) return v;
921
+ if (b0->data[i] == (unsigned char) '\0') return BSTR_OK;
922
+ }
923
+ }
924
+
925
+ if (n == m || b0->slen == b1->slen) return BSTR_OK;
926
+
927
+ if (b0->slen > m) return 1;
928
+ return -1;
929
+ }
930
+
931
+ /* bstring bmidstr (const_bstring b, int left, int len)
932
+ *
933
+ * Create a bstring which is the substring of b starting from position left
934
+ * and running for a length len (clamped by the end of the bstring b.) If
935
+ * b is detectably invalid, then NULL is returned. The section described
936
+ * by (left, len) is clamped to the boundaries of b.
937
+ */
938
+ bstring bmidstr (const_bstring b, int left, int len) {
939
+
940
+ if (b == NULL || b->slen < 0 || b->data == NULL) return NULL;
941
+
942
+ if (left < 0) {
943
+ len += left;
944
+ left = 0;
945
+ }
946
+
947
+ if (len > b->slen - left) len = b->slen - left;
948
+
949
+ if (len <= 0) return bfromcstr ("");
950
+ return blk2bstr (b->data + left, len);
951
+ }
952
+
953
+ /* int bdelete (bstring b, int pos, int len)
954
+ *
955
+ * Removes characters from pos to pos+len-1 inclusive and shifts the tail of
956
+ * the bstring starting from pos+len to pos. len must be positive for this
957
+ * call to have any effect. The section of the string described by (pos,
958
+ * len) is clamped to boundaries of the bstring b.
959
+ */
960
+ int bdelete (bstring b, int pos, int len) {
961
+ /* Clamp to left side of bstring */
962
+ if (pos < 0) {
963
+ len += pos;
964
+ pos = 0;
965
+ }
966
+
967
+ if (len < 0 || b == NULL || b->data == NULL || b->slen < 0 ||
968
+ b->mlen < b->slen || b->mlen <= 0)
969
+ return BSTR_ERR;
970
+ if (len > 0 && pos < b->slen) {
971
+ if (pos + len >= b->slen) {
972
+ b->slen = pos;
973
+ } else {
974
+ bBlockCopy ((char *) (b->data + pos),
975
+ (char *) (b->data + pos + len),
976
+ b->slen - (pos+len));
977
+ b->slen -= len;
978
+ }
979
+ b->data[b->slen] = (unsigned char) '\0';
980
+ }
981
+ return BSTR_OK;
982
+ }
983
+
984
+ /* int bdestroy (bstring b)
985
+ *
986
+ * Free up the bstring. Note that if b is detectably invalid or not writable
987
+ * then no action is performed and BSTR_ERR is returned. Like a freed memory
988
+ * allocation, dereferences, writes or any other action on b after it has
989
+ * been bdestroyed is undefined.
990
+ */
991
+ int bdestroy (bstring b) {
992
+ if (b == NULL || b->slen < 0 || b->mlen <= 0 || b->mlen < b->slen ||
993
+ b->data == NULL)
994
+ return BSTR_ERR;
995
+
996
+ bstr__free (b->data);
997
+
998
+ /* In case there is any stale usage, there is one more chance to
999
+ notice this error. */
1000
+
1001
+ b->slen = -1;
1002
+ b->mlen = -__LINE__;
1003
+ b->data = NULL;
1004
+
1005
+ bstr__free (b);
1006
+ return BSTR_OK;
1007
+ }
1008
+
1009
+ /* int binstr (const_bstring b1, int pos, const_bstring b2)
1010
+ *
1011
+ * Search for the bstring b2 in b1 starting from position pos, and searching
1012
+ * forward. If it is found then return with the first position where it is
1013
+ * found, otherwise return BSTR_ERR. Note that this is just a brute force
1014
+ * string searcher that does not attempt clever things like the Boyer-Moore
1015
+ * search algorithm. Because of this there are many degenerate cases where
1016
+ * this can take much longer than it needs to.
1017
+ */
1018
+ int binstr (const_bstring b1, int pos, const_bstring b2) {
1019
+ int j, ii, ll, lf;
1020
+ unsigned char * d0;
1021
+ unsigned char c0;
1022
+ register unsigned char * d1;
1023
+ register unsigned char c1;
1024
+ register int i;
1025
+
1026
+ if (b1 == NULL || b1->data == NULL || b1->slen < 0 ||
1027
+ b2 == NULL || b2->data == NULL || b2->slen < 0) return BSTR_ERR;
1028
+ if (b1->slen == pos) return (b2->slen == 0)?pos:BSTR_ERR;
1029
+ if (b1->slen < pos || pos < 0) return BSTR_ERR;
1030
+ if (b2->slen == 0) return pos;
1031
+
1032
+ /* No space to find such a string? */
1033
+ if ((lf = b1->slen - b2->slen + 1) <= pos) return BSTR_ERR;
1034
+
1035
+ /* An obvious alias case */
1036
+ if (b1->data == b2->data && pos == 0) return 0;
1037
+
1038
+ i = pos;
1039
+
1040
+ d0 = b2->data;
1041
+ d1 = b1->data;
1042
+ ll = b2->slen;
1043
+
1044
+ /* Peel off the b2->slen == 1 case */
1045
+ c0 = d0[0];
1046
+ if (1 == ll) {
1047
+ for (;i < lf; i++) if (c0 == d1[i]) return i;
1048
+ return BSTR_ERR;
1049
+ }
1050
+
1051
+ c1 = c0;
1052
+ j = 0;
1053
+ lf = b1->slen - 1;
1054
+
1055
+ ii = -1;
1056
+ if (i < lf) do {
1057
+ /* Unrolled current character test */
1058
+ if (c1 != d1[i]) {
1059
+ if (c1 != d1[1+i]) {
1060
+ i += 2;
1061
+ continue;
1062
+ }
1063
+ i++;
1064
+ }
1065
+
1066
+ /* Take note if this is the start of a potential match */
1067
+ if (0 == j) ii = i;
1068
+
1069
+ /* Shift the test character down by one */
1070
+ j++;
1071
+ i++;
1072
+
1073
+ /* If this isn't past the last character continue */
1074
+ if (j < ll) {
1075
+ c1 = d0[j];
1076
+ continue;
1077
+ }
1078
+
1079
+ N0:;
1080
+
1081
+ /* If no characters mismatched, then we matched */
1082
+ if (i == ii+j) return ii;
1083
+
1084
+ /* Shift back to the beginning */
1085
+ i -= j;
1086
+ j = 0;
1087
+ c1 = c0;
1088
+ } while (i < lf);
1089
+
1090
+ /* Deal with last case if unrolling caused a misalignment */
1091
+ if (i == lf && ll == j+1 && c1 == d1[i]) goto N0;
1092
+
1093
+ return BSTR_ERR;
1094
+ }
1095
+
1096
+ /* int binstrr (const_bstring b1, int pos, const_bstring b2)
1097
+ *
1098
+ * Search for the bstring b2 in b1 starting from position pos, and searching
1099
+ * backward. If it is found then return with the first position where it is
1100
+ * found, otherwise return BSTR_ERR. Note that this is just a brute force
1101
+ * string searcher that does not attempt clever things like the Boyer-Moore
1102
+ * search algorithm. Because of this there are many degenerate cases where
1103
+ * this can take much longer than it needs to.
1104
+ */
1105
+ int binstrr (const_bstring b1, int pos, const_bstring b2) {
1106
+ int j, i, l;
1107
+ unsigned char * d0, * d1;
1108
+
1109
+ if (b1 == NULL || b1->data == NULL || b1->slen < 0 ||
1110
+ b2 == NULL || b2->data == NULL || b2->slen < 0) return BSTR_ERR;
1111
+ if (b1->slen == pos && b2->slen == 0) return pos;
1112
+ if (b1->slen < pos || pos < 0) return BSTR_ERR;
1113
+ if (b2->slen == 0) return pos;
1114
+
1115
+ /* Obvious alias case */
1116
+ if (b1->data == b2->data && pos == 0 && b2->slen <= b1->slen) return 0;
1117
+
1118
+ i = pos;
1119
+ if ((l = b1->slen - b2->slen) < 0) return BSTR_ERR;
1120
+
1121
+ /* If no space to find such a string then snap back */
1122
+ if (l + 1 <= i) i = l;
1123
+ j = 0;
1124
+
1125
+ d0 = b2->data;
1126
+ d1 = b1->data;
1127
+ l = b2->slen;
1128
+
1129
+ for (;;) {
1130
+ if (d0[j] == d1[i + j]) {
1131
+ j ++;
1132
+ if (j >= l) return i;
1133
+ } else {
1134
+ i --;
1135
+ if (i < 0) break;
1136
+ j=0;
1137
+ }
1138
+ }
1139
+
1140
+ return BSTR_ERR;
1141
+ }
1142
+
1143
+ /* int binstrcaseless (const_bstring b1, int pos, const_bstring b2)
1144
+ *
1145
+ * Search for the bstring b2 in b1 starting from position pos, and searching
1146
+ * forward but without regard to case. If it is found then return with the
1147
+ * first position where it is found, otherwise return BSTR_ERR. Note that
1148
+ * this is just a brute force string searcher that does not attempt clever
1149
+ * things like the Boyer-Moore search algorithm. Because of this there are
1150
+ * many degenerate cases where this can take much longer than it needs to.
1151
+ */
1152
+ int binstrcaseless (const_bstring b1, int pos, const_bstring b2) {
1153
+ int j, i, l, ll;
1154
+ unsigned char * d0, * d1;
1155
+
1156
+ if (b1 == NULL || b1->data == NULL || b1->slen < 0 ||
1157
+ b2 == NULL || b2->data == NULL || b2->slen < 0) return BSTR_ERR;
1158
+ if (b1->slen == pos) return (b2->slen == 0)?pos:BSTR_ERR;
1159
+ if (b1->slen < pos || pos < 0) return BSTR_ERR;
1160
+ if (b2->slen == 0) return pos;
1161
+
1162
+ l = b1->slen - b2->slen + 1;
1163
+
1164
+ /* No space to find such a string? */
1165
+ if (l <= pos) return BSTR_ERR;
1166
+
1167
+ /* An obvious alias case */
1168
+ if (b1->data == b2->data && pos == 0) return BSTR_OK;
1169
+
1170
+ i = pos;
1171
+ j = 0;
1172
+
1173
+ d0 = b2->data;
1174
+ d1 = b1->data;
1175
+ ll = b2->slen;
1176
+
1177
+ for (;;) {
1178
+ if (d0[j] == d1[i + j] || downcase (d0[j]) == downcase (d1[i + j])) {
1179
+ j ++;
1180
+ if (j >= ll) return i;
1181
+ } else {
1182
+ i ++;
1183
+ if (i >= l) break;
1184
+ j=0;
1185
+ }
1186
+ }
1187
+
1188
+ return BSTR_ERR;
1189
+ }
1190
+
1191
+ /* int binstrrcaseless (const_bstring b1, int pos, const_bstring b2)
1192
+ *
1193
+ * Search for the bstring b2 in b1 starting from position pos, and searching
1194
+ * backward but without regard to case. If it is found then return with the
1195
+ * first position where it is found, otherwise return BSTR_ERR. Note that
1196
+ * this is just a brute force string searcher that does not attempt clever
1197
+ * things like the Boyer-Moore search algorithm. Because of this there are
1198
+ * many degenerate cases where this can take much longer than it needs to.
1199
+ */
1200
+ int binstrrcaseless (const_bstring b1, int pos, const_bstring b2) {
1201
+ int j, i, l;
1202
+ unsigned char * d0, * d1;
1203
+
1204
+ if (b1 == NULL || b1->data == NULL || b1->slen < 0 ||
1205
+ b2 == NULL || b2->data == NULL || b2->slen < 0) return BSTR_ERR;
1206
+ if (b1->slen == pos && b2->slen == 0) return pos;
1207
+ if (b1->slen < pos || pos < 0) return BSTR_ERR;
1208
+ if (b2->slen == 0) return pos;
1209
+
1210
+ /* Obvious alias case */
1211
+ if (b1->data == b2->data && pos == 0 && b2->slen <= b1->slen) return BSTR_OK;
1212
+
1213
+ i = pos;
1214
+ if ((l = b1->slen - b2->slen) < 0) return BSTR_ERR;
1215
+
1216
+ /* If no space to find such a string then snap back */
1217
+ if (l + 1 <= i) i = l;
1218
+ j = 0;
1219
+
1220
+ d0 = b2->data;
1221
+ d1 = b1->data;
1222
+ l = b2->slen;
1223
+
1224
+ for (;;) {
1225
+ if (d0[j] == d1[i + j] || downcase (d0[j]) == downcase (d1[i + j])) {
1226
+ j ++;
1227
+ if (j >= l) return i;
1228
+ } else {
1229
+ i --;
1230
+ if (i < 0) break;
1231
+ j=0;
1232
+ }
1233
+ }
1234
+
1235
+ return BSTR_ERR;
1236
+ }
1237
+
1238
+
1239
+ /* int bstrchrp (const_bstring b, int c, int pos)
1240
+ *
1241
+ * Search for the character c in b forwards from the position pos
1242
+ * (inclusive).
1243
+ */
1244
+ int bstrchrp (const_bstring b, int c, int pos) {
1245
+ unsigned char * p;
1246
+
1247
+ if (b == NULL || b->data == NULL || b->slen <= pos || pos < 0) return BSTR_ERR;
1248
+ p = (unsigned char *) bstr__memchr ((b->data + pos), (unsigned char) c, (b->slen - pos));
1249
+ if (p) return (int) (p - b->data);
1250
+ return BSTR_ERR;
1251
+ }
1252
+
1253
+ /* int bstrrchrp (const_bstring b, int c, int pos)
1254
+ *
1255
+ * Search for the character c in b backwards from the position pos in string
1256
+ * (inclusive).
1257
+ */
1258
+ int bstrrchrp (const_bstring b, int c, int pos) {
1259
+ int i;
1260
+
1261
+ if (b == NULL || b->data == NULL || b->slen <= pos || pos < 0) return BSTR_ERR;
1262
+ for (i=pos; i >= 0; i--) {
1263
+ if (b->data[i] == (unsigned char) c) return i;
1264
+ }
1265
+ return BSTR_ERR;
1266
+ }
1267
+
1268
+ #if !defined (BSTRLIB_AGGRESSIVE_MEMORY_FOR_SPEED_TRADEOFF)
1269
+ #define LONG_LOG_BITS_QTY (3)
1270
+ #define LONG_BITS_QTY (1 << LONG_LOG_BITS_QTY)
1271
+ #define LONG_TYPE unsigned char
1272
+
1273
+ #define CFCLEN ((1 << CHAR_BIT) / LONG_BITS_QTY)
1274
+ struct charField { LONG_TYPE content[CFCLEN]; };
1275
+ #define testInCharField(cf,c) ((cf)->content[(c) >> LONG_LOG_BITS_QTY] & (((long)1) << ((c) & (LONG_BITS_QTY-1))))
1276
+ #define setInCharField(cf,idx) { \
1277
+ unsigned int c = (unsigned int) (idx); \
1278
+ (cf)->content[c >> LONG_LOG_BITS_QTY] |= (LONG_TYPE) (1ul << (c & (LONG_BITS_QTY-1))); \
1279
+ }
1280
+
1281
+ #else
1282
+
1283
+ #define CFCLEN (1 << CHAR_BIT)
1284
+ struct charField { unsigned char content[CFCLEN]; };
1285
+ #define testInCharField(cf,c) ((cf)->content[(unsigned char) (c)])
1286
+ #define setInCharField(cf,idx) (cf)->content[(unsigned int) (idx)] = ~0
1287
+
1288
+ #endif
1289
+
1290
+ /* Convert a bstring to charField */
1291
+ static int buildCharField (struct charField * cf, const_bstring b) {
1292
+ int i;
1293
+ if (b == NULL || b->data == NULL || b->slen <= 0) return BSTR_ERR;
1294
+ memset ((void *) cf->content, 0, sizeof (struct charField));
1295
+ for (i=0; i < b->slen; i++) {
1296
+ setInCharField (cf, b->data[i]);
1297
+ }
1298
+ return BSTR_OK;
1299
+ }
1300
+
1301
+ static void invertCharField (struct charField * cf) {
1302
+ int i;
1303
+ for (i=0; i < CFCLEN; i++) cf->content[i] = ~cf->content[i];
1304
+ }
1305
+
1306
+ /* Inner engine for binchr */
1307
+ static int binchrCF (const unsigned char * data, int len, int pos, const struct charField * cf) {
1308
+ int i;
1309
+ for (i=pos; i < len; i++) {
1310
+ unsigned char c = (unsigned char) data[i];
1311
+ if (testInCharField (cf, c)) return i;
1312
+ }
1313
+ return BSTR_ERR;
1314
+ }
1315
+
1316
+ /* int binchr (const_bstring b0, int pos, const_bstring b1);
1317
+ *
1318
+ * Search for the first position in b0 starting from pos or after, in which
1319
+ * one of the characters in b1 is found and return it. If such a position
1320
+ * does not exist in b0, then BSTR_ERR is returned.
1321
+ */
1322
+ int binchr (const_bstring b0, int pos, const_bstring b1) {
1323
+ struct charField chrs;
1324
+ if (pos < 0 || b0 == NULL || b0->data == NULL ||
1325
+ b0->slen <= pos) return BSTR_ERR;
1326
+ if (1 == b1->slen) return bstrchrp (b0, b1->data[0], pos);
1327
+ if (0 > buildCharField (&chrs, b1)) return BSTR_ERR;
1328
+ return binchrCF (b0->data, b0->slen, pos, &chrs);
1329
+ }
1330
+
1331
+ /* Inner engine for binchrr */
1332
+ static int binchrrCF (const unsigned char * data, int pos, const struct charField * cf) {
1333
+ int i;
1334
+ for (i=pos; i >= 0; i--) {
1335
+ unsigned int c = (unsigned int) data[i];
1336
+ if (testInCharField (cf, c)) return i;
1337
+ }
1338
+ return BSTR_ERR;
1339
+ }
1340
+
1341
+ /* int binchrr (const_bstring b0, int pos, const_bstring b1);
1342
+ *
1343
+ * Search for the last position in b0 no greater than pos, in which one of
1344
+ * the characters in b1 is found and return it. If such a position does not
1345
+ * exist in b0, then BSTR_ERR is returned.
1346
+ */
1347
+ int binchrr (const_bstring b0, int pos, const_bstring b1) {
1348
+ struct charField chrs;
1349
+ if (pos < 0 || b0 == NULL || b0->data == NULL || b1 == NULL ||
1350
+ b0->slen < pos) return BSTR_ERR;
1351
+ if (pos == b0->slen) pos--;
1352
+ if (1 == b1->slen) return bstrrchrp (b0, b1->data[0], pos);
1353
+ if (0 > buildCharField (&chrs, b1)) return BSTR_ERR;
1354
+ return binchrrCF (b0->data, pos, &chrs);
1355
+ }
1356
+
1357
+ /* int bninchr (const_bstring b0, int pos, const_bstring b1);
1358
+ *
1359
+ * Search for the first position in b0 starting from pos or after, in which
1360
+ * none of the characters in b1 is found and return it. If such a position
1361
+ * does not exist in b0, then BSTR_ERR is returned.
1362
+ */
1363
+ int bninchr (const_bstring b0, int pos, const_bstring b1) {
1364
+ struct charField chrs;
1365
+ if (pos < 0 || b0 == NULL || b0->data == NULL ||
1366
+ b0->slen <= pos) return BSTR_ERR;
1367
+ if (buildCharField (&chrs, b1) < 0) return BSTR_ERR;
1368
+ invertCharField (&chrs);
1369
+ return binchrCF (b0->data, b0->slen, pos, &chrs);
1370
+ }
1371
+
1372
+ /* int bninchrr (const_bstring b0, int pos, const_bstring b1);
1373
+ *
1374
+ * Search for the last position in b0 no greater than pos, in which none of
1375
+ * the characters in b1 is found and return it. If such a position does not
1376
+ * exist in b0, then BSTR_ERR is returned.
1377
+ */
1378
+ int bninchrr (const_bstring b0, int pos, const_bstring b1) {
1379
+ struct charField chrs;
1380
+ if (pos < 0 || b0 == NULL || b0->data == NULL ||
1381
+ b0->slen < pos) return BSTR_ERR;
1382
+ if (pos == b0->slen) pos--;
1383
+ if (buildCharField (&chrs, b1) < 0) return BSTR_ERR;
1384
+ invertCharField (&chrs);
1385
+ return binchrrCF (b0->data, pos, &chrs);
1386
+ }
1387
+
1388
+ /* int bsetstr (bstring b0, int pos, bstring b1, unsigned char fill)
1389
+ *
1390
+ * Overwrite the string b0 starting at position pos with the string b1. If
1391
+ * the position pos is past the end of b0, then the character "fill" is
1392
+ * appended as necessary to make up the gap between the end of b0 and pos.
1393
+ * If b1 is NULL, it behaves as if it were a 0-length string.
1394
+ */
1395
+ int bsetstr (bstring b0, int pos, const_bstring b1, unsigned char fill) {
1396
+ int d, newlen;
1397
+ ptrdiff_t pd;
1398
+ bstring aux = (bstring) b1;
1399
+
1400
+ if (pos < 0 || b0 == NULL || b0->slen < 0 || NULL == b0->data ||
1401
+ b0->mlen < b0->slen || b0->mlen <= 0) return BSTR_ERR;
1402
+ if (b1 != NULL && (b1->slen < 0 || b1->data == NULL)) return BSTR_ERR;
1403
+
1404
+ d = pos;
1405
+
1406
+ /* Aliasing case */
1407
+ if (NULL != aux) {
1408
+ if ((pd = (ptrdiff_t) (b1->data - b0->data)) >= 0 && pd < (ptrdiff_t) b0->mlen) {
1409
+ if (NULL == (aux = bstrcpy (b1))) return BSTR_ERR;
1410
+ }
1411
+ d += aux->slen;
1412
+ }
1413
+
1414
+ /* Increase memory size if necessary */
1415
+ if (balloc (b0, d + 1) != BSTR_OK) {
1416
+ if (aux != b1) bdestroy (aux);
1417
+ return BSTR_ERR;
1418
+ }
1419
+
1420
+ newlen = b0->slen;
1421
+
1422
+ /* Fill in "fill" character as necessary */
1423
+ if (pos > newlen) {
1424
+ bstr__memset (b0->data + b0->slen, (int) fill, (size_t) (pos - b0->slen));
1425
+ newlen = pos;
1426
+ }
1427
+
1428
+ /* Copy b1 to position pos in b0. */
1429
+ if (aux != NULL) {
1430
+ bBlockCopy ((char *) (b0->data + pos), (char *) aux->data, aux->slen);
1431
+ if (aux != b1) bdestroy (aux);
1432
+ }
1433
+
1434
+ /* Indicate the potentially increased size of b0 */
1435
+ if (d > newlen) newlen = d;
1436
+
1437
+ b0->slen = newlen;
1438
+ b0->data[newlen] = (unsigned char) '\0';
1439
+
1440
+ return BSTR_OK;
1441
+ }
1442
+
1443
+ /* int binsert (bstring b1, int pos, bstring b2, unsigned char fill)
1444
+ *
1445
+ * Inserts the string b2 into b1 at position pos. If the position pos is
1446
+ * past the end of b1, then the character "fill" is appended as necessary to
1447
+ * make up the gap between the end of b1 and pos. Unlike bsetstr, binsert
1448
+ * does not allow b2 to be NULL.
1449
+ */
1450
+ int binsert (bstring b1, int pos, const_bstring b2, unsigned char fill) {
1451
+ int d, l;
1452
+ ptrdiff_t pd;
1453
+ bstring aux = (bstring) b2;
1454
+
1455
+ if (pos < 0 || b1 == NULL || b2 == NULL || b1->slen < 0 ||
1456
+ b2->slen < 0 || b1->mlen < b1->slen || b1->mlen <= 0) return BSTR_ERR;
1457
+
1458
+ /* Aliasing case */
1459
+ if ((pd = (ptrdiff_t) (b2->data - b1->data)) >= 0 && pd < (ptrdiff_t) b1->mlen) {
1460
+ if (NULL == (aux = bstrcpy (b2))) return BSTR_ERR;
1461
+ }
1462
+
1463
+ /* Compute the two possible end pointers */
1464
+ d = b1->slen + aux->slen;
1465
+ l = pos + aux->slen;
1466
+ if ((d|l) < 0) return BSTR_ERR;
1467
+
1468
+ if (l > d) {
1469
+ /* Inserting past the end of the string */
1470
+ if (balloc (b1, l + 1) != BSTR_OK) {
1471
+ if (aux != b2) bdestroy (aux);
1472
+ return BSTR_ERR;
1473
+ }
1474
+ bstr__memset (b1->data + b1->slen, (int) fill, (size_t) (pos - b1->slen));
1475
+ b1->slen = l;
1476
+ } else {
1477
+ /* Inserting in the middle of the string */
1478
+ if (balloc (b1, d + 1) != BSTR_OK) {
1479
+ if (aux != b2) bdestroy (aux);
1480
+ return BSTR_ERR;
1481
+ }
1482
+ bBlockCopy (b1->data + l, b1->data + pos, d - l);
1483
+ b1->slen = d;
1484
+ }
1485
+ bBlockCopy (b1->data + pos, aux->data, aux->slen);
1486
+ b1->data[b1->slen] = (unsigned char) '\0';
1487
+ if (aux != b2) bdestroy (aux);
1488
+ return BSTR_OK;
1489
+ }
1490
+
1491
+ /* int breplace (bstring b1, int pos, int len, bstring b2,
1492
+ * unsigned char fill)
1493
+ *
1494
+ * Replace a section of a string from pos for a length len with the string b2.
1495
+ * fill is used is pos > b1->slen.
1496
+ */
1497
+ int breplace (bstring b1, int pos, int len, const_bstring b2,
1498
+ unsigned char fill) {
1499
+ int pl, ret;
1500
+ ptrdiff_t pd;
1501
+ bstring aux = (bstring) b2;
1502
+
1503
+ if (pos < 0 || len < 0 || (pl = pos + len) < 0 || b1 == NULL ||
1504
+ b2 == NULL || b1->data == NULL || b2->data == NULL ||
1505
+ b1->slen < 0 || b2->slen < 0 || b1->mlen < b1->slen ||
1506
+ b1->mlen <= 0) return BSTR_ERR;
1507
+
1508
+ /* Straddles the end? */
1509
+ if (pl >= b1->slen) {
1510
+ if ((ret = bsetstr (b1, pos, b2, fill)) < 0) return ret;
1511
+ if (pos + b2->slen < b1->slen) {
1512
+ b1->slen = pos + b2->slen;
1513
+ b1->data[b1->slen] = (unsigned char) '\0';
1514
+ }
1515
+ return ret;
1516
+ }
1517
+
1518
+ /* Aliasing case */
1519
+ if ((pd = (ptrdiff_t) (b2->data - b1->data)) >= 0 && pd < (ptrdiff_t) b1->slen) {
1520
+ if (NULL == (aux = bstrcpy (b2))) return BSTR_ERR;
1521
+ }
1522
+
1523
+ if (aux->slen > len) {
1524
+ if (balloc (b1, b1->slen + aux->slen - len) != BSTR_OK) {
1525
+ if (aux != b2) bdestroy (aux);
1526
+ return BSTR_ERR;
1527
+ }
1528
+ }
1529
+
1530
+ if (aux->slen != len) bstr__memmove (b1->data + pos + aux->slen, b1->data + pos + len, b1->slen - (pos + len));
1531
+ bstr__memcpy (b1->data + pos, aux->data, aux->slen);
1532
+ b1->slen += aux->slen - len;
1533
+ b1->data[b1->slen] = (unsigned char) '\0';
1534
+ if (aux != b2) bdestroy (aux);
1535
+ return BSTR_OK;
1536
+ }
1537
+
1538
+ /* int bfindreplace (bstring b, const_bstring find, const_bstring repl,
1539
+ * int pos)
1540
+ *
1541
+ * Replace all occurrences of a find string with a replace string after a
1542
+ * given point in a bstring.
1543
+ */
1544
+
1545
+ typedef int (*instr_fnptr) (const_bstring s1, int pos, const_bstring s2);
1546
+
1547
+ static int findreplaceengine (bstring b, const_bstring find, const_bstring repl, int pos, instr_fnptr instr) {
1548
+ int i, ret, slen, mlen, delta, acc;
1549
+ int * d;
1550
+ int static_d[32];
1551
+ ptrdiff_t pd;
1552
+ bstring auxf = (bstring) find;
1553
+ bstring auxr = (bstring) repl;
1554
+
1555
+ if (b == NULL || b->data == NULL || find == NULL ||
1556
+ find->data == NULL || repl == NULL || repl->data == NULL ||
1557
+ pos < 0 || find->slen <= 0 || b->mlen < 0 || b->slen > b->mlen ||
1558
+ b->mlen <= 0 || b->slen < 0 || repl->slen < 0) return BSTR_ERR;
1559
+ if (pos > b->slen - find->slen) return BSTR_OK;
1560
+
1561
+ /* Alias with find string */
1562
+ pd = (ptrdiff_t) (find->data - b->data);
1563
+ if ((ptrdiff_t) (pos - find->slen) < pd && pd < (ptrdiff_t) b->slen) {
1564
+ if (NULL == (auxf = bstrcpy (find))) return BSTR_ERR;
1565
+ }
1566
+
1567
+ /* Alias with repl string */
1568
+ pd = (ptrdiff_t) (repl->data - b->data);
1569
+ if ((ptrdiff_t) (pos - repl->slen) < pd && pd < (ptrdiff_t) b->slen) {
1570
+ if (NULL == (auxr = bstrcpy (repl))) {
1571
+ if (auxf != find) bdestroy (auxf);
1572
+ return BSTR_ERR;
1573
+ }
1574
+ }
1575
+
1576
+ delta = auxf->slen - auxr->slen;
1577
+
1578
+ /* in-place replacement since find and replace strings are of equal
1579
+ length */
1580
+ if (delta == 0) {
1581
+ while ((pos = instr (b, pos, auxf)) >= 0) {
1582
+ bstr__memcpy (b->data + pos, auxr->data, auxr->slen);
1583
+ pos += auxf->slen;
1584
+ }
1585
+ if (auxf != find) bdestroy (auxf);
1586
+ if (auxr != repl) bdestroy (auxr);
1587
+ return BSTR_OK;
1588
+ }
1589
+
1590
+ /* shrinking replacement since auxf->slen > auxr->slen */
1591
+ if (delta > 0) {
1592
+ acc = 0;
1593
+
1594
+ while ((i = instr (b, pos, auxf)) >= 0) {
1595
+ if (acc && i > pos)
1596
+ bstr__memmove (b->data + pos - acc, b->data + pos, i - pos);
1597
+ if (auxr->slen)
1598
+ bstr__memcpy (b->data + i - acc, auxr->data, auxr->slen);
1599
+ acc += delta;
1600
+ pos = i + auxf->slen;
1601
+ }
1602
+
1603
+ if (acc) {
1604
+ i = b->slen;
1605
+ if (i > pos)
1606
+ bstr__memmove (b->data + pos - acc, b->data + pos, i - pos);
1607
+ b->slen -= acc;
1608
+ b->data[b->slen] = (unsigned char) '\0';
1609
+ }
1610
+
1611
+ if (auxf != find) bdestroy (auxf);
1612
+ if (auxr != repl) bdestroy (auxr);
1613
+ return BSTR_OK;
1614
+ }
1615
+
1616
+ /* expanding replacement since find->slen < repl->slen. Its a lot
1617
+ more complicated. */
1618
+
1619
+ mlen = 32;
1620
+ d = (int *) static_d; /* Avoid malloc for trivial cases */
1621
+ acc = slen = 0;
1622
+
1623
+ while ((pos = instr (b, pos, auxf)) >= 0) {
1624
+ if (slen + 1 >= mlen) {
1625
+ int sl;
1626
+ int * t;
1627
+ mlen += mlen;
1628
+ sl = sizeof (int *) * mlen;
1629
+ if (static_d == d) d = NULL;
1630
+ if (sl < mlen || NULL == (t = (int *) bstr__realloc (d, sl))) {
1631
+ ret = BSTR_ERR;
1632
+ goto done;
1633
+ }
1634
+ if (NULL == d) bstr__memcpy (t, static_d, sizeof (static_d));
1635
+ d = t;
1636
+ }
1637
+ d[slen] = pos;
1638
+ slen++;
1639
+ acc -= delta;
1640
+ pos += auxf->slen;
1641
+ if (pos < 0 || acc < 0) {
1642
+ ret = BSTR_ERR;
1643
+ goto done;
1644
+ }
1645
+ }
1646
+ d[slen] = b->slen;
1647
+
1648
+ if (BSTR_OK == (ret = balloc (b, b->slen + acc + 1))) {
1649
+ b->slen += acc;
1650
+ for (i = slen-1; i >= 0; i--) {
1651
+ int s, l;
1652
+ s = d[i] + auxf->slen;
1653
+ l = d[i+1] - s;
1654
+ if (l) {
1655
+ bstr__memmove (b->data + s + acc, b->data + s, l);
1656
+ }
1657
+ if (auxr->slen) {
1658
+ bstr__memmove (b->data + s + acc - auxr->slen,
1659
+ auxr->data, auxr->slen);
1660
+ }
1661
+ acc += delta;
1662
+ }
1663
+ b->data[b->slen] = (unsigned char) '\0';
1664
+ }
1665
+
1666
+ done:;
1667
+ if (static_d == d) d = NULL;
1668
+ bstr__free (d);
1669
+ if (auxf != find) bdestroy (auxf);
1670
+ if (auxr != repl) bdestroy (auxr);
1671
+ return ret;
1672
+ }
1673
+
1674
+ /* int bfindreplace (bstring b, const_bstring find, const_bstring repl,
1675
+ * int pos)
1676
+ *
1677
+ * Replace all occurrences of a find string with a replace string after a
1678
+ * given point in a bstring.
1679
+ */
1680
+ int bfindreplace (bstring b, const_bstring find, const_bstring repl, int pos) {
1681
+ return findreplaceengine (b, find, repl, pos, binstr);
1682
+ }
1683
+
1684
+ /* int bfindreplacecaseless (bstring b, const_bstring find, const_bstring repl,
1685
+ * int pos)
1686
+ *
1687
+ * Replace all occurrences of a find string, ignoring case, with a replace
1688
+ * string after a given point in a bstring.
1689
+ */
1690
+ int bfindreplacecaseless (bstring b, const_bstring find, const_bstring repl, int pos) {
1691
+ return findreplaceengine (b, find, repl, pos, binstrcaseless);
1692
+ }
1693
+
1694
+ /* int binsertch (bstring b, int pos, int len, unsigned char fill)
1695
+ *
1696
+ * Inserts the character fill repeatedly into b at position pos for a
1697
+ * length len. If the position pos is past the end of b, then the
1698
+ * character "fill" is appended as necessary to make up the gap between the
1699
+ * end of b and the position pos + len.
1700
+ */
1701
+ int binsertch (bstring b, int pos, int len, unsigned char fill) {
1702
+ int d, l, i;
1703
+
1704
+ if (pos < 0 || b == NULL || b->slen < 0 || b->mlen < b->slen ||
1705
+ b->mlen <= 0 || len < 0) return BSTR_ERR;
1706
+
1707
+ /* Compute the two possible end pointers */
1708
+ d = b->slen + len;
1709
+ l = pos + len;
1710
+ if ((d|l) < 0) return BSTR_ERR;
1711
+
1712
+ if (l > d) {
1713
+ /* Inserting past the end of the string */
1714
+ if (balloc (b, l + 1) != BSTR_OK) return BSTR_ERR;
1715
+ pos = b->slen;
1716
+ b->slen = l;
1717
+ } else {
1718
+ /* Inserting in the middle of the string */
1719
+ if (balloc (b, d + 1) != BSTR_OK) return BSTR_ERR;
1720
+ for (i = d - 1; i >= l; i--) {
1721
+ b->data[i] = b->data[i - len];
1722
+ }
1723
+ b->slen = d;
1724
+ }
1725
+
1726
+ for (i=pos; i < l; i++) b->data[i] = fill;
1727
+ b->data[b->slen] = (unsigned char) '\0';
1728
+ return BSTR_OK;
1729
+ }
1730
+
1731
+ /* int bpattern (bstring b, int len)
1732
+ *
1733
+ * Replicate the bstring, b in place, end to end repeatedly until it
1734
+ * surpasses len characters, then chop the result to exactly len characters.
1735
+ * This function operates in-place. The function will return with BSTR_ERR
1736
+ * if b is NULL or of length 0, otherwise BSTR_OK is returned.
1737
+ */
1738
+ int bpattern (bstring b, int len) {
1739
+ int i, d;
1740
+
1741
+ d = blength (b);
1742
+ if (d <= 0 || len < 0 || balloc (b, len + 1) != BSTR_OK) return BSTR_ERR;
1743
+ if (len > 0) {
1744
+ if (d == 1) return bsetstr (b, len, NULL, b->data[0]);
1745
+ for (i = d; i < len; i++) b->data[i] = b->data[i - d];
1746
+ }
1747
+ b->data[len] = (unsigned char) '\0';
1748
+ b->slen = len;
1749
+ return BSTR_OK;
1750
+ }
1751
+
1752
+ #define BS_BUFF_SZ (1024)
1753
+
1754
+ /* int breada (bstring b, bNread readPtr, void * parm)
1755
+ *
1756
+ * Use a finite buffer fread-like function readPtr to concatenate to the
1757
+ * bstring b the entire contents of file-like source data in a roughly
1758
+ * efficient way.
1759
+ */
1760
+ int breada (bstring b, bNread readPtr, void * parm) {
1761
+ int i, l, n;
1762
+
1763
+ if (b == NULL || b->mlen <= 0 || b->slen < 0 || b->mlen < b->slen ||
1764
+ b->mlen <= 0 || readPtr == NULL) return BSTR_ERR;
1765
+
1766
+ i = b->slen;
1767
+ for (n=i+16; ; n += ((n < BS_BUFF_SZ) ? n : BS_BUFF_SZ)) {
1768
+ if (BSTR_OK != balloc (b, n + 1)) return BSTR_ERR;
1769
+ l = (int) readPtr ((void *) (b->data + i), 1, n - i, parm);
1770
+ i += l;
1771
+ b->slen = i;
1772
+ if (i < n) break;
1773
+ }
1774
+
1775
+ b->data[i] = (unsigned char) '\0';
1776
+ return BSTR_OK;
1777
+ }
1778
+
1779
+ /* bstring bread (bNread readPtr, void * parm)
1780
+ *
1781
+ * Use a finite buffer fread-like function readPtr to create a bstring
1782
+ * filled with the entire contents of file-like source data in a roughly
1783
+ * efficient way.
1784
+ */
1785
+ bstring bread (bNread readPtr, void * parm) {
1786
+ int ret;
1787
+ bstring buff;
1788
+
1789
+ if (readPtr == NULL) return NULL;
1790
+ buff = bfromcstr ("");
1791
+ if (buff == NULL) return NULL;
1792
+ ret = breada (buff, readPtr, parm);
1793
+ if (ret < 0) {
1794
+ bdestroy (buff);
1795
+ return NULL;
1796
+ }
1797
+ return buff;
1798
+ }
1799
+
1800
+ /* int bassigngets (bstring b, bNgetc getcPtr, void * parm, char terminator)
1801
+ *
1802
+ * Use an fgetc-like single character stream reading function (getcPtr) to
1803
+ * obtain a sequence of characters which are concatenated to the end of the
1804
+ * bstring b. The stream read is terminated by the passed in terminator
1805
+ * parameter.
1806
+ *
1807
+ * If getcPtr returns with a negative number, or the terminator character
1808
+ * (which is appended) is read, then the stream reading is halted and the
1809
+ * function returns with a partial result in b. If there is an empty partial
1810
+ * result, 1 is returned. If no characters are read, or there is some other
1811
+ * detectable error, BSTR_ERR is returned.
1812
+ */
1813
+ int bassigngets (bstring b, bNgetc getcPtr, void * parm, char terminator) {
1814
+ int c, d, e;
1815
+
1816
+ if (b == NULL || b->mlen <= 0 || b->slen < 0 || b->mlen < b->slen ||
1817
+ b->mlen <= 0 || getcPtr == NULL) return BSTR_ERR;
1818
+ d = 0;
1819
+ e = b->mlen - 2;
1820
+
1821
+ while ((c = getcPtr (parm)) >= 0) {
1822
+ if (d > e) {
1823
+ b->slen = d;
1824
+ if (balloc (b, d + 2) != BSTR_OK) return BSTR_ERR;
1825
+ e = b->mlen - 2;
1826
+ }
1827
+ b->data[d] = (unsigned char) c;
1828
+ d++;
1829
+ if (c == terminator) break;
1830
+ }
1831
+
1832
+ b->data[d] = (unsigned char) '\0';
1833
+ b->slen = d;
1834
+
1835
+ return d == 0 && c < 0;
1836
+ }
1837
+
1838
+ /* int bgetsa (bstring b, bNgetc getcPtr, void * parm, char terminator)
1839
+ *
1840
+ * Use an fgetc-like single character stream reading function (getcPtr) to
1841
+ * obtain a sequence of characters which are concatenated to the end of the
1842
+ * bstring b. The stream read is terminated by the passed in terminator
1843
+ * parameter.
1844
+ *
1845
+ * If getcPtr returns with a negative number, or the terminator character
1846
+ * (which is appended) is read, then the stream reading is halted and the
1847
+ * function returns with a partial result concatentated to b. If there is
1848
+ * an empty partial result, 1 is returned. If no characters are read, or
1849
+ * there is some other detectable error, BSTR_ERR is returned.
1850
+ */
1851
+ int bgetsa (bstring b, bNgetc getcPtr, void * parm, char terminator) {
1852
+ int c, d, e;
1853
+
1854
+ if (b == NULL || b->mlen <= 0 || b->slen < 0 || b->mlen < b->slen ||
1855
+ b->mlen <= 0 || getcPtr == NULL) return BSTR_ERR;
1856
+ d = b->slen;
1857
+ e = b->mlen - 2;
1858
+
1859
+ while ((c = getcPtr (parm)) >= 0) {
1860
+ if (d > e) {
1861
+ b->slen = d;
1862
+ if (balloc (b, d + 2) != BSTR_OK) return BSTR_ERR;
1863
+ e = b->mlen - 2;
1864
+ }
1865
+ b->data[d] = (unsigned char) c;
1866
+ d++;
1867
+ if (c == terminator) break;
1868
+ }
1869
+
1870
+ b->data[d] = (unsigned char) '\0';
1871
+ b->slen = d;
1872
+
1873
+ return d == 0 && c < 0;
1874
+ }
1875
+
1876
+ /* bstring bgets (bNgetc getcPtr, void * parm, char terminator)
1877
+ *
1878
+ * Use an fgetc-like single character stream reading function (getcPtr) to
1879
+ * obtain a sequence of characters which are concatenated into a bstring.
1880
+ * The stream read is terminated by the passed in terminator function.
1881
+ *
1882
+ * If getcPtr returns with a negative number, or the terminator character
1883
+ * (which is appended) is read, then the stream reading is halted and the
1884
+ * result obtained thus far is returned. If no characters are read, or
1885
+ * there is some other detectable error, NULL is returned.
1886
+ */
1887
+ bstring bgets (bNgetc getcPtr, void * parm, char terminator) {
1888
+ int ret;
1889
+ bstring buff;
1890
+
1891
+ if (NULL == getcPtr || NULL == (buff = bfromcstr (""))) return NULL;
1892
+
1893
+ ret = bgetsa (buff, getcPtr, parm, terminator);
1894
+ if (ret < 0 || buff->slen <= 0) {
1895
+ bdestroy (buff);
1896
+ buff = NULL;
1897
+ }
1898
+ return buff;
1899
+ }
1900
+
1901
+ struct bStream {
1902
+ bstring buff; /* Buffer for over-reads */
1903
+ void * parm; /* The stream handle for core stream */
1904
+ bNread readFnPtr; /* fread compatible fnptr for core stream */
1905
+ int isEOF; /* track file's EOF state */
1906
+ int maxBuffSz;
1907
+ };
1908
+
1909
+ /* struct bStream * bsopen (bNread readPtr, void * parm)
1910
+ *
1911
+ * Wrap a given open stream (described by a fread compatible function
1912
+ * pointer and stream handle) into an open bStream suitable for the bstring
1913
+ * library streaming functions.
1914
+ */
1915
+ struct bStream * bsopen (bNread readPtr, void * parm) {
1916
+ struct bStream * s;
1917
+
1918
+ if (readPtr == NULL) return NULL;
1919
+ s = (struct bStream *) bstr__alloc (sizeof (struct bStream));
1920
+ if (s == NULL) return NULL;
1921
+ s->parm = parm;
1922
+ s->buff = bfromcstr ("");
1923
+ s->readFnPtr = readPtr;
1924
+ s->maxBuffSz = BS_BUFF_SZ;
1925
+ s->isEOF = 0;
1926
+ return s;
1927
+ }
1928
+
1929
+ /* int bsbufflength (struct bStream * s, int sz)
1930
+ *
1931
+ * Set the length of the buffer used by the bStream. If sz is zero, the
1932
+ * length is not set. This function returns with the previous length.
1933
+ */
1934
+ int bsbufflength (struct bStream * s, int sz) {
1935
+ int oldSz;
1936
+ if (s == NULL || sz < 0) return BSTR_ERR;
1937
+ oldSz = s->maxBuffSz;
1938
+ if (sz > 0) s->maxBuffSz = sz;
1939
+ return oldSz;
1940
+ }
1941
+
1942
+ int bseof (const struct bStream * s) {
1943
+ if (s == NULL || s->readFnPtr == NULL) return BSTR_ERR;
1944
+ return s->isEOF && (s->buff->slen == 0);
1945
+ }
1946
+
1947
+ /* void * bsclose (struct bStream * s)
1948
+ *
1949
+ * Close the bStream, and return the handle to the stream that was originally
1950
+ * used to open the given stream.
1951
+ */
1952
+ void * bsclose (struct bStream * s) {
1953
+ void * parm;
1954
+ if (s == NULL) return NULL;
1955
+ s->readFnPtr = NULL;
1956
+ if (s->buff) bdestroy (s->buff);
1957
+ s->buff = NULL;
1958
+ parm = s->parm;
1959
+ s->parm = NULL;
1960
+ s->isEOF = 1;
1961
+ bstr__free (s);
1962
+ return parm;
1963
+ }
1964
+
1965
+ /* int bsreadlna (bstring r, struct bStream * s, char terminator)
1966
+ *
1967
+ * Read a bstring terminated by the terminator character or the end of the
1968
+ * stream from the bStream (s) and return it into the parameter r. This
1969
+ * function may read additional characters from the core stream that are not
1970
+ * returned, but will be retained for subsequent read operations.
1971
+ */
1972
+ int bsreadlna (bstring r, struct bStream * s, char terminator) {
1973
+ int i, l, ret, rlo;
1974
+ char * b;
1975
+ struct tagbstring x;
1976
+
1977
+ if (s == NULL || s->buff == NULL || r == NULL || r->mlen <= 0 ||
1978
+ r->slen < 0 || r->mlen < r->slen) return BSTR_ERR;
1979
+ l = s->buff->slen;
1980
+ if (BSTR_OK != balloc (s->buff, s->maxBuffSz + 1)) return BSTR_ERR;
1981
+ b = (char *) s->buff->data;
1982
+ x.data = (unsigned char *) b;
1983
+
1984
+ /* First check if the current buffer holds the terminator */
1985
+ b[l] = terminator; /* Set sentinel */
1986
+ for (i=0; b[i] != terminator; i++) ;
1987
+ if (i < l) {
1988
+ x.slen = i + 1;
1989
+ ret = bconcat (r, &x);
1990
+ s->buff->slen = l;
1991
+ if (BSTR_OK == ret) bdelete (s->buff, 0, i + 1);
1992
+ return BSTR_OK;
1993
+ }
1994
+
1995
+ rlo = r->slen;
1996
+
1997
+ /* If not then just concatenate the entire buffer to the output */
1998
+ x.slen = l;
1999
+ if (BSTR_OK != bconcat (r, &x)) return BSTR_ERR;
2000
+
2001
+ /* Perform direct in-place reads into the destination to allow for
2002
+ the minimum of data-copies */
2003
+ for (;;) {
2004
+ if (BSTR_OK != balloc (r, r->slen + s->maxBuffSz + 1)) return BSTR_ERR;
2005
+ b = (char *) (r->data + r->slen);
2006
+ l = (int) s->readFnPtr (b, 1, s->maxBuffSz, s->parm);
2007
+ if (l <= 0) {
2008
+ r->data[r->slen] = (unsigned char) '\0';
2009
+ s->buff->slen = 0;
2010
+ s->isEOF = 1;
2011
+ /* If nothing was read return with an error message */
2012
+ return BSTR_ERR & -(r->slen == rlo);
2013
+ }
2014
+ b[l] = terminator; /* Set sentinel */
2015
+ for (i=0; b[i] != terminator; i++) ;
2016
+ if (i < l) break;
2017
+ r->slen += l;
2018
+ }
2019
+
2020
+ /* Terminator found, push over-read back to buffer */
2021
+ i++;
2022
+ r->slen += i;
2023
+ s->buff->slen = l - i;
2024
+ bstr__memcpy (s->buff->data, b + i, l - i);
2025
+ r->data[r->slen] = (unsigned char) '\0';
2026
+ return BSTR_OK;
2027
+ }
2028
+
2029
+ /* int bsreadlnsa (bstring r, struct bStream * s, bstring term)
2030
+ *
2031
+ * Read a bstring terminated by any character in the term string or the end
2032
+ * of the stream from the bStream (s) and return it into the parameter r.
2033
+ * This function may read additional characters from the core stream that
2034
+ * are not returned, but will be retained for subsequent read operations.
2035
+ */
2036
+ int bsreadlnsa (bstring r, struct bStream * s, const_bstring term) {
2037
+ int i, l, ret, rlo;
2038
+ unsigned char * b;
2039
+ struct tagbstring x;
2040
+ struct charField cf;
2041
+
2042
+ if (s == NULL || s->buff == NULL || r == NULL || term == NULL ||
2043
+ term->data == NULL || r->mlen <= 0 || r->slen < 0 ||
2044
+ r->mlen < r->slen) return BSTR_ERR;
2045
+ if (term->slen == 1) return bsreadlna (r, s, term->data[0]);
2046
+ if (term->slen < 1 || buildCharField (&cf, term)) return BSTR_ERR;
2047
+
2048
+ l = s->buff->slen;
2049
+ if (BSTR_OK != balloc (s->buff, s->maxBuffSz + 1)) return BSTR_ERR;
2050
+ b = (unsigned char *) s->buff->data;
2051
+ x.data = b;
2052
+
2053
+ /* First check if the current buffer holds the terminator */
2054
+ b[l] = term->data[0]; /* Set sentinel */
2055
+ for (i=0; !testInCharField (&cf, b[i]); i++) ;
2056
+ if (i < l) {
2057
+ x.slen = i + 1;
2058
+ ret = bconcat (r, &x);
2059
+ s->buff->slen = l;
2060
+ if (BSTR_OK == ret) bdelete (s->buff, 0, i + 1);
2061
+ return BSTR_OK;
2062
+ }
2063
+
2064
+ rlo = r->slen;
2065
+
2066
+ /* If not then just concatenate the entire buffer to the output */
2067
+ x.slen = l;
2068
+ if (BSTR_OK != bconcat (r, &x)) return BSTR_ERR;
2069
+
2070
+ /* Perform direct in-place reads into the destination to allow for
2071
+ the minimum of data-copies */
2072
+ for (;;) {
2073
+ if (BSTR_OK != balloc (r, r->slen + s->maxBuffSz + 1)) return BSTR_ERR;
2074
+ b = (unsigned char *) (r->data + r->slen);
2075
+ l = (int) s->readFnPtr (b, 1, s->maxBuffSz, s->parm);
2076
+ if (l <= 0) {
2077
+ r->data[r->slen] = (unsigned char) '\0';
2078
+ s->buff->slen = 0;
2079
+ s->isEOF = 1;
2080
+ /* If nothing was read return with an error message */
2081
+ return BSTR_ERR & -(r->slen == rlo);
2082
+ }
2083
+
2084
+ b[l] = term->data[0]; /* Set sentinel */
2085
+ for (i=0; !testInCharField (&cf, b[i]); i++) ;
2086
+ if (i < l) break;
2087
+ r->slen += l;
2088
+ }
2089
+
2090
+ /* Terminator found, push over-read back to buffer */
2091
+ i++;
2092
+ r->slen += i;
2093
+ s->buff->slen = l - i;
2094
+ bstr__memcpy (s->buff->data, b + i, l - i);
2095
+ r->data[r->slen] = (unsigned char) '\0';
2096
+ return BSTR_OK;
2097
+ }
2098
+
2099
+ /* int bsreada (bstring r, struct bStream * s, int n)
2100
+ *
2101
+ * Read a bstring of length n (or, if it is fewer, as many bytes as is
2102
+ * remaining) from the bStream. This function may read additional
2103
+ * characters from the core stream that are not returned, but will be
2104
+ * retained for subsequent read operations. This function will not read
2105
+ * additional characters from the core stream beyond virtual stream pointer.
2106
+ */
2107
+ int bsreada (bstring r, struct bStream * s, int n) {
2108
+ int l, ret, orslen;
2109
+ char * b;
2110
+ struct tagbstring x;
2111
+
2112
+ if (s == NULL || s->buff == NULL || r == NULL || r->mlen <= 0
2113
+ || r->slen < 0 || r->mlen < r->slen || n <= 0) return BSTR_ERR;
2114
+
2115
+ n += r->slen;
2116
+ if (n <= 0) return BSTR_ERR;
2117
+
2118
+ l = s->buff->slen;
2119
+
2120
+ orslen = r->slen;
2121
+
2122
+ if (0 == l) {
2123
+ if (s->isEOF) return BSTR_ERR;
2124
+ if (r->mlen > n) {
2125
+ l = (int) s->readFnPtr (r->data + r->slen, 1, n - r->slen, s->parm);
2126
+ if (0 >= l || l > n - r->slen) {
2127
+ s->isEOF = 1;
2128
+ return BSTR_ERR;
2129
+ }
2130
+ r->slen += l;
2131
+ r->data[r->slen] = (unsigned char) '\0';
2132
+ return 0;
2133
+ }
2134
+ }
2135
+
2136
+ if (BSTR_OK != balloc (s->buff, s->maxBuffSz + 1)) return BSTR_ERR;
2137
+ b = (char *) s->buff->data;
2138
+ x.data = (unsigned char *) b;
2139
+
2140
+ do {
2141
+ if (l + r->slen >= n) {
2142
+ x.slen = n - r->slen;
2143
+ ret = bconcat (r, &x);
2144
+ s->buff->slen = l;
2145
+ if (BSTR_OK == ret) bdelete (s->buff, 0, x.slen);
2146
+ return BSTR_ERR & -(r->slen == orslen);
2147
+ }
2148
+
2149
+ x.slen = l;
2150
+ if (BSTR_OK != bconcat (r, &x)) break;
2151
+
2152
+ l = n - r->slen;
2153
+ if (l > s->maxBuffSz) l = s->maxBuffSz;
2154
+
2155
+ l = (int) s->readFnPtr (b, 1, l, s->parm);
2156
+
2157
+ } while (l > 0);
2158
+ if (l < 0) l = 0;
2159
+ if (l == 0) s->isEOF = 1;
2160
+ s->buff->slen = l;
2161
+ return BSTR_ERR & -(r->slen == orslen);
2162
+ }
2163
+
2164
+ /* int bsreadln (bstring r, struct bStream * s, char terminator)
2165
+ *
2166
+ * Read a bstring terminated by the terminator character or the end of the
2167
+ * stream from the bStream (s) and return it into the parameter r. This
2168
+ * function may read additional characters from the core stream that are not
2169
+ * returned, but will be retained for subsequent read operations.
2170
+ */
2171
+ int bsreadln (bstring r, struct bStream * s, char terminator) {
2172
+ if (s == NULL || s->buff == NULL || r == NULL || r->mlen <= 0)
2173
+ return BSTR_ERR;
2174
+ if (BSTR_OK != balloc (s->buff, s->maxBuffSz + 1)) return BSTR_ERR;
2175
+ r->slen = 0;
2176
+ return bsreadlna (r, s, terminator);
2177
+ }
2178
+
2179
+ /* int bsreadlns (bstring r, struct bStream * s, bstring term)
2180
+ *
2181
+ * Read a bstring terminated by any character in the term string or the end
2182
+ * of the stream from the bStream (s) and return it into the parameter r.
2183
+ * This function may read additional characters from the core stream that
2184
+ * are not returned, but will be retained for subsequent read operations.
2185
+ */
2186
+ int bsreadlns (bstring r, struct bStream * s, const_bstring term) {
2187
+ if (s == NULL || s->buff == NULL || r == NULL || term == NULL
2188
+ || term->data == NULL || r->mlen <= 0) return BSTR_ERR;
2189
+ if (term->slen == 1) return bsreadln (r, s, term->data[0]);
2190
+ if (term->slen < 1) return BSTR_ERR;
2191
+ if (BSTR_OK != balloc (s->buff, s->maxBuffSz + 1)) return BSTR_ERR;
2192
+ r->slen = 0;
2193
+ return bsreadlnsa (r, s, term);
2194
+ }
2195
+
2196
+ /* int bsread (bstring r, struct bStream * s, int n)
2197
+ *
2198
+ * Read a bstring of length n (or, if it is fewer, as many bytes as is
2199
+ * remaining) from the bStream. This function may read additional
2200
+ * characters from the core stream that are not returned, but will be
2201
+ * retained for subsequent read operations. This function will not read
2202
+ * additional characters from the core stream beyond virtual stream pointer.
2203
+ */
2204
+ int bsread (bstring r, struct bStream * s, int n) {
2205
+ if (s == NULL || s->buff == NULL || r == NULL || r->mlen <= 0
2206
+ || n <= 0) return BSTR_ERR;
2207
+ if (BSTR_OK != balloc (s->buff, s->maxBuffSz + 1)) return BSTR_ERR;
2208
+ r->slen = 0;
2209
+ return bsreada (r, s, n);
2210
+ }
2211
+
2212
+ /* int bsunread (struct bStream * s, const_bstring b)
2213
+ *
2214
+ * Insert a bstring into the bStream at the current position. These
2215
+ * characters will be read prior to those that actually come from the core
2216
+ * stream.
2217
+ */
2218
+ int bsunread (struct bStream * s, const_bstring b) {
2219
+ if (s == NULL || s->buff == NULL) return BSTR_ERR;
2220
+ return binsert (s->buff, 0, b, (unsigned char) '?');
2221
+ }
2222
+
2223
+ /* int bspeek (bstring r, const struct bStream * s)
2224
+ *
2225
+ * Return the currently buffered characters from the bStream that will be
2226
+ * read prior to reads from the core stream.
2227
+ */
2228
+ int bspeek (bstring r, const struct bStream * s) {
2229
+ if (s == NULL || s->buff == NULL) return BSTR_ERR;
2230
+ return bassign (r, s->buff);
2231
+ }
2232
+
2233
+ /* bstring bjoin (const struct bstrList * bl, const_bstring sep);
2234
+ *
2235
+ * Join the entries of a bstrList into one bstring by sequentially
2236
+ * concatenating them with the sep string in between. If there is an error
2237
+ * NULL is returned, otherwise a bstring with the correct result is returned.
2238
+ */
2239
+ bstring bjoin (const struct bstrList * bl, const_bstring sep) {
2240
+ bstring b;
2241
+ int i, c, v;
2242
+
2243
+ if (bl == NULL || bl->qty < 0) return NULL;
2244
+ if (sep != NULL && (sep->slen < 0 || sep->data == NULL)) return NULL;
2245
+
2246
+ for (i = 0, c = 1; i < bl->qty; i++) {
2247
+ v = bl->entry[i]->slen;
2248
+ if (v < 0) return NULL; /* Invalid input */
2249
+ c += v;
2250
+ if (c < 0) return NULL; /* Wrap around ?? */
2251
+ }
2252
+
2253
+ if (sep != NULL) c += (bl->qty - 1) * sep->slen;
2254
+
2255
+ b = (bstring) bstr__alloc (sizeof (struct tagbstring));
2256
+ if (NULL == b) return NULL; /* Out of memory */
2257
+ b->data = (unsigned char *) bstr__alloc (c);
2258
+ if (b->data == NULL) {
2259
+ bstr__free (b);
2260
+ return NULL;
2261
+ }
2262
+
2263
+ b->mlen = c;
2264
+ b->slen = c-1;
2265
+
2266
+ for (i = 0, c = 0; i < bl->qty; i++) {
2267
+ if (i > 0 && sep != NULL) {
2268
+ bstr__memcpy (b->data + c, sep->data, sep->slen);
2269
+ c += sep->slen;
2270
+ }
2271
+ v = bl->entry[i]->slen;
2272
+ bstr__memcpy (b->data + c, bl->entry[i]->data, v);
2273
+ c += v;
2274
+ }
2275
+ b->data[c] = (unsigned char) '\0';
2276
+ return b;
2277
+ }
2278
+
2279
+ #define BSSSC_BUFF_LEN (256)
2280
+
2281
+ /* int bssplitscb (struct bStream * s, const_bstring splitStr,
2282
+ * int (* cb) (void * parm, int ofs, const_bstring entry), void * parm)
2283
+ *
2284
+ * Iterate the set of disjoint sequential substrings read from a stream
2285
+ * divided by any of the characters in splitStr. An empty splitStr causes
2286
+ * the whole stream to be iterated once.
2287
+ *
2288
+ * Note: At the point of calling the cb function, the bStream pointer is
2289
+ * pointed exactly at the position right after having read the split
2290
+ * character. The cb function can act on the stream by causing the bStream
2291
+ * pointer to move, and bssplitscb will continue by starting the next split
2292
+ * at the position of the pointer after the return from cb.
2293
+ *
2294
+ * However, if the cb causes the bStream s to be destroyed then the cb must
2295
+ * return with a negative value, otherwise bssplitscb will continue in an
2296
+ * undefined manner.
2297
+ */
2298
+ int bssplitscb (struct bStream * s, const_bstring splitStr,
2299
+ int (* cb) (void * parm, int ofs, const_bstring entry), void * parm) {
2300
+ struct charField chrs;
2301
+ bstring buff;
2302
+ int i, p, ret;
2303
+
2304
+ if (cb == NULL || s == NULL || s->readFnPtr == NULL
2305
+ || splitStr == NULL || splitStr->slen < 0) return BSTR_ERR;
2306
+
2307
+ if (NULL == (buff = bfromcstr (""))) return BSTR_ERR;
2308
+
2309
+ if (splitStr->slen == 0) {
2310
+ while (bsreada (buff, s, BSSSC_BUFF_LEN) >= 0) ;
2311
+ if ((ret = cb (parm, 0, buff)) > 0)
2312
+ ret = 0;
2313
+ } else {
2314
+ buildCharField (&chrs, splitStr);
2315
+ ret = p = i = 0;
2316
+ for (;;) {
2317
+ if (i >= buff->slen) {
2318
+ bsreada (buff, s, BSSSC_BUFF_LEN);
2319
+ if (i >= buff->slen) {
2320
+ if (0 < (ret = cb (parm, p, buff))) ret = 0;
2321
+ break;
2322
+ }
2323
+ }
2324
+ if (testInCharField (&chrs, buff->data[i])) {
2325
+ struct tagbstring t;
2326
+ unsigned char c;
2327
+
2328
+ blk2tbstr (t, buff->data + i + 1, buff->slen - (i + 1));
2329
+ if ((ret = bsunread (s, &t)) < 0) break;
2330
+ buff->slen = i;
2331
+ c = buff->data[i];
2332
+ buff->data[i] = (unsigned char) '\0';
2333
+ if ((ret = cb (parm, p, buff)) < 0) break;
2334
+ buff->data[i] = c;
2335
+ buff->slen = 0;
2336
+ p += i + 1;
2337
+ i = -1;
2338
+ }
2339
+ i++;
2340
+ }
2341
+ }
2342
+
2343
+ bdestroy (buff);
2344
+ return ret;
2345
+ }
2346
+
2347
+ /* int bssplitstrcb (struct bStream * s, const_bstring splitStr,
2348
+ * int (* cb) (void * parm, int ofs, const_bstring entry), void * parm)
2349
+ *
2350
+ * Iterate the set of disjoint sequential substrings read from a stream
2351
+ * divided by the entire substring splitStr. An empty splitStr causes
2352
+ * each character of the stream to be iterated.
2353
+ *
2354
+ * Note: At the point of calling the cb function, the bStream pointer is
2355
+ * pointed exactly at the position right after having read the split
2356
+ * character. The cb function can act on the stream by causing the bStream
2357
+ * pointer to move, and bssplitscb will continue by starting the next split
2358
+ * at the position of the pointer after the return from cb.
2359
+ *
2360
+ * However, if the cb causes the bStream s to be destroyed then the cb must
2361
+ * return with a negative value, otherwise bssplitscb will continue in an
2362
+ * undefined manner.
2363
+ */
2364
+ int bssplitstrcb (struct bStream * s, const_bstring splitStr,
2365
+ int (* cb) (void * parm, int ofs, const_bstring entry), void * parm) {
2366
+ bstring buff;
2367
+ int i, p, ret;
2368
+
2369
+ if (cb == NULL || s == NULL || s->readFnPtr == NULL
2370
+ || splitStr == NULL || splitStr->slen < 0) return BSTR_ERR;
2371
+
2372
+ if (splitStr->slen == 1) return bssplitscb (s, splitStr, cb, parm);
2373
+
2374
+ if (NULL == (buff = bfromcstr (""))) return BSTR_ERR;
2375
+
2376
+ if (splitStr->slen == 0) {
2377
+ for (i=0; bsreada (buff, s, BSSSC_BUFF_LEN) >= 0; i++) {
2378
+ if ((ret = cb (parm, 0, buff)) < 0) {
2379
+ bdestroy (buff);
2380
+ return ret;
2381
+ }
2382
+ buff->slen = 0;
2383
+ }
2384
+ return BSTR_OK;
2385
+ } else {
2386
+ ret = p = i = 0;
2387
+ for (i=p=0;;) {
2388
+ if ((ret = binstr (buff, 0, splitStr)) >= 0) {
2389
+ struct tagbstring t;
2390
+ blk2tbstr (t, buff->data, ret);
2391
+ i = ret + splitStr->slen;
2392
+ if ((ret = cb (parm, p, &t)) < 0) break;
2393
+ p += i;
2394
+ bdelete (buff, 0, i);
2395
+ } else {
2396
+ bsreada (buff, s, BSSSC_BUFF_LEN);
2397
+ if (bseof (s)) {
2398
+ if ((ret = cb (parm, p, buff)) > 0) ret = 0;
2399
+ break;
2400
+ }
2401
+ }
2402
+ }
2403
+ }
2404
+
2405
+ bdestroy (buff);
2406
+ return ret;
2407
+ }
2408
+
2409
+ /* int bstrListCreate (void)
2410
+ *
2411
+ * Create a bstrList.
2412
+ */
2413
+ struct bstrList * bstrListCreate (void) {
2414
+ struct bstrList * sl = (struct bstrList *) bstr__alloc (sizeof (struct bstrList));
2415
+ if (sl) {
2416
+ sl->entry = (bstring *) bstr__alloc (1*sizeof (bstring));
2417
+ if (!sl->entry) {
2418
+ bstr__free (sl);
2419
+ sl = NULL;
2420
+ } else {
2421
+ sl->qty = 0;
2422
+ sl->mlen = 1;
2423
+ }
2424
+ }
2425
+ return sl;
2426
+ }
2427
+
2428
+ /* int bstrListDestroy (struct bstrList * sl)
2429
+ *
2430
+ * Destroy a bstrList that has been created by bsplit, bsplits or bstrListCreate.
2431
+ */
2432
+ int bstrListDestroy (struct bstrList * sl) {
2433
+ int i;
2434
+ if (sl == NULL || sl->qty < 0) return BSTR_ERR;
2435
+ for (i=0; i < sl->qty; i++) {
2436
+ if (sl->entry[i]) {
2437
+ bdestroy (sl->entry[i]);
2438
+ sl->entry[i] = NULL;
2439
+ }
2440
+ }
2441
+ sl->qty = -1;
2442
+ sl->mlen = -1;
2443
+ bstr__free (sl->entry);
2444
+ sl->entry = NULL;
2445
+ bstr__free (sl);
2446
+ return BSTR_OK;
2447
+ }
2448
+
2449
+ /* int bsplitcb (const_bstring str, unsigned char splitChar, int pos,
2450
+ * int (* cb) (void * parm, int ofs, int len), void * parm)
2451
+ *
2452
+ * Iterate the set of disjoint sequential substrings over str divided by the
2453
+ * character in splitChar.
2454
+ *
2455
+ * Note: Non-destructive modification of str from within the cb function
2456
+ * while performing this split is not undefined. bsplitcb behaves in
2457
+ * sequential lock step with calls to cb. I.e., after returning from a cb
2458
+ * that return a non-negative integer, bsplitcb continues from the position
2459
+ * 1 character after the last detected split character and it will halt
2460
+ * immediately if the length of str falls below this point. However, if the
2461
+ * cb function destroys str, then it *must* return with a negative value,
2462
+ * otherwise bsplitcb will continue in an undefined manner.
2463
+ */
2464
+ int bsplitcb (const_bstring str, unsigned char splitChar, int pos,
2465
+ int (* cb) (void * parm, int ofs, int len), void * parm) {
2466
+ int i, p, ret;
2467
+
2468
+ if (cb == NULL || str == NULL || pos < 0 || pos > str->slen)
2469
+ return BSTR_ERR;
2470
+
2471
+ p = pos;
2472
+ do {
2473
+ for (i=p; i < str->slen; i++) {
2474
+ if (str->data[i] == splitChar) break;
2475
+ }
2476
+ if ((ret = cb (parm, p, i - p)) < 0) return ret;
2477
+ p = i + 1;
2478
+ } while (p <= str->slen);
2479
+ return BSTR_OK;
2480
+ }
2481
+
2482
+ /* int bsplitscb (const_bstring str, const_bstring splitStr, int pos,
2483
+ * int (* cb) (void * parm, int ofs, int len), void * parm)
2484
+ *
2485
+ * Iterate the set of disjoint sequential substrings over str divided by any
2486
+ * of the characters in splitStr. An empty splitStr causes the whole str to
2487
+ * be iterated once.
2488
+ *
2489
+ * Note: Non-destructive modification of str from within the cb function
2490
+ * while performing this split is not undefined. bsplitscb behaves in
2491
+ * sequential lock step with calls to cb. I.e., after returning from a cb
2492
+ * that return a non-negative integer, bsplitscb continues from the position
2493
+ * 1 character after the last detected split character and it will halt
2494
+ * immediately if the length of str falls below this point. However, if the
2495
+ * cb function destroys str, then it *must* return with a negative value,
2496
+ * otherwise bsplitscb will continue in an undefined manner.
2497
+ */
2498
+ int bsplitscb (const_bstring str, const_bstring splitStr, int pos,
2499
+ int (* cb) (void * parm, int ofs, int len), void * parm) {
2500
+ struct charField chrs;
2501
+ int i, p, ret;
2502
+
2503
+ if (cb == NULL || str == NULL || pos < 0 || pos > str->slen
2504
+ || splitStr == NULL || splitStr->slen < 0) return BSTR_ERR;
2505
+ if (splitStr->slen == 0) {
2506
+ if ((ret = cb (parm, 0, str->slen)) > 0) ret = 0;
2507
+ return ret;
2508
+ }
2509
+
2510
+ if (splitStr->slen == 1)
2511
+ return bsplitcb (str, splitStr->data[0], pos, cb, parm);
2512
+
2513
+ buildCharField (&chrs, splitStr);
2514
+
2515
+ p = pos;
2516
+ do {
2517
+ for (i=p; i < str->slen; i++) {
2518
+ if (testInCharField (&chrs, str->data[i])) break;
2519
+ }
2520
+ if ((ret = cb (parm, p, i - p)) < 0) return ret;
2521
+ p = i + 1;
2522
+ } while (p <= str->slen);
2523
+ return BSTR_OK;
2524
+ }
2525
+
2526
+ /* int bsplitstrcb (const_bstring str, const_bstring splitStr, int pos,
2527
+ * int (* cb) (void * parm, int ofs, int len), void * parm)
2528
+ *
2529
+ * Iterate the set of disjoint sequential substrings over str divided by the
2530
+ * substring splitStr. An empty splitStr causes the whole str to be
2531
+ * iterated once.
2532
+ *
2533
+ * Note: Non-destructive modification of str from within the cb function
2534
+ * while performing this split is not undefined. bsplitstrcb behaves in
2535
+ * sequential lock step with calls to cb. I.e., after returning from a cb
2536
+ * that return a non-negative integer, bsplitscb continues from the position
2537
+ * 1 character after the last detected split character and it will halt
2538
+ * immediately if the length of str falls below this point. However, if the
2539
+ * cb function destroys str, then it *must* return with a negative value,
2540
+ * otherwise bsplitscb will continue in an undefined manner.
2541
+ */
2542
+ int bsplitstrcb (const_bstring str, const_bstring splitStr, int pos,
2543
+ int (* cb) (void * parm, int ofs, int len), void * parm) {
2544
+ int i, p, ret;
2545
+
2546
+ if (cb == NULL || str == NULL || pos < 0 || pos > str->slen
2547
+ || splitStr == NULL || splitStr->slen < 0) return BSTR_ERR;
2548
+
2549
+ if (0 == splitStr->slen) {
2550
+ for (i=pos; i < str->slen; i++) {
2551
+ if ((ret = cb (parm, i, 1)) < 0) return ret;
2552
+ }
2553
+ return BSTR_OK;
2554
+ }
2555
+
2556
+ if (splitStr->slen == 1)
2557
+ return bsplitcb (str, splitStr->data[0], pos, cb, parm);
2558
+
2559
+ for (i=p=pos; i <= str->slen - splitStr->slen; i++) {
2560
+ if (0 == bstr__memcmp (splitStr->data, str->data + i, splitStr->slen)) {
2561
+ if ((ret = cb (parm, p, i - p)) < 0) return ret;
2562
+ i += splitStr->slen;
2563
+ p = i;
2564
+ }
2565
+ }
2566
+ if ((ret = cb (parm, p, str->slen - p)) < 0) return ret;
2567
+ return BSTR_OK;
2568
+ }
2569
+
2570
+ struct genBstrList {
2571
+ bstring b;
2572
+ struct bstrList * bl;
2573
+ };
2574
+
2575
+ static int bscb (void * parm, int ofs, int len) {
2576
+ struct genBstrList * g = (struct genBstrList *) parm;
2577
+ if (g->bl->qty >= g->bl->mlen) {
2578
+ int mlen = g->bl->mlen * 2;
2579
+ bstring * tbl;
2580
+
2581
+ while (g->bl->qty >= mlen) {
2582
+ if (mlen < g->bl->mlen) return BSTR_ERR;
2583
+ mlen += mlen;
2584
+ }
2585
+
2586
+ tbl = (bstring *) bstr__realloc (g->bl->entry, sizeof (bstring) * mlen);
2587
+ if (tbl == NULL) return BSTR_ERR;
2588
+
2589
+ g->bl->entry = tbl;
2590
+ g->bl->mlen = mlen;
2591
+ }
2592
+
2593
+ g->bl->entry[g->bl->qty] = bmidstr (g->b, ofs, len);
2594
+ g->bl->qty++;
2595
+ return BSTR_OK;
2596
+ }
2597
+
2598
+ /* struct bstrList * bsplit (const_bstring str, unsigned char splitChar)
2599
+ *
2600
+ * Create an array of sequential substrings from str divided by the character
2601
+ * splitChar.
2602
+ */
2603
+ struct bstrList * bsplit (const_bstring str, unsigned char splitChar) {
2604
+ struct genBstrList g;
2605
+
2606
+ if (str == NULL || str->data == NULL || str->slen < 0) return NULL;
2607
+
2608
+ g.bl = (struct bstrList *) bstr__alloc (sizeof (struct bstrList));
2609
+ if (g.bl == NULL) return NULL;
2610
+ g.bl->mlen = 4;
2611
+ g.bl->entry = (bstring *) bstr__alloc (g.bl->mlen * sizeof (bstring));
2612
+ if (NULL == g.bl->entry) {
2613
+ bstr__free (g.bl);
2614
+ return NULL;
2615
+ }
2616
+
2617
+ g.b = (bstring) str;
2618
+ g.bl->qty = 0;
2619
+ if (bsplitcb (str, splitChar, 0, bscb, &g) < 0) {
2620
+ bstrListDestroy (g.bl);
2621
+ return NULL;
2622
+ }
2623
+ return g.bl;
2624
+ }
2625
+
2626
+ /* struct bstrList * bsplitstr (const_bstring str, const_bstring splitStr)
2627
+ *
2628
+ * Create an array of sequential substrings from str divided by the entire
2629
+ * substring splitStr.
2630
+ */
2631
+ struct bstrList * bsplitstr (const_bstring str, const_bstring splitStr) {
2632
+ struct genBstrList g;
2633
+
2634
+ if (str == NULL || str->data == NULL || str->slen < 0) return NULL;
2635
+
2636
+ g.bl = (struct bstrList *) bstr__alloc (sizeof (struct bstrList));
2637
+ if (g.bl == NULL) return NULL;
2638
+ g.bl->mlen = 4;
2639
+ g.bl->entry = (bstring *) bstr__alloc (g.bl->mlen * sizeof (bstring));
2640
+ if (NULL == g.bl->entry) {
2641
+ bstr__free (g.bl);
2642
+ return NULL;
2643
+ }
2644
+
2645
+ g.b = (bstring) str;
2646
+ g.bl->qty = 0;
2647
+ if (bsplitstrcb (str, splitStr, 0, bscb, &g) < 0) {
2648
+ bstrListDestroy (g.bl);
2649
+ return NULL;
2650
+ }
2651
+ return g.bl;
2652
+ }
2653
+
2654
+ /* struct bstrList * bsplits (const_bstring str, bstring splitStr)
2655
+ *
2656
+ * Create an array of sequential substrings from str divided by any of the
2657
+ * characters in splitStr. An empty splitStr causes a single entry bstrList
2658
+ * containing a copy of str to be returned.
2659
+ */
2660
+ struct bstrList * bsplits (const_bstring str, const_bstring splitStr) {
2661
+ struct genBstrList g;
2662
+
2663
+ if ( str == NULL || str->slen < 0 || str->data == NULL ||
2664
+ splitStr == NULL || splitStr->slen < 0 || splitStr->data == NULL)
2665
+ return NULL;
2666
+
2667
+ g.bl = (struct bstrList *) bstr__alloc (sizeof (struct bstrList));
2668
+ if (g.bl == NULL) return NULL;
2669
+ g.bl->mlen = 4;
2670
+ g.bl->entry = (bstring *) bstr__alloc (g.bl->mlen * sizeof (bstring));
2671
+ if (NULL == g.bl->entry) {
2672
+ bstr__free (g.bl);
2673
+ return NULL;
2674
+ }
2675
+ g.b = (bstring) str;
2676
+ g.bl->qty = 0;
2677
+
2678
+ if (bsplitscb (str, splitStr, 0, bscb, &g) < 0) {
2679
+ bstrListDestroy (g.bl);
2680
+ return NULL;
2681
+ }
2682
+ return g.bl;
2683
+ }
2684
+
2685
+ #if defined (__TURBOC__) && !defined (__BORLANDC__)
2686
+ # ifndef BSTRLIB_NOVSNP
2687
+ # define BSTRLIB_NOVSNP
2688
+ # endif
2689
+ #endif
2690
+
2691
+ /* Give WATCOM C/C++, MSVC some latitude for their non-support of vsnprintf */
2692
+ #if defined(__WATCOMC__) || defined(_MSC_VER)
2693
+ #define exvsnprintf(r,b,n,f,a) {r = _vsnprintf (b,n,f,a);}
2694
+ #else
2695
+ #ifdef BSTRLIB_NOVSNP
2696
+ /* This is just a hack. If you are using a system without a vsnprintf, it is
2697
+ not recommended that bformat be used at all. */
2698
+ #define exvsnprintf(r,b,n,f,a) {vsprintf (b,f,a); r = -1;}
2699
+ #define START_VSNBUFF (256)
2700
+ #else
2701
+
2702
+ #ifdef __GNUC__
2703
+ /* Something is making gcc complain about this prototype not being here, so
2704
+ I've just gone ahead and put it in. */
2705
+ //extern int vsnprintf (char *buf, size_t count, const char *format, va_list arg);
2706
+ #endif
2707
+
2708
+ #define exvsnprintf(r,b,n,f,a) {r = vsnprintf (b,n,f,a);}
2709
+ #endif
2710
+ #endif
2711
+
2712
+ #if !defined (BSTRLIB_NOVSNP)
2713
+
2714
+ #ifndef START_VSNBUFF
2715
+ #define START_VSNBUFF (16)
2716
+ #endif
2717
+
2718
+ /* On IRIX vsnprintf returns n-1 when the operation would overflow the target
2719
+ buffer, WATCOM and MSVC both return -1, while C99 requires that the
2720
+ returned value be exactly what the length would be if the buffer would be
2721
+ large enough. This leads to the idea that if the return value is larger
2722
+ than n, then changing n to the return value will reduce the number of
2723
+ iterations required. */
2724
+
2725
+ /* int bformata (bstring b, const char * fmt, ...)
2726
+ *
2727
+ * After the first parameter, it takes the same parameters as printf (), but
2728
+ * rather than outputting results to stdio, it appends the results to
2729
+ * a bstring which contains what would have been output. Note that if there
2730
+ * is an early generation of a '\0' character, the bstring will be truncated
2731
+ * to this end point.
2732
+ */
2733
+ int bformata (bstring b, const char * fmt, ...) {
2734
+ va_list arglist;
2735
+ bstring buff;
2736
+ int n, r;
2737
+
2738
+ if (b == NULL || fmt == NULL || b->data == NULL || b->mlen <= 0
2739
+ || b->slen < 0 || b->slen > b->mlen) return BSTR_ERR;
2740
+
2741
+ /* Since the length is not determinable beforehand, a search is
2742
+ performed using the truncating "vsnprintf" call (to avoid buffer
2743
+ overflows) on increasing potential sizes for the output result. */
2744
+
2745
+ if ((n = (int) (2*strlen (fmt))) < START_VSNBUFF) n = START_VSNBUFF;
2746
+ if (NULL == (buff = bfromcstralloc (n + 2, ""))) {
2747
+ n = 1;
2748
+ if (NULL == (buff = bfromcstralloc (n + 2, ""))) return BSTR_ERR;
2749
+ }
2750
+
2751
+ for (;;) {
2752
+ va_start (arglist, fmt);
2753
+ exvsnprintf (r, (char *) buff->data, n + 1, fmt, arglist);
2754
+ va_end (arglist);
2755
+
2756
+ buff->data[n] = (unsigned char) '\0';
2757
+ buff->slen = (int) (strlen) ((char *) buff->data);
2758
+
2759
+ if (buff->slen < n) break;
2760
+
2761
+ if (r > n) n = r; else n += n;
2762
+
2763
+ if (BSTR_OK != balloc (buff, n + 2)) {
2764
+ bdestroy (buff);
2765
+ return BSTR_ERR;
2766
+ }
2767
+ }
2768
+
2769
+ r = bconcat (b, buff);
2770
+ bdestroy (buff);
2771
+ return r;
2772
+ }
2773
+
2774
+ /* int bassignformat (bstring b, const char * fmt, ...)
2775
+ *
2776
+ * After the first parameter, it takes the same parameters as printf (), but
2777
+ * rather than outputting results to stdio, it outputs the results to
2778
+ * the bstring parameter b. Note that if there is an early generation of a
2779
+ * '\0' character, the bstring will be truncated to this end point.
2780
+ */
2781
+ int bassignformat (bstring b, const char * fmt, ...) {
2782
+ va_list arglist;
2783
+ bstring buff;
2784
+ int n, r;
2785
+
2786
+ if (b == NULL || fmt == NULL || b->data == NULL || b->mlen <= 0
2787
+ || b->slen < 0 || b->slen > b->mlen) return BSTR_ERR;
2788
+
2789
+ /* Since the length is not determinable beforehand, a search is
2790
+ performed using the truncating "vsnprintf" call (to avoid buffer
2791
+ overflows) on increasing potential sizes for the output result. */
2792
+
2793
+ if ((n = (int) (2*strlen (fmt))) < START_VSNBUFF) n = START_VSNBUFF;
2794
+ if (NULL == (buff = bfromcstralloc (n + 2, ""))) {
2795
+ n = 1;
2796
+ if (NULL == (buff = bfromcstralloc (n + 2, ""))) return BSTR_ERR;
2797
+ }
2798
+
2799
+ for (;;) {
2800
+ va_start (arglist, fmt);
2801
+ exvsnprintf (r, (char *) buff->data, n + 1, fmt, arglist);
2802
+ va_end (arglist);
2803
+
2804
+ buff->data[n] = (unsigned char) '\0';
2805
+ buff->slen = (int) (strlen) ((char *) buff->data);
2806
+
2807
+ if (buff->slen < n) break;
2808
+
2809
+ if (r > n) n = r; else n += n;
2810
+
2811
+ if (BSTR_OK != balloc (buff, n + 2)) {
2812
+ bdestroy (buff);
2813
+ return BSTR_ERR;
2814
+ }
2815
+ }
2816
+
2817
+ r = bassign (b, buff);
2818
+ bdestroy (buff);
2819
+ return r;
2820
+ }
2821
+
2822
+ /* bstring bformat (const char * fmt, ...)
2823
+ *
2824
+ * Takes the same parameters as printf (), but rather than outputting results
2825
+ * to stdio, it forms a bstring which contains what would have been output.
2826
+ * Note that if there is an early generation of a '\0' character, the
2827
+ * bstring will be truncated to this end point.
2828
+ */
2829
+ bstring bformat (const char * fmt, ...) {
2830
+ va_list arglist;
2831
+ bstring buff;
2832
+ int n, r;
2833
+
2834
+ if (fmt == NULL) return NULL;
2835
+
2836
+ /* Since the length is not determinable beforehand, a search is
2837
+ performed using the truncating "vsnprintf" call (to avoid buffer
2838
+ overflows) on increasing potential sizes for the output result. */
2839
+
2840
+ if ((n = (int) (2*strlen (fmt))) < START_VSNBUFF) n = START_VSNBUFF;
2841
+ if (NULL == (buff = bfromcstralloc (n + 2, ""))) {
2842
+ n = 1;
2843
+ if (NULL == (buff = bfromcstralloc (n + 2, ""))) return NULL;
2844
+ }
2845
+
2846
+ for (;;) {
2847
+ va_start (arglist, fmt);
2848
+ exvsnprintf (r, (char *) buff->data, n + 1, fmt, arglist);
2849
+ va_end (arglist);
2850
+
2851
+ buff->data[n] = (unsigned char) '\0';
2852
+ buff->slen = (int) (strlen) ((char *) buff->data);
2853
+
2854
+ if (buff->slen < n) break;
2855
+
2856
+ if (r > n) n = r; else n += n;
2857
+
2858
+ if (BSTR_OK != balloc (buff, n + 2)) {
2859
+ bdestroy (buff);
2860
+ return NULL;
2861
+ }
2862
+ }
2863
+
2864
+ return buff;
2865
+ }
2866
+
2867
+ /* int bvcformata (bstring b, int count, const char * fmt, va_list arglist)
2868
+ *
2869
+ * The bvcformata function formats data under control of the format control
2870
+ * string fmt and attempts to append the result to b. The fmt parameter is
2871
+ * the same as that of the printf function. The variable argument list is
2872
+ * replaced with arglist, which has been initialized by the va_start macro.
2873
+ * The size of the output is upper bounded by count. If the required output
2874
+ * exceeds count, the string b is not augmented with any contents and a value
2875
+ * below BSTR_ERR is returned. If a value below -count is returned then it
2876
+ * is recommended that the negative of this value be used as an update to the
2877
+ * count in a subsequent pass. On other errors, such as running out of
2878
+ * memory, parameter errors or numeric wrap around BSTR_ERR is returned.
2879
+ * BSTR_OK is returned when the output is successfully generated and
2880
+ * appended to b.
2881
+ *
2882
+ * Note: There is no sanity checking of arglist, and this function is
2883
+ * destructive of the contents of b from the b->slen point onward. If there
2884
+ * is an early generation of a '\0' character, the bstring will be truncated
2885
+ * to this end point.
2886
+ */
2887
+ int bvcformata (bstring b, int count, const char * fmt, va_list arg) {
2888
+ int n, r, l;
2889
+
2890
+ if (b == NULL || fmt == NULL || count <= 0 || b->data == NULL
2891
+ || b->mlen <= 0 || b->slen < 0 || b->slen > b->mlen) return BSTR_ERR;
2892
+
2893
+ if (count > (n = b->slen + count) + 2) return BSTR_ERR;
2894
+ if (BSTR_OK != balloc (b, n + 2)) return BSTR_ERR;
2895
+
2896
+ exvsnprintf (r, (char *) b->data + b->slen, count + 2, fmt, arg);
2897
+
2898
+ /* Did the operation complete successfully within bounds? */
2899
+
2900
+ if (n >= (l = b->slen + (int) (strlen) ((const char *) b->data + b->slen))) {
2901
+ b->slen = l;
2902
+ return BSTR_OK;
2903
+ }
2904
+
2905
+ /* Abort, since the buffer was not large enough. The return value
2906
+ tries to help set what the retry length should be. */
2907
+
2908
+ b->data[b->slen] = '\0';
2909
+ if (r > count+1) l = r; else {
2910
+ l = count+count;
2911
+ if (count > l) l = INT_MAX;
2912
+ }
2913
+ n = -l;
2914
+ if (n > BSTR_ERR-1) n = BSTR_ERR-1;
2915
+ return n;
2916
+ }
2917
+
2918
+ #endif