chipper 0.4.2

Sign up to get free protection for your applications and to get access to all the features.
Files changed (134) hide show
  1. data/README.rdoc +51 -0
  2. data/ext/extconf.rb +58 -0
  3. data/ext/libstemmer_c/Makefile +10 -0
  4. data/ext/libstemmer_c/examples/stemwords.c +209 -0
  5. data/ext/libstemmer_c/include/libstemmer.h +79 -0
  6. data/ext/libstemmer_c/libstemmer/libstemmer.c +95 -0
  7. data/ext/libstemmer_c/libstemmer/libstemmer_utf8.c +95 -0
  8. data/ext/libstemmer_c/libstemmer/modules.h +190 -0
  9. data/ext/libstemmer_c/libstemmer/modules_utf8.h +121 -0
  10. data/ext/libstemmer_c/mkinc.mak +82 -0
  11. data/ext/libstemmer_c/mkinc_utf8.mak +52 -0
  12. data/ext/libstemmer_c/runtime/api.c +66 -0
  13. data/ext/libstemmer_c/runtime/api.h +26 -0
  14. data/ext/libstemmer_c/runtime/header.h +58 -0
  15. data/ext/libstemmer_c/runtime/utilities.c +478 -0
  16. data/ext/libstemmer_c/src_c/stem_ISO_8859_1_danish.c +337 -0
  17. data/ext/libstemmer_c/src_c/stem_ISO_8859_1_danish.h +16 -0
  18. data/ext/libstemmer_c/src_c/stem_ISO_8859_1_dutch.c +624 -0
  19. data/ext/libstemmer_c/src_c/stem_ISO_8859_1_dutch.h +16 -0
  20. data/ext/libstemmer_c/src_c/stem_ISO_8859_1_english.c +1117 -0
  21. data/ext/libstemmer_c/src_c/stem_ISO_8859_1_english.h +16 -0
  22. data/ext/libstemmer_c/src_c/stem_ISO_8859_1_finnish.c +762 -0
  23. data/ext/libstemmer_c/src_c/stem_ISO_8859_1_finnish.h +16 -0
  24. data/ext/libstemmer_c/src_c/stem_ISO_8859_1_french.c +1246 -0
  25. data/ext/libstemmer_c/src_c/stem_ISO_8859_1_french.h +16 -0
  26. data/ext/libstemmer_c/src_c/stem_ISO_8859_1_german.c +521 -0
  27. data/ext/libstemmer_c/src_c/stem_ISO_8859_1_german.h +16 -0
  28. data/ext/libstemmer_c/src_c/stem_ISO_8859_1_hungarian.c +1230 -0
  29. data/ext/libstemmer_c/src_c/stem_ISO_8859_1_hungarian.h +16 -0
  30. data/ext/libstemmer_c/src_c/stem_ISO_8859_1_italian.c +1065 -0
  31. data/ext/libstemmer_c/src_c/stem_ISO_8859_1_italian.h +16 -0
  32. data/ext/libstemmer_c/src_c/stem_ISO_8859_1_norwegian.c +297 -0
  33. data/ext/libstemmer_c/src_c/stem_ISO_8859_1_norwegian.h +16 -0
  34. data/ext/libstemmer_c/src_c/stem_ISO_8859_1_porter.c +749 -0
  35. data/ext/libstemmer_c/src_c/stem_ISO_8859_1_porter.h +16 -0
  36. data/ext/libstemmer_c/src_c/stem_ISO_8859_1_portuguese.c +1017 -0
  37. data/ext/libstemmer_c/src_c/stem_ISO_8859_1_portuguese.h +16 -0
  38. data/ext/libstemmer_c/src_c/stem_ISO_8859_1_spanish.c +1093 -0
  39. data/ext/libstemmer_c/src_c/stem_ISO_8859_1_spanish.h +16 -0
  40. data/ext/libstemmer_c/src_c/stem_ISO_8859_1_swedish.c +307 -0
  41. data/ext/libstemmer_c/src_c/stem_ISO_8859_1_swedish.h +16 -0
  42. data/ext/libstemmer_c/src_c/stem_ISO_8859_2_romanian.c +998 -0
  43. data/ext/libstemmer_c/src_c/stem_ISO_8859_2_romanian.h +16 -0
  44. data/ext/libstemmer_c/src_c/stem_KOI8_R_russian.c +700 -0
  45. data/ext/libstemmer_c/src_c/stem_KOI8_R_russian.h +16 -0
  46. data/ext/libstemmer_c/src_c/stem_UTF_8_danish.c +339 -0
  47. data/ext/libstemmer_c/src_c/stem_UTF_8_danish.h +16 -0
  48. data/ext/libstemmer_c/src_c/stem_UTF_8_dutch.c +634 -0
  49. data/ext/libstemmer_c/src_c/stem_UTF_8_dutch.h +16 -0
  50. data/ext/libstemmer_c/src_c/stem_UTF_8_english.c +1125 -0
  51. data/ext/libstemmer_c/src_c/stem_UTF_8_english.h +16 -0
  52. data/ext/libstemmer_c/src_c/stem_UTF_8_finnish.c +768 -0
  53. data/ext/libstemmer_c/src_c/stem_UTF_8_finnish.h +16 -0
  54. data/ext/libstemmer_c/src_c/stem_UTF_8_french.c +1256 -0
  55. data/ext/libstemmer_c/src_c/stem_UTF_8_french.h +16 -0
  56. data/ext/libstemmer_c/src_c/stem_UTF_8_german.c +527 -0
  57. data/ext/libstemmer_c/src_c/stem_UTF_8_german.h +16 -0
  58. data/ext/libstemmer_c/src_c/stem_UTF_8_hungarian.c +1234 -0
  59. data/ext/libstemmer_c/src_c/stem_UTF_8_hungarian.h +16 -0
  60. data/ext/libstemmer_c/src_c/stem_UTF_8_italian.c +1073 -0
  61. data/ext/libstemmer_c/src_c/stem_UTF_8_italian.h +16 -0
  62. data/ext/libstemmer_c/src_c/stem_UTF_8_norwegian.c +299 -0
  63. data/ext/libstemmer_c/src_c/stem_UTF_8_norwegian.h +16 -0
  64. data/ext/libstemmer_c/src_c/stem_UTF_8_porter.c +755 -0
  65. data/ext/libstemmer_c/src_c/stem_UTF_8_porter.h +16 -0
  66. data/ext/libstemmer_c/src_c/stem_UTF_8_portuguese.c +1023 -0
  67. data/ext/libstemmer_c/src_c/stem_UTF_8_portuguese.h +16 -0
  68. data/ext/libstemmer_c/src_c/stem_UTF_8_romanian.c +1004 -0
  69. data/ext/libstemmer_c/src_c/stem_UTF_8_romanian.h +16 -0
  70. data/ext/libstemmer_c/src_c/stem_UTF_8_russian.c +694 -0
  71. data/ext/libstemmer_c/src_c/stem_UTF_8_russian.h +16 -0
  72. data/ext/libstemmer_c/src_c/stem_UTF_8_spanish.c +1097 -0
  73. data/ext/libstemmer_c/src_c/stem_UTF_8_spanish.h +16 -0
  74. data/ext/libstemmer_c/src_c/stem_UTF_8_swedish.c +309 -0
  75. data/ext/libstemmer_c/src_c/stem_UTF_8_swedish.h +16 -0
  76. data/ext/libstemmer_c/src_c/stem_UTF_8_turkish.c +2205 -0
  77. data/ext/libstemmer_c/src_c/stem_UTF_8_turkish.h +16 -0
  78. data/ext/re2/bitstate.cc +378 -0
  79. data/ext/re2/compile.cc +1138 -0
  80. data/ext/re2/dfa.cc +2086 -0
  81. data/ext/re2/filtered_re2.cc +100 -0
  82. data/ext/re2/filtered_re2.h +99 -0
  83. data/ext/re2/hash.cc +231 -0
  84. data/ext/re2/mimics_pcre.cc +185 -0
  85. data/ext/re2/nfa.cc +709 -0
  86. data/ext/re2/onepass.cc +614 -0
  87. data/ext/re2/parse.cc +2202 -0
  88. data/ext/re2/perl_groups.cc +119 -0
  89. data/ext/re2/prefilter.cc +671 -0
  90. data/ext/re2/prefilter.h +105 -0
  91. data/ext/re2/prefilter_tree.cc +398 -0
  92. data/ext/re2/prefilter_tree.h +130 -0
  93. data/ext/re2/prog.cc +341 -0
  94. data/ext/re2/prog.h +376 -0
  95. data/ext/re2/re2.cc +1180 -0
  96. data/ext/re2/re2.h +837 -0
  97. data/ext/re2/regexp.cc +920 -0
  98. data/ext/re2/regexp.h +632 -0
  99. data/ext/re2/rune.cc +258 -0
  100. data/ext/re2/set.cc +113 -0
  101. data/ext/re2/set.h +55 -0
  102. data/ext/re2/simplify.cc +393 -0
  103. data/ext/re2/stringpiece.cc +87 -0
  104. data/ext/re2/stringpiece.h +182 -0
  105. data/ext/re2/tostring.cc +341 -0
  106. data/ext/re2/unicode_casefold.cc +469 -0
  107. data/ext/re2/unicode_casefold.h +75 -0
  108. data/ext/re2/unicode_groups.cc +4851 -0
  109. data/ext/re2/unicode_groups.h +64 -0
  110. data/ext/re2/valgrind.cc +24 -0
  111. data/ext/re2/variadic_function.h +346 -0
  112. data/ext/re2/walker-inl.h +244 -0
  113. data/ext/src/chipper.cc +626 -0
  114. data/ext/src/version.h +1 -0
  115. data/ext/stemmer.rb +40 -0
  116. data/ext/util/arena.h +103 -0
  117. data/ext/util/atomicops.h +79 -0
  118. data/ext/util/benchmark.h +41 -0
  119. data/ext/util/flags.h +27 -0
  120. data/ext/util/logging.h +78 -0
  121. data/ext/util/mutex.h +190 -0
  122. data/ext/util/pcre.h +679 -0
  123. data/ext/util/random.h +29 -0
  124. data/ext/util/sparse_array.h +451 -0
  125. data/ext/util/sparse_set.h +177 -0
  126. data/ext/util/test.h +57 -0
  127. data/ext/util/thread.h +26 -0
  128. data/ext/util/utf.h +43 -0
  129. data/ext/util/util.h +127 -0
  130. data/ext/util/valgrind.h +4517 -0
  131. data/test/helper.rb +5 -0
  132. data/test/test_entities.rb +57 -0
  133. data/test/test_tokens.rb +118 -0
  134. metadata +199 -0
@@ -0,0 +1,624 @@
1
+
2
+ /* This file was generated automatically by the Snowball to ANSI C compiler */
3
+
4
+ #include "../runtime/header.h"
5
+
6
+ #ifdef __cplusplus
7
+ extern "C" {
8
+ #endif
9
+ extern int dutch_ISO_8859_1_stem(struct SN_env * z);
10
+ #ifdef __cplusplus
11
+ }
12
+ #endif
13
+ static int r_standard_suffix(struct SN_env * z);
14
+ static int r_undouble(struct SN_env * z);
15
+ static int r_R2(struct SN_env * z);
16
+ static int r_R1(struct SN_env * z);
17
+ static int r_mark_regions(struct SN_env * z);
18
+ static int r_en_ending(struct SN_env * z);
19
+ static int r_e_ending(struct SN_env * z);
20
+ static int r_postlude(struct SN_env * z);
21
+ static int r_prelude(struct SN_env * z);
22
+ #ifdef __cplusplus
23
+ extern "C" {
24
+ #endif
25
+
26
+
27
+ extern struct SN_env * dutch_ISO_8859_1_create_env(void);
28
+ extern void dutch_ISO_8859_1_close_env(struct SN_env * z);
29
+
30
+
31
+ #ifdef __cplusplus
32
+ }
33
+ #endif
34
+ static const symbol s_0_1[1] = { 0xE1 };
35
+ static const symbol s_0_2[1] = { 0xE4 };
36
+ static const symbol s_0_3[1] = { 0xE9 };
37
+ static const symbol s_0_4[1] = { 0xEB };
38
+ static const symbol s_0_5[1] = { 0xED };
39
+ static const symbol s_0_6[1] = { 0xEF };
40
+ static const symbol s_0_7[1] = { 0xF3 };
41
+ static const symbol s_0_8[1] = { 0xF6 };
42
+ static const symbol s_0_9[1] = { 0xFA };
43
+ static const symbol s_0_10[1] = { 0xFC };
44
+
45
+ static const struct among a_0[11] =
46
+ {
47
+ /* 0 */ { 0, 0, -1, 6, 0},
48
+ /* 1 */ { 1, s_0_1, 0, 1, 0},
49
+ /* 2 */ { 1, s_0_2, 0, 1, 0},
50
+ /* 3 */ { 1, s_0_3, 0, 2, 0},
51
+ /* 4 */ { 1, s_0_4, 0, 2, 0},
52
+ /* 5 */ { 1, s_0_5, 0, 3, 0},
53
+ /* 6 */ { 1, s_0_6, 0, 3, 0},
54
+ /* 7 */ { 1, s_0_7, 0, 4, 0},
55
+ /* 8 */ { 1, s_0_8, 0, 4, 0},
56
+ /* 9 */ { 1, s_0_9, 0, 5, 0},
57
+ /* 10 */ { 1, s_0_10, 0, 5, 0}
58
+ };
59
+
60
+ static const symbol s_1_1[1] = { 'I' };
61
+ static const symbol s_1_2[1] = { 'Y' };
62
+
63
+ static const struct among a_1[3] =
64
+ {
65
+ /* 0 */ { 0, 0, -1, 3, 0},
66
+ /* 1 */ { 1, s_1_1, 0, 2, 0},
67
+ /* 2 */ { 1, s_1_2, 0, 1, 0}
68
+ };
69
+
70
+ static const symbol s_2_0[2] = { 'd', 'd' };
71
+ static const symbol s_2_1[2] = { 'k', 'k' };
72
+ static const symbol s_2_2[2] = { 't', 't' };
73
+
74
+ static const struct among a_2[3] =
75
+ {
76
+ /* 0 */ { 2, s_2_0, -1, -1, 0},
77
+ /* 1 */ { 2, s_2_1, -1, -1, 0},
78
+ /* 2 */ { 2, s_2_2, -1, -1, 0}
79
+ };
80
+
81
+ static const symbol s_3_0[3] = { 'e', 'n', 'e' };
82
+ static const symbol s_3_1[2] = { 's', 'e' };
83
+ static const symbol s_3_2[2] = { 'e', 'n' };
84
+ static const symbol s_3_3[5] = { 'h', 'e', 'd', 'e', 'n' };
85
+ static const symbol s_3_4[1] = { 's' };
86
+
87
+ static const struct among a_3[5] =
88
+ {
89
+ /* 0 */ { 3, s_3_0, -1, 2, 0},
90
+ /* 1 */ { 2, s_3_1, -1, 3, 0},
91
+ /* 2 */ { 2, s_3_2, -1, 2, 0},
92
+ /* 3 */ { 5, s_3_3, 2, 1, 0},
93
+ /* 4 */ { 1, s_3_4, -1, 3, 0}
94
+ };
95
+
96
+ static const symbol s_4_0[3] = { 'e', 'n', 'd' };
97
+ static const symbol s_4_1[2] = { 'i', 'g' };
98
+ static const symbol s_4_2[3] = { 'i', 'n', 'g' };
99
+ static const symbol s_4_3[4] = { 'l', 'i', 'j', 'k' };
100
+ static const symbol s_4_4[4] = { 'b', 'a', 'a', 'r' };
101
+ static const symbol s_4_5[3] = { 'b', 'a', 'r' };
102
+
103
+ static const struct among a_4[6] =
104
+ {
105
+ /* 0 */ { 3, s_4_0, -1, 1, 0},
106
+ /* 1 */ { 2, s_4_1, -1, 2, 0},
107
+ /* 2 */ { 3, s_4_2, -1, 1, 0},
108
+ /* 3 */ { 4, s_4_3, -1, 3, 0},
109
+ /* 4 */ { 4, s_4_4, -1, 4, 0},
110
+ /* 5 */ { 3, s_4_5, -1, 5, 0}
111
+ };
112
+
113
+ static const symbol s_5_0[2] = { 'a', 'a' };
114
+ static const symbol s_5_1[2] = { 'e', 'e' };
115
+ static const symbol s_5_2[2] = { 'o', 'o' };
116
+ static const symbol s_5_3[2] = { 'u', 'u' };
117
+
118
+ static const struct among a_5[4] =
119
+ {
120
+ /* 0 */ { 2, s_5_0, -1, -1, 0},
121
+ /* 1 */ { 2, s_5_1, -1, -1, 0},
122
+ /* 2 */ { 2, s_5_2, -1, -1, 0},
123
+ /* 3 */ { 2, s_5_3, -1, -1, 0}
124
+ };
125
+
126
/*
 * Character-class bitmaps handed to the in_grouping / out_grouping helpers.
 * NOTE(review): presumably one bit per character code, counted from the "min"
 * argument given at each call site (97 for g_v and g_v_j, 73 for g_v_I, with
 * 232 as "max" everywhere) -- the helpers are defined outside this file, confirm.
 */

/* Passed with range 97..232. */
static const unsigned char g_v[] = {
    17, 65, 16, 1,
    0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
    128
};

/* Passed with range 73..232; same byte pattern as g_v shifted by three bytes, plus bit 0 of byte 0. */
static const unsigned char g_v_I[] = {
    1, 0, 0,
    17, 65, 16, 1,
    0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
    128
};

/* Passed with range 97..232; differs from g_v only in byte 1 (67 instead of 65). */
static const unsigned char g_v_j[] = {
    17, 67, 16, 1,
    0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
    128
};
131
+
132
+ static const symbol s_0[] = { 'a' };
133
+ static const symbol s_1[] = { 'e' };
134
+ static const symbol s_2[] = { 'i' };
135
+ static const symbol s_3[] = { 'o' };
136
+ static const symbol s_4[] = { 'u' };
137
+ static const symbol s_5[] = { 'y' };
138
+ static const symbol s_6[] = { 'Y' };
139
+ static const symbol s_7[] = { 'i' };
140
+ static const symbol s_8[] = { 'I' };
141
+ static const symbol s_9[] = { 'y' };
142
+ static const symbol s_10[] = { 'Y' };
143
+ static const symbol s_11[] = { 'y' };
144
+ static const symbol s_12[] = { 'i' };
145
+ static const symbol s_13[] = { 'e' };
146
+ static const symbol s_14[] = { 'g', 'e', 'm' };
147
+ static const symbol s_15[] = { 'h', 'e', 'i', 'd' };
148
+ static const symbol s_16[] = { 'h', 'e', 'i', 'd' };
149
+ static const symbol s_17[] = { 'c' };
150
+ static const symbol s_18[] = { 'e', 'n' };
151
+ static const symbol s_19[] = { 'i', 'g' };
152
+ static const symbol s_20[] = { 'e' };
153
+ static const symbol s_21[] = { 'e' };
154
+
155
+ static int r_prelude(struct SN_env * z) {
156
+ int among_var;
157
+ { int c_test = z->c; /* test, line 42 */
158
+ while(1) { /* repeat, line 42 */
159
+ int c1 = z->c;
160
+ z->bra = z->c; /* [, line 43 */
161
+ if (z->c >= z->l || z->p[z->c + 0] >> 5 != 7 || !((340306450 >> (z->p[z->c + 0] & 0x1f)) & 1)) among_var = 6; else
162
+ among_var = find_among(z, a_0, 11); /* substring, line 43 */
163
+ if (!(among_var)) goto lab0;
164
+ z->ket = z->c; /* ], line 43 */
165
+ switch(among_var) {
166
+ case 0: goto lab0;
167
+ case 1:
168
+ { int ret = slice_from_s(z, 1, s_0); /* <-, line 45 */
169
+ if (ret < 0) return ret;
170
+ }
171
+ break;
172
+ case 2:
173
+ { int ret = slice_from_s(z, 1, s_1); /* <-, line 47 */
174
+ if (ret < 0) return ret;
175
+ }
176
+ break;
177
+ case 3:
178
+ { int ret = slice_from_s(z, 1, s_2); /* <-, line 49 */
179
+ if (ret < 0) return ret;
180
+ }
181
+ break;
182
+ case 4:
183
+ { int ret = slice_from_s(z, 1, s_3); /* <-, line 51 */
184
+ if (ret < 0) return ret;
185
+ }
186
+ break;
187
+ case 5:
188
+ { int ret = slice_from_s(z, 1, s_4); /* <-, line 53 */
189
+ if (ret < 0) return ret;
190
+ }
191
+ break;
192
+ case 6:
193
+ if (z->c >= z->l) goto lab0;
194
+ z->c++; /* next, line 54 */
195
+ break;
196
+ }
197
+ continue;
198
+ lab0:
199
+ z->c = c1;
200
+ break;
201
+ }
202
+ z->c = c_test;
203
+ }
204
+ { int c_keep = z->c; /* try, line 57 */
205
+ z->bra = z->c; /* [, line 57 */
206
+ if (!(eq_s(z, 1, s_5))) { z->c = c_keep; goto lab1; }
207
+ z->ket = z->c; /* ], line 57 */
208
+ { int ret = slice_from_s(z, 1, s_6); /* <-, line 57 */
209
+ if (ret < 0) return ret;
210
+ }
211
+ lab1:
212
+ ;
213
+ }
214
+ while(1) { /* repeat, line 58 */
215
+ int c2 = z->c;
216
+ while(1) { /* goto, line 58 */
217
+ int c3 = z->c;
218
+ if (in_grouping(z, g_v, 97, 232, 0)) goto lab3;
219
+ z->bra = z->c; /* [, line 59 */
220
+ { int c4 = z->c; /* or, line 59 */
221
+ if (!(eq_s(z, 1, s_7))) goto lab5;
222
+ z->ket = z->c; /* ], line 59 */
223
+ if (in_grouping(z, g_v, 97, 232, 0)) goto lab5;
224
+ { int ret = slice_from_s(z, 1, s_8); /* <-, line 59 */
225
+ if (ret < 0) return ret;
226
+ }
227
+ goto lab4;
228
+ lab5:
229
+ z->c = c4;
230
+ if (!(eq_s(z, 1, s_9))) goto lab3;
231
+ z->ket = z->c; /* ], line 60 */
232
+ { int ret = slice_from_s(z, 1, s_10); /* <-, line 60 */
233
+ if (ret < 0) return ret;
234
+ }
235
+ }
236
+ lab4:
237
+ z->c = c3;
238
+ break;
239
+ lab3:
240
+ z->c = c3;
241
+ if (z->c >= z->l) goto lab2;
242
+ z->c++; /* goto, line 58 */
243
+ }
244
+ continue;
245
+ lab2:
246
+ z->c = c2;
247
+ break;
248
+ }
249
+ return 1;
250
+ }
251
+
252
+ static int r_mark_regions(struct SN_env * z) {
253
+ z->I[0] = z->l;
254
+ z->I[1] = z->l;
255
+ { /* gopast */ /* grouping v, line 69 */
256
+ int ret = out_grouping(z, g_v, 97, 232, 1);
257
+ if (ret < 0) return 0;
258
+ z->c += ret;
259
+ }
260
+ { /* gopast */ /* non v, line 69 */
261
+ int ret = in_grouping(z, g_v, 97, 232, 1);
262
+ if (ret < 0) return 0;
263
+ z->c += ret;
264
+ }
265
+ z->I[0] = z->c; /* setmark p1, line 69 */
266
+ /* try, line 70 */
267
+ if (!(z->I[0] < 3)) goto lab0;
268
+ z->I[0] = 3;
269
+ lab0:
270
+ { /* gopast */ /* grouping v, line 71 */
271
+ int ret = out_grouping(z, g_v, 97, 232, 1);
272
+ if (ret < 0) return 0;
273
+ z->c += ret;
274
+ }
275
+ { /* gopast */ /* non v, line 71 */
276
+ int ret = in_grouping(z, g_v, 97, 232, 1);
277
+ if (ret < 0) return 0;
278
+ z->c += ret;
279
+ }
280
+ z->I[1] = z->c; /* setmark p2, line 71 */
281
+ return 1;
282
+ }
283
+
284
+ static int r_postlude(struct SN_env * z) {
285
+ int among_var;
286
+ while(1) { /* repeat, line 75 */
287
+ int c1 = z->c;
288
+ z->bra = z->c; /* [, line 77 */
289
+ if (z->c >= z->l || (z->p[z->c + 0] != 73 && z->p[z->c + 0] != 89)) among_var = 3; else
290
+ among_var = find_among(z, a_1, 3); /* substring, line 77 */
291
+ if (!(among_var)) goto lab0;
292
+ z->ket = z->c; /* ], line 77 */
293
+ switch(among_var) {
294
+ case 0: goto lab0;
295
+ case 1:
296
+ { int ret = slice_from_s(z, 1, s_11); /* <-, line 78 */
297
+ if (ret < 0) return ret;
298
+ }
299
+ break;
300
+ case 2:
301
+ { int ret = slice_from_s(z, 1, s_12); /* <-, line 79 */
302
+ if (ret < 0) return ret;
303
+ }
304
+ break;
305
+ case 3:
306
+ if (z->c >= z->l) goto lab0;
307
+ z->c++; /* next, line 80 */
308
+ break;
309
+ }
310
+ continue;
311
+ lab0:
312
+ z->c = c1;
313
+ break;
314
+ }
315
+ return 1;
316
+ }
317
+
318
+ static int r_R1(struct SN_env * z) {
319
+ if (!(z->I[0] <= z->c)) return 0;
320
+ return 1;
321
+ }
322
+
323
+ static int r_R2(struct SN_env * z) {
324
+ if (!(z->I[1] <= z->c)) return 0;
325
+ return 1;
326
+ }
327
+
328
+ static int r_undouble(struct SN_env * z) {
329
+ { int m_test = z->l - z->c; /* test, line 91 */
330
+ if (z->c - 1 <= z->lb || z->p[z->c - 1] >> 5 != 3 || !((1050640 >> (z->p[z->c - 1] & 0x1f)) & 1)) return 0;
331
+ if (!(find_among_b(z, a_2, 3))) return 0; /* among, line 91 */
332
+ z->c = z->l - m_test;
333
+ }
334
+ z->ket = z->c; /* [, line 91 */
335
+ if (z->c <= z->lb) return 0;
336
+ z->c--; /* next, line 91 */
337
+ z->bra = z->c; /* ], line 91 */
338
+ { int ret = slice_del(z); /* delete, line 91 */
339
+ if (ret < 0) return ret;
340
+ }
341
+ return 1;
342
+ }
343
+
344
+ static int r_e_ending(struct SN_env * z) {
345
+ z->B[0] = 0; /* unset e_found, line 95 */
346
+ z->ket = z->c; /* [, line 96 */
347
+ if (!(eq_s_b(z, 1, s_13))) return 0;
348
+ z->bra = z->c; /* ], line 96 */
349
+ { int ret = r_R1(z);
350
+ if (ret == 0) return 0; /* call R1, line 96 */
351
+ if (ret < 0) return ret;
352
+ }
353
+ { int m_test = z->l - z->c; /* test, line 96 */
354
+ if (out_grouping_b(z, g_v, 97, 232, 0)) return 0;
355
+ z->c = z->l - m_test;
356
+ }
357
+ { int ret = slice_del(z); /* delete, line 96 */
358
+ if (ret < 0) return ret;
359
+ }
360
+ z->B[0] = 1; /* set e_found, line 97 */
361
+ { int ret = r_undouble(z);
362
+ if (ret == 0) return 0; /* call undouble, line 98 */
363
+ if (ret < 0) return ret;
364
+ }
365
+ return 1;
366
+ }
367
+
368
+ static int r_en_ending(struct SN_env * z) {
369
+ { int ret = r_R1(z);
370
+ if (ret == 0) return 0; /* call R1, line 102 */
371
+ if (ret < 0) return ret;
372
+ }
373
+ { int m1 = z->l - z->c; (void)m1; /* and, line 102 */
374
+ if (out_grouping_b(z, g_v, 97, 232, 0)) return 0;
375
+ z->c = z->l - m1;
376
+ { int m2 = z->l - z->c; (void)m2; /* not, line 102 */
377
+ if (!(eq_s_b(z, 3, s_14))) goto lab0;
378
+ return 0;
379
+ lab0:
380
+ z->c = z->l - m2;
381
+ }
382
+ }
383
+ { int ret = slice_del(z); /* delete, line 102 */
384
+ if (ret < 0) return ret;
385
+ }
386
+ { int ret = r_undouble(z);
387
+ if (ret == 0) return 0; /* call undouble, line 103 */
388
+ if (ret < 0) return ret;
389
+ }
390
+ return 1;
391
+ }
392
+
393
+ static int r_standard_suffix(struct SN_env * z) {
394
+ int among_var;
395
+ { int m1 = z->l - z->c; (void)m1; /* do, line 107 */
396
+ z->ket = z->c; /* [, line 108 */
397
+ if (z->c <= z->lb || z->p[z->c - 1] >> 5 != 3 || !((540704 >> (z->p[z->c - 1] & 0x1f)) & 1)) goto lab0;
398
+ among_var = find_among_b(z, a_3, 5); /* substring, line 108 */
399
+ if (!(among_var)) goto lab0;
400
+ z->bra = z->c; /* ], line 108 */
401
+ switch(among_var) {
402
+ case 0: goto lab0;
403
+ case 1:
404
+ { int ret = r_R1(z);
405
+ if (ret == 0) goto lab0; /* call R1, line 110 */
406
+ if (ret < 0) return ret;
407
+ }
408
+ { int ret = slice_from_s(z, 4, s_15); /* <-, line 110 */
409
+ if (ret < 0) return ret;
410
+ }
411
+ break;
412
+ case 2:
413
+ { int ret = r_en_ending(z);
414
+ if (ret == 0) goto lab0; /* call en_ending, line 113 */
415
+ if (ret < 0) return ret;
416
+ }
417
+ break;
418
+ case 3:
419
+ { int ret = r_R1(z);
420
+ if (ret == 0) goto lab0; /* call R1, line 116 */
421
+ if (ret < 0) return ret;
422
+ }
423
+ if (out_grouping_b(z, g_v_j, 97, 232, 0)) goto lab0;
424
+ { int ret = slice_del(z); /* delete, line 116 */
425
+ if (ret < 0) return ret;
426
+ }
427
+ break;
428
+ }
429
+ lab0:
430
+ z->c = z->l - m1;
431
+ }
432
+ { int m2 = z->l - z->c; (void)m2; /* do, line 120 */
433
+ { int ret = r_e_ending(z);
434
+ if (ret == 0) goto lab1; /* call e_ending, line 120 */
435
+ if (ret < 0) return ret;
436
+ }
437
+ lab1:
438
+ z->c = z->l - m2;
439
+ }
440
+ { int m3 = z->l - z->c; (void)m3; /* do, line 122 */
441
+ z->ket = z->c; /* [, line 122 */
442
+ if (!(eq_s_b(z, 4, s_16))) goto lab2;
443
+ z->bra = z->c; /* ], line 122 */
444
+ { int ret = r_R2(z);
445
+ if (ret == 0) goto lab2; /* call R2, line 122 */
446
+ if (ret < 0) return ret;
447
+ }
448
+ { int m4 = z->l - z->c; (void)m4; /* not, line 122 */
449
+ if (!(eq_s_b(z, 1, s_17))) goto lab3;
450
+ goto lab2;
451
+ lab3:
452
+ z->c = z->l - m4;
453
+ }
454
+ { int ret = slice_del(z); /* delete, line 122 */
455
+ if (ret < 0) return ret;
456
+ }
457
+ z->ket = z->c; /* [, line 123 */
458
+ if (!(eq_s_b(z, 2, s_18))) goto lab2;
459
+ z->bra = z->c; /* ], line 123 */
460
+ { int ret = r_en_ending(z);
461
+ if (ret == 0) goto lab2; /* call en_ending, line 123 */
462
+ if (ret < 0) return ret;
463
+ }
464
+ lab2:
465
+ z->c = z->l - m3;
466
+ }
467
+ { int m5 = z->l - z->c; (void)m5; /* do, line 126 */
468
+ z->ket = z->c; /* [, line 127 */
469
+ if (z->c - 1 <= z->lb || z->p[z->c - 1] >> 5 != 3 || !((264336 >> (z->p[z->c - 1] & 0x1f)) & 1)) goto lab4;
470
+ among_var = find_among_b(z, a_4, 6); /* substring, line 127 */
471
+ if (!(among_var)) goto lab4;
472
+ z->bra = z->c; /* ], line 127 */
473
+ switch(among_var) {
474
+ case 0: goto lab4;
475
+ case 1:
476
+ { int ret = r_R2(z);
477
+ if (ret == 0) goto lab4; /* call R2, line 129 */
478
+ if (ret < 0) return ret;
479
+ }
480
+ { int ret = slice_del(z); /* delete, line 129 */
481
+ if (ret < 0) return ret;
482
+ }
483
+ { int m6 = z->l - z->c; (void)m6; /* or, line 130 */
484
+ z->ket = z->c; /* [, line 130 */
485
+ if (!(eq_s_b(z, 2, s_19))) goto lab6;
486
+ z->bra = z->c; /* ], line 130 */
487
+ { int ret = r_R2(z);
488
+ if (ret == 0) goto lab6; /* call R2, line 130 */
489
+ if (ret < 0) return ret;
490
+ }
491
+ { int m7 = z->l - z->c; (void)m7; /* not, line 130 */
492
+ if (!(eq_s_b(z, 1, s_20))) goto lab7;
493
+ goto lab6;
494
+ lab7:
495
+ z->c = z->l - m7;
496
+ }
497
+ { int ret = slice_del(z); /* delete, line 130 */
498
+ if (ret < 0) return ret;
499
+ }
500
+ goto lab5;
501
+ lab6:
502
+ z->c = z->l - m6;
503
+ { int ret = r_undouble(z);
504
+ if (ret == 0) goto lab4; /* call undouble, line 130 */
505
+ if (ret < 0) return ret;
506
+ }
507
+ }
508
+ lab5:
509
+ break;
510
+ case 2:
511
+ { int ret = r_R2(z);
512
+ if (ret == 0) goto lab4; /* call R2, line 133 */
513
+ if (ret < 0) return ret;
514
+ }
515
+ { int m8 = z->l - z->c; (void)m8; /* not, line 133 */
516
+ if (!(eq_s_b(z, 1, s_21))) goto lab8;
517
+ goto lab4;
518
+ lab8:
519
+ z->c = z->l - m8;
520
+ }
521
+ { int ret = slice_del(z); /* delete, line 133 */
522
+ if (ret < 0) return ret;
523
+ }
524
+ break;
525
+ case 3:
526
+ { int ret = r_R2(z);
527
+ if (ret == 0) goto lab4; /* call R2, line 136 */
528
+ if (ret < 0) return ret;
529
+ }
530
+ { int ret = slice_del(z); /* delete, line 136 */
531
+ if (ret < 0) return ret;
532
+ }
533
+ { int ret = r_e_ending(z);
534
+ if (ret == 0) goto lab4; /* call e_ending, line 136 */
535
+ if (ret < 0) return ret;
536
+ }
537
+ break;
538
+ case 4:
539
+ { int ret = r_R2(z);
540
+ if (ret == 0) goto lab4; /* call R2, line 139 */
541
+ if (ret < 0) return ret;
542
+ }
543
+ { int ret = slice_del(z); /* delete, line 139 */
544
+ if (ret < 0) return ret;
545
+ }
546
+ break;
547
+ case 5:
548
+ { int ret = r_R2(z);
549
+ if (ret == 0) goto lab4; /* call R2, line 142 */
550
+ if (ret < 0) return ret;
551
+ }
552
+ if (!(z->B[0])) goto lab4; /* Boolean test e_found, line 142 */
553
+ { int ret = slice_del(z); /* delete, line 142 */
554
+ if (ret < 0) return ret;
555
+ }
556
+ break;
557
+ }
558
+ lab4:
559
+ z->c = z->l - m5;
560
+ }
561
+ { int m9 = z->l - z->c; (void)m9; /* do, line 146 */
562
+ if (out_grouping_b(z, g_v_I, 73, 232, 0)) goto lab9;
563
+ { int m_test = z->l - z->c; /* test, line 148 */
564
+ if (z->c - 1 <= z->lb || z->p[z->c - 1] >> 5 != 3 || !((2129954 >> (z->p[z->c - 1] & 0x1f)) & 1)) goto lab9;
565
+ if (!(find_among_b(z, a_5, 4))) goto lab9; /* among, line 149 */
566
+ if (out_grouping_b(z, g_v, 97, 232, 0)) goto lab9;
567
+ z->c = z->l - m_test;
568
+ }
569
+ z->ket = z->c; /* [, line 152 */
570
+ if (z->c <= z->lb) goto lab9;
571
+ z->c--; /* next, line 152 */
572
+ z->bra = z->c; /* ], line 152 */
573
+ { int ret = slice_del(z); /* delete, line 152 */
574
+ if (ret < 0) return ret;
575
+ }
576
+ lab9:
577
+ z->c = z->l - m9;
578
+ }
579
+ return 1;
580
+ }
581
+
582
+ extern int dutch_ISO_8859_1_stem(struct SN_env * z) {
583
+ { int c1 = z->c; /* do, line 159 */
584
+ { int ret = r_prelude(z);
585
+ if (ret == 0) goto lab0; /* call prelude, line 159 */
586
+ if (ret < 0) return ret;
587
+ }
588
+ lab0:
589
+ z->c = c1;
590
+ }
591
+ { int c2 = z->c; /* do, line 160 */
592
+ { int ret = r_mark_regions(z);
593
+ if (ret == 0) goto lab1; /* call mark_regions, line 160 */
594
+ if (ret < 0) return ret;
595
+ }
596
+ lab1:
597
+ z->c = c2;
598
+ }
599
+ z->lb = z->c; z->c = z->l; /* backwards, line 161 */
600
+
601
+ { int m3 = z->l - z->c; (void)m3; /* do, line 162 */
602
+ { int ret = r_standard_suffix(z);
603
+ if (ret == 0) goto lab2; /* call standard_suffix, line 162 */
604
+ if (ret < 0) return ret;
605
+ }
606
+ lab2:
607
+ z->c = z->l - m3;
608
+ }
609
+ z->c = z->lb;
610
+ { int c4 = z->c; /* do, line 163 */
611
+ { int ret = r_postlude(z);
612
+ if (ret == 0) goto lab3; /* call postlude, line 163 */
613
+ if (ret < 0) return ret;
614
+ }
615
+ lab3:
616
+ z->c = c4;
617
+ }
618
+ return 1;
619
+ }
620
+
621
/*
 * Creates the environment used by dutch_ISO_8859_1_stem by forwarding to
 * SN_create_env(0, 2, 1).
 * NOTE(review): the arguments presumably size the string / integer / boolean
 * slot arrays (this file uses I[0], I[1] and B[0]) -- confirm against the
 * runtime's declaration of SN_create_env.
 */
extern struct SN_env * dutch_ISO_8859_1_create_env(void)
{
    return SN_create_env(0, 2, 1);
}
622
+
623
/*
 * Releases an environment obtained from dutch_ISO_8859_1_create_env by
 * forwarding to SN_close_env(z, 0).
 */
extern void dutch_ISO_8859_1_close_env(struct SN_env * z)
{
    SN_close_env(z, 0);
}
624
+
@@ -0,0 +1,16 @@
1
+
2
+ /* This file was generated automatically by the Snowball to ANSI C compiler */
3
+
4
+ #ifdef __cplusplus
5
+ extern "C" {
6
+ #endif
7
+
8
+ extern struct SN_env * dutch_ISO_8859_1_create_env(void);
9
+ extern void dutch_ISO_8859_1_close_env(struct SN_env * z);
10
+
11
+ extern int dutch_ISO_8859_1_stem(struct SN_env * z);
12
+
13
+ #ifdef __cplusplus
14
+ }
15
+ #endif
16
+