ruby-stemmer 0.9.3-x86-mingw32

Sign up to get free protection for your applications and to get access to all the features.
Files changed (97) hide show
  1. data/MIT-LICENSE +21 -0
  2. data/README.rdoc +113 -0
  3. data/Rakefile +70 -0
  4. data/TODO +0 -0
  5. data/VERSION +1 -0
  6. data/ext/lingua/extconf.rb +40 -0
  7. data/ext/lingua/stemmer.c +115 -0
  8. data/lib/lingua/1.8/stemmer_native.so +0 -0
  9. data/lib/lingua/1.9/stemmer_native.so +0 -0
  10. data/lib/lingua/stemmer.rb +60 -0
  11. data/libstemmer_c/MANIFEST +72 -0
  12. data/libstemmer_c/Makefile +9 -0
  13. data/libstemmer_c/Makefile.windows +15 -0
  14. data/libstemmer_c/README +125 -0
  15. data/libstemmer_c/examples/stemwords.c +209 -0
  16. data/libstemmer_c/include/libstemmer.h +79 -0
  17. data/libstemmer_c/libstemmer/libstemmer.c +93 -0
  18. data/libstemmer_c/libstemmer/libstemmer_utf8.c +93 -0
  19. data/libstemmer_c/libstemmer/modules.h +195 -0
  20. data/libstemmer_c/libstemmer/modules.txt +51 -0
  21. data/libstemmer_c/libstemmer/modules_utf8.h +123 -0
  22. data/libstemmer_c/libstemmer/modules_utf8.txt +50 -0
  23. data/libstemmer_c/mkinc.mak +86 -0
  24. data/libstemmer_c/mkinc_utf8.mak +54 -0
  25. data/libstemmer_c/runtime/api.c +66 -0
  26. data/libstemmer_c/runtime/api.h +26 -0
  27. data/libstemmer_c/runtime/header.h +58 -0
  28. data/libstemmer_c/runtime/utilities.c +478 -0
  29. data/libstemmer_c/src_c/stem_ISO_8859_1_danish.c +337 -0
  30. data/libstemmer_c/src_c/stem_ISO_8859_1_danish.h +16 -0
  31. data/libstemmer_c/src_c/stem_ISO_8859_1_dutch.c +624 -0
  32. data/libstemmer_c/src_c/stem_ISO_8859_1_dutch.h +16 -0
  33. data/libstemmer_c/src_c/stem_ISO_8859_1_english.c +1117 -0
  34. data/libstemmer_c/src_c/stem_ISO_8859_1_english.h +16 -0
  35. data/libstemmer_c/src_c/stem_ISO_8859_1_finnish.c +762 -0
  36. data/libstemmer_c/src_c/stem_ISO_8859_1_finnish.h +16 -0
  37. data/libstemmer_c/src_c/stem_ISO_8859_1_french.c +1246 -0
  38. data/libstemmer_c/src_c/stem_ISO_8859_1_french.h +16 -0
  39. data/libstemmer_c/src_c/stem_ISO_8859_1_german.c +503 -0
  40. data/libstemmer_c/src_c/stem_ISO_8859_1_german.h +16 -0
  41. data/libstemmer_c/src_c/stem_ISO_8859_1_hungarian.c +1230 -0
  42. data/libstemmer_c/src_c/stem_ISO_8859_1_hungarian.h +16 -0
  43. data/libstemmer_c/src_c/stem_ISO_8859_1_italian.c +1065 -0
  44. data/libstemmer_c/src_c/stem_ISO_8859_1_italian.h +16 -0
  45. data/libstemmer_c/src_c/stem_ISO_8859_1_latin.c +443 -0
  46. data/libstemmer_c/src_c/stem_ISO_8859_1_latin.h +16 -0
  47. data/libstemmer_c/src_c/stem_ISO_8859_1_norwegian.c +297 -0
  48. data/libstemmer_c/src_c/stem_ISO_8859_1_norwegian.h +16 -0
  49. data/libstemmer_c/src_c/stem_ISO_8859_1_porter.c +749 -0
  50. data/libstemmer_c/src_c/stem_ISO_8859_1_porter.h +16 -0
  51. data/libstemmer_c/src_c/stem_ISO_8859_1_portuguese.c +1017 -0
  52. data/libstemmer_c/src_c/stem_ISO_8859_1_portuguese.h +16 -0
  53. data/libstemmer_c/src_c/stem_ISO_8859_1_spanish.c +1093 -0
  54. data/libstemmer_c/src_c/stem_ISO_8859_1_spanish.h +16 -0
  55. data/libstemmer_c/src_c/stem_ISO_8859_1_swedish.c +307 -0
  56. data/libstemmer_c/src_c/stem_ISO_8859_1_swedish.h +16 -0
  57. data/libstemmer_c/src_c/stem_ISO_8859_2_romanian.c +998 -0
  58. data/libstemmer_c/src_c/stem_ISO_8859_2_romanian.h +16 -0
  59. data/libstemmer_c/src_c/stem_KOI8_R_russian.c +700 -0
  60. data/libstemmer_c/src_c/stem_KOI8_R_russian.h +16 -0
  61. data/libstemmer_c/src_c/stem_UTF_8_danish.c +339 -0
  62. data/libstemmer_c/src_c/stem_UTF_8_danish.h +16 -0
  63. data/libstemmer_c/src_c/stem_UTF_8_dutch.c +634 -0
  64. data/libstemmer_c/src_c/stem_UTF_8_dutch.h +16 -0
  65. data/libstemmer_c/src_c/stem_UTF_8_english.c +1125 -0
  66. data/libstemmer_c/src_c/stem_UTF_8_english.h +16 -0
  67. data/libstemmer_c/src_c/stem_UTF_8_finnish.c +768 -0
  68. data/libstemmer_c/src_c/stem_UTF_8_finnish.h +16 -0
  69. data/libstemmer_c/src_c/stem_UTF_8_french.c +1256 -0
  70. data/libstemmer_c/src_c/stem_UTF_8_french.h +16 -0
  71. data/libstemmer_c/src_c/stem_UTF_8_german.c +509 -0
  72. data/libstemmer_c/src_c/stem_UTF_8_german.h +16 -0
  73. data/libstemmer_c/src_c/stem_UTF_8_hungarian.c +1234 -0
  74. data/libstemmer_c/src_c/stem_UTF_8_hungarian.h +16 -0
  75. data/libstemmer_c/src_c/stem_UTF_8_italian.c +1073 -0
  76. data/libstemmer_c/src_c/stem_UTF_8_italian.h +16 -0
  77. data/libstemmer_c/src_c/stem_UTF_8_latin.c +443 -0
  78. data/libstemmer_c/src_c/stem_UTF_8_latin.h +16 -0
  79. data/libstemmer_c/src_c/stem_UTF_8_norwegian.c +299 -0
  80. data/libstemmer_c/src_c/stem_UTF_8_norwegian.h +16 -0
  81. data/libstemmer_c/src_c/stem_UTF_8_porter.c +755 -0
  82. data/libstemmer_c/src_c/stem_UTF_8_porter.h +16 -0
  83. data/libstemmer_c/src_c/stem_UTF_8_portuguese.c +1023 -0
  84. data/libstemmer_c/src_c/stem_UTF_8_portuguese.h +16 -0
  85. data/libstemmer_c/src_c/stem_UTF_8_romanian.c +1004 -0
  86. data/libstemmer_c/src_c/stem_UTF_8_romanian.h +16 -0
  87. data/libstemmer_c/src_c/stem_UTF_8_russian.c +694 -0
  88. data/libstemmer_c/src_c/stem_UTF_8_russian.h +16 -0
  89. data/libstemmer_c/src_c/stem_UTF_8_spanish.c +1097 -0
  90. data/libstemmer_c/src_c/stem_UTF_8_spanish.h +16 -0
  91. data/libstemmer_c/src_c/stem_UTF_8_swedish.c +309 -0
  92. data/libstemmer_c/src_c/stem_UTF_8_swedish.h +16 -0
  93. data/libstemmer_c/src_c/stem_UTF_8_turkish.c +2205 -0
  94. data/libstemmer_c/src_c/stem_UTF_8_turkish.h +16 -0
  95. data/test/helper.rb +3 -0
  96. data/test/lingua/test_stemmer.rb +99 -0
  97. metadata +162 -0
@@ -0,0 +1,16 @@
1
+
2
+ /* This file was generated automatically by the Snowball to ANSI C compiler */
3
+
4
+ #ifdef __cplusplus
5
+ extern "C" {
6
+ #endif
7
+
8
+ extern struct SN_env * english_ISO_8859_1_create_env(void);
9
+ extern void english_ISO_8859_1_close_env(struct SN_env * z);
10
+
11
+ extern int english_ISO_8859_1_stem(struct SN_env * z);
12
+
13
+ #ifdef __cplusplus
14
+ }
15
+ #endif
16
+
@@ -0,0 +1,762 @@
1
+
2
+ /* This file was generated automatically by the Snowball to ANSI C compiler */
3
+
4
+ #include "../runtime/header.h"
5
+
6
+ #ifdef __cplusplus
7
+ extern "C" {
8
+ #endif
9
+ extern int finnish_ISO_8859_1_stem(struct SN_env * z);
10
+ #ifdef __cplusplus
11
+ }
12
+ #endif
13
+ static int r_tidy(struct SN_env * z);
14
+ static int r_other_endings(struct SN_env * z);
15
+ static int r_t_plural(struct SN_env * z);
16
+ static int r_i_plural(struct SN_env * z);
17
+ static int r_case_ending(struct SN_env * z);
18
+ static int r_VI(struct SN_env * z);
19
+ static int r_LONG(struct SN_env * z);
20
+ static int r_possessive(struct SN_env * z);
21
+ static int r_particle_etc(struct SN_env * z);
22
+ static int r_R2(struct SN_env * z);
23
+ static int r_mark_regions(struct SN_env * z);
24
+ #ifdef __cplusplus
25
+ extern "C" {
26
+ #endif
27
+
28
+
29
+ extern struct SN_env * finnish_ISO_8859_1_create_env(void);
30
+ extern void finnish_ISO_8859_1_close_env(struct SN_env * z);
31
+
32
+
33
+ #ifdef __cplusplus
34
+ }
35
+ #endif
36
+ static const symbol s_0_0[2] = { 'p', 'a' };
37
+ static const symbol s_0_1[3] = { 's', 't', 'i' };
38
+ static const symbol s_0_2[4] = { 'k', 'a', 'a', 'n' };
39
+ static const symbol s_0_3[3] = { 'h', 'a', 'n' };
40
+ static const symbol s_0_4[3] = { 'k', 'i', 'n' };
41
+ static const symbol s_0_5[3] = { 'h', 0xE4, 'n' };
42
+ static const symbol s_0_6[4] = { 'k', 0xE4, 0xE4, 'n' };
43
+ static const symbol s_0_7[2] = { 'k', 'o' };
44
+ static const symbol s_0_8[2] = { 'p', 0xE4 };
45
+ static const symbol s_0_9[2] = { 'k', 0xF6 };
46
+
47
+ static const struct among a_0[10] =
48
+ {
49
+ /* 0 */ { 2, s_0_0, -1, 1, 0},
50
+ /* 1 */ { 3, s_0_1, -1, 2, 0},
51
+ /* 2 */ { 4, s_0_2, -1, 1, 0},
52
+ /* 3 */ { 3, s_0_3, -1, 1, 0},
53
+ /* 4 */ { 3, s_0_4, -1, 1, 0},
54
+ /* 5 */ { 3, s_0_5, -1, 1, 0},
55
+ /* 6 */ { 4, s_0_6, -1, 1, 0},
56
+ /* 7 */ { 2, s_0_7, -1, 1, 0},
57
+ /* 8 */ { 2, s_0_8, -1, 1, 0},
58
+ /* 9 */ { 2, s_0_9, -1, 1, 0}
59
+ };
60
+
61
+ static const symbol s_1_0[3] = { 'l', 'l', 'a' };
62
+ static const symbol s_1_1[2] = { 'n', 'a' };
63
+ static const symbol s_1_2[3] = { 's', 's', 'a' };
64
+ static const symbol s_1_3[2] = { 't', 'a' };
65
+ static const symbol s_1_4[3] = { 'l', 't', 'a' };
66
+ static const symbol s_1_5[3] = { 's', 't', 'a' };
67
+
68
+ static const struct among a_1[6] =
69
+ {
70
+ /* 0 */ { 3, s_1_0, -1, -1, 0},
71
+ /* 1 */ { 2, s_1_1, -1, -1, 0},
72
+ /* 2 */ { 3, s_1_2, -1, -1, 0},
73
+ /* 3 */ { 2, s_1_3, -1, -1, 0},
74
+ /* 4 */ { 3, s_1_4, 3, -1, 0},
75
+ /* 5 */ { 3, s_1_5, 3, -1, 0}
76
+ };
77
+
78
+ static const symbol s_2_0[3] = { 'l', 'l', 0xE4 };
79
+ static const symbol s_2_1[2] = { 'n', 0xE4 };
80
+ static const symbol s_2_2[3] = { 's', 's', 0xE4 };
81
+ static const symbol s_2_3[2] = { 't', 0xE4 };
82
+ static const symbol s_2_4[3] = { 'l', 't', 0xE4 };
83
+ static const symbol s_2_5[3] = { 's', 't', 0xE4 };
84
+
85
+ static const struct among a_2[6] =
86
+ {
87
+ /* 0 */ { 3, s_2_0, -1, -1, 0},
88
+ /* 1 */ { 2, s_2_1, -1, -1, 0},
89
+ /* 2 */ { 3, s_2_2, -1, -1, 0},
90
+ /* 3 */ { 2, s_2_3, -1, -1, 0},
91
+ /* 4 */ { 3, s_2_4, 3, -1, 0},
92
+ /* 5 */ { 3, s_2_5, 3, -1, 0}
93
+ };
94
+
95
+ static const symbol s_3_0[3] = { 'l', 'l', 'e' };
96
+ static const symbol s_3_1[3] = { 'i', 'n', 'e' };
97
+
98
+ static const struct among a_3[2] =
99
+ {
100
+ /* 0 */ { 3, s_3_0, -1, -1, 0},
101
+ /* 1 */ { 3, s_3_1, -1, -1, 0}
102
+ };
103
+
104
+ static const symbol s_4_0[3] = { 'n', 's', 'a' };
105
+ static const symbol s_4_1[3] = { 'm', 'm', 'e' };
106
+ static const symbol s_4_2[3] = { 'n', 'n', 'e' };
107
+ static const symbol s_4_3[2] = { 'n', 'i' };
108
+ static const symbol s_4_4[2] = { 's', 'i' };
109
+ static const symbol s_4_5[2] = { 'a', 'n' };
110
+ static const symbol s_4_6[2] = { 'e', 'n' };
111
+ static const symbol s_4_7[2] = { 0xE4, 'n' };
112
+ static const symbol s_4_8[3] = { 'n', 's', 0xE4 };
113
+
114
+ static const struct among a_4[9] =
115
+ {
116
+ /* 0 */ { 3, s_4_0, -1, 3, 0},
117
+ /* 1 */ { 3, s_4_1, -1, 3, 0},
118
+ /* 2 */ { 3, s_4_2, -1, 3, 0},
119
+ /* 3 */ { 2, s_4_3, -1, 2, 0},
120
+ /* 4 */ { 2, s_4_4, -1, 1, 0},
121
+ /* 5 */ { 2, s_4_5, -1, 4, 0},
122
+ /* 6 */ { 2, s_4_6, -1, 6, 0},
123
+ /* 7 */ { 2, s_4_7, -1, 5, 0},
124
+ /* 8 */ { 3, s_4_8, -1, 3, 0}
125
+ };
126
+
127
+ static const symbol s_5_0[2] = { 'a', 'a' };
128
+ static const symbol s_5_1[2] = { 'e', 'e' };
129
+ static const symbol s_5_2[2] = { 'i', 'i' };
130
+ static const symbol s_5_3[2] = { 'o', 'o' };
131
+ static const symbol s_5_4[2] = { 'u', 'u' };
132
+ static const symbol s_5_5[2] = { 0xE4, 0xE4 };
133
+ static const symbol s_5_6[2] = { 0xF6, 0xF6 };
134
+
135
+ static const struct among a_5[7] =
136
+ {
137
+ /* 0 */ { 2, s_5_0, -1, -1, 0},
138
+ /* 1 */ { 2, s_5_1, -1, -1, 0},
139
+ /* 2 */ { 2, s_5_2, -1, -1, 0},
140
+ /* 3 */ { 2, s_5_3, -1, -1, 0},
141
+ /* 4 */ { 2, s_5_4, -1, -1, 0},
142
+ /* 5 */ { 2, s_5_5, -1, -1, 0},
143
+ /* 6 */ { 2, s_5_6, -1, -1, 0}
144
+ };
145
+
146
+ static const symbol s_6_0[1] = { 'a' };
147
+ static const symbol s_6_1[3] = { 'l', 'l', 'a' };
148
+ static const symbol s_6_2[2] = { 'n', 'a' };
149
+ static const symbol s_6_3[3] = { 's', 's', 'a' };
150
+ static const symbol s_6_4[2] = { 't', 'a' };
151
+ static const symbol s_6_5[3] = { 'l', 't', 'a' };
152
+ static const symbol s_6_6[3] = { 's', 't', 'a' };
153
+ static const symbol s_6_7[3] = { 't', 't', 'a' };
154
+ static const symbol s_6_8[3] = { 'l', 'l', 'e' };
155
+ static const symbol s_6_9[3] = { 'i', 'n', 'e' };
156
+ static const symbol s_6_10[3] = { 'k', 's', 'i' };
157
+ static const symbol s_6_11[1] = { 'n' };
158
+ static const symbol s_6_12[3] = { 'h', 'a', 'n' };
159
+ static const symbol s_6_13[3] = { 'd', 'e', 'n' };
160
+ static const symbol s_6_14[4] = { 's', 'e', 'e', 'n' };
161
+ static const symbol s_6_15[3] = { 'h', 'e', 'n' };
162
+ static const symbol s_6_16[4] = { 't', 't', 'e', 'n' };
163
+ static const symbol s_6_17[3] = { 'h', 'i', 'n' };
164
+ static const symbol s_6_18[4] = { 's', 'i', 'i', 'n' };
165
+ static const symbol s_6_19[3] = { 'h', 'o', 'n' };
166
+ static const symbol s_6_20[3] = { 'h', 0xE4, 'n' };
167
+ static const symbol s_6_21[3] = { 'h', 0xF6, 'n' };
168
+ static const symbol s_6_22[1] = { 0xE4 };
169
+ static const symbol s_6_23[3] = { 'l', 'l', 0xE4 };
170
+ static const symbol s_6_24[2] = { 'n', 0xE4 };
171
+ static const symbol s_6_25[3] = { 's', 's', 0xE4 };
172
+ static const symbol s_6_26[2] = { 't', 0xE4 };
173
+ static const symbol s_6_27[3] = { 'l', 't', 0xE4 };
174
+ static const symbol s_6_28[3] = { 's', 't', 0xE4 };
175
+ static const symbol s_6_29[3] = { 't', 't', 0xE4 };
176
+
177
+ static const struct among a_6[30] =
178
+ {
179
+ /* 0 */ { 1, s_6_0, -1, 8, 0},
180
+ /* 1 */ { 3, s_6_1, 0, -1, 0},
181
+ /* 2 */ { 2, s_6_2, 0, -1, 0},
182
+ /* 3 */ { 3, s_6_3, 0, -1, 0},
183
+ /* 4 */ { 2, s_6_4, 0, -1, 0},
184
+ /* 5 */ { 3, s_6_5, 4, -1, 0},
185
+ /* 6 */ { 3, s_6_6, 4, -1, 0},
186
+ /* 7 */ { 3, s_6_7, 4, 9, 0},
187
+ /* 8 */ { 3, s_6_8, -1, -1, 0},
188
+ /* 9 */ { 3, s_6_9, -1, -1, 0},
189
+ /* 10 */ { 3, s_6_10, -1, -1, 0},
190
+ /* 11 */ { 1, s_6_11, -1, 7, 0},
191
+ /* 12 */ { 3, s_6_12, 11, 1, 0},
192
+ /* 13 */ { 3, s_6_13, 11, -1, r_VI},
193
+ /* 14 */ { 4, s_6_14, 11, -1, r_LONG},
194
+ /* 15 */ { 3, s_6_15, 11, 2, 0},
195
+ /* 16 */ { 4, s_6_16, 11, -1, r_VI},
196
+ /* 17 */ { 3, s_6_17, 11, 3, 0},
197
+ /* 18 */ { 4, s_6_18, 11, -1, r_VI},
198
+ /* 19 */ { 3, s_6_19, 11, 4, 0},
199
+ /* 20 */ { 3, s_6_20, 11, 5, 0},
200
+ /* 21 */ { 3, s_6_21, 11, 6, 0},
201
+ /* 22 */ { 1, s_6_22, -1, 8, 0},
202
+ /* 23 */ { 3, s_6_23, 22, -1, 0},
203
+ /* 24 */ { 2, s_6_24, 22, -1, 0},
204
+ /* 25 */ { 3, s_6_25, 22, -1, 0},
205
+ /* 26 */ { 2, s_6_26, 22, -1, 0},
206
+ /* 27 */ { 3, s_6_27, 26, -1, 0},
207
+ /* 28 */ { 3, s_6_28, 26, -1, 0},
208
+ /* 29 */ { 3, s_6_29, 26, 9, 0}
209
+ };
210
+
211
+ static const symbol s_7_0[3] = { 'e', 'j', 'a' };
212
+ static const symbol s_7_1[3] = { 'm', 'm', 'a' };
213
+ static const symbol s_7_2[4] = { 'i', 'm', 'm', 'a' };
214
+ static const symbol s_7_3[3] = { 'm', 'p', 'a' };
215
+ static const symbol s_7_4[4] = { 'i', 'm', 'p', 'a' };
216
+ static const symbol s_7_5[3] = { 'm', 'm', 'i' };
217
+ static const symbol s_7_6[4] = { 'i', 'm', 'm', 'i' };
218
+ static const symbol s_7_7[3] = { 'm', 'p', 'i' };
219
+ static const symbol s_7_8[4] = { 'i', 'm', 'p', 'i' };
220
+ static const symbol s_7_9[3] = { 'e', 'j', 0xE4 };
221
+ static const symbol s_7_10[3] = { 'm', 'm', 0xE4 };
222
+ static const symbol s_7_11[4] = { 'i', 'm', 'm', 0xE4 };
223
+ static const symbol s_7_12[3] = { 'm', 'p', 0xE4 };
224
+ static const symbol s_7_13[4] = { 'i', 'm', 'p', 0xE4 };
225
+
226
+ static const struct among a_7[14] =
227
+ {
228
+ /* 0 */ { 3, s_7_0, -1, -1, 0},
229
+ /* 1 */ { 3, s_7_1, -1, 1, 0},
230
+ /* 2 */ { 4, s_7_2, 1, -1, 0},
231
+ /* 3 */ { 3, s_7_3, -1, 1, 0},
232
+ /* 4 */ { 4, s_7_4, 3, -1, 0},
233
+ /* 5 */ { 3, s_7_5, -1, 1, 0},
234
+ /* 6 */ { 4, s_7_6, 5, -1, 0},
235
+ /* 7 */ { 3, s_7_7, -1, 1, 0},
236
+ /* 8 */ { 4, s_7_8, 7, -1, 0},
237
+ /* 9 */ { 3, s_7_9, -1, -1, 0},
238
+ /* 10 */ { 3, s_7_10, -1, 1, 0},
239
+ /* 11 */ { 4, s_7_11, 10, -1, 0},
240
+ /* 12 */ { 3, s_7_12, -1, 1, 0},
241
+ /* 13 */ { 4, s_7_13, 12, -1, 0}
242
+ };
243
+
244
+ static const symbol s_8_0[1] = { 'i' };
245
+ static const symbol s_8_1[1] = { 'j' };
246
+
247
+ static const struct among a_8[2] =
248
+ {
249
+ /* 0 */ { 1, s_8_0, -1, -1, 0},
250
+ /* 1 */ { 1, s_8_1, -1, -1, 0}
251
+ };
252
+
253
+ static const symbol s_9_0[3] = { 'm', 'm', 'a' };
254
+ static const symbol s_9_1[4] = { 'i', 'm', 'm', 'a' };
255
+
256
+ static const struct among a_9[2] =
257
+ {
258
+ /* 0 */ { 3, s_9_0, -1, 1, 0},
259
+ /* 1 */ { 4, s_9_1, 0, -1, 0}
260
+ };
261
+
262
+ static const unsigned char g_AEI[] = { 17, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 8 };
263
+
264
+ static const unsigned char g_V1[] = { 17, 65, 16, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 8, 0, 32 };
265
+
266
+ static const unsigned char g_V2[] = { 17, 65, 16, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 8, 0, 32 };
267
+
268
+ static const unsigned char g_particle_end[] = { 17, 97, 24, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 8, 0, 32 };
269
+
270
+ static const symbol s_0[] = { 'k' };
271
+ static const symbol s_1[] = { 'k', 's', 'e' };
272
+ static const symbol s_2[] = { 'k', 's', 'i' };
273
+ static const symbol s_3[] = { 'i' };
274
+ static const symbol s_4[] = { 'a' };
275
+ static const symbol s_5[] = { 'e' };
276
+ static const symbol s_6[] = { 'i' };
277
+ static const symbol s_7[] = { 'o' };
278
+ static const symbol s_8[] = { 0xE4 };
279
+ static const symbol s_9[] = { 0xF6 };
280
+ static const symbol s_10[] = { 'i', 'e' };
281
+ static const symbol s_11[] = { 'e' };
282
+ static const symbol s_12[] = { 'p', 'o' };
283
+ static const symbol s_13[] = { 't' };
284
+ static const symbol s_14[] = { 'p', 'o' };
285
+ static const symbol s_15[] = { 'j' };
286
+ static const symbol s_16[] = { 'o' };
287
+ static const symbol s_17[] = { 'u' };
288
+ static const symbol s_18[] = { 'o' };
289
+ static const symbol s_19[] = { 'j' };
290
+
291
+ static int r_mark_regions(struct SN_env * z) {
292
+ z->I[0] = z->l;
293
+ z->I[1] = z->l;
294
+ if (out_grouping(z, g_V1, 97, 246, 1) < 0) return 0; /* goto */ /* grouping V1, line 46 */
295
+ { /* gopast */ /* non V1, line 46 */
296
+ int ret = in_grouping(z, g_V1, 97, 246, 1);
297
+ if (ret < 0) return 0;
298
+ z->c += ret;
299
+ }
300
+ z->I[0] = z->c; /* setmark p1, line 46 */
301
+ if (out_grouping(z, g_V1, 97, 246, 1) < 0) return 0; /* goto */ /* grouping V1, line 47 */
302
+ { /* gopast */ /* non V1, line 47 */
303
+ int ret = in_grouping(z, g_V1, 97, 246, 1);
304
+ if (ret < 0) return 0;
305
+ z->c += ret;
306
+ }
307
+ z->I[1] = z->c; /* setmark p2, line 47 */
308
+ return 1;
309
+ }
310
+
311
+ static int r_R2(struct SN_env * z) {
312
+ if (!(z->I[1] <= z->c)) return 0;
313
+ return 1;
314
+ }
315
+
316
+ static int r_particle_etc(struct SN_env * z) {
317
+ int among_var;
318
+ { int mlimit; /* setlimit, line 55 */
319
+ int m1 = z->l - z->c; (void)m1;
320
+ if (z->c < z->I[0]) return 0;
321
+ z->c = z->I[0]; /* tomark, line 55 */
322
+ mlimit = z->lb; z->lb = z->c;
323
+ z->c = z->l - m1;
324
+ z->ket = z->c; /* [, line 55 */
325
+ among_var = find_among_b(z, a_0, 10); /* substring, line 55 */
326
+ if (!(among_var)) { z->lb = mlimit; return 0; }
327
+ z->bra = z->c; /* ], line 55 */
328
+ z->lb = mlimit;
329
+ }
330
+ switch(among_var) {
331
+ case 0: return 0;
332
+ case 1:
333
+ if (in_grouping_b(z, g_particle_end, 97, 246, 0)) return 0;
334
+ break;
335
+ case 2:
336
+ { int ret = r_R2(z);
337
+ if (ret == 0) return 0; /* call R2, line 64 */
338
+ if (ret < 0) return ret;
339
+ }
340
+ break;
341
+ }
342
+ { int ret = slice_del(z); /* delete, line 66 */
343
+ if (ret < 0) return ret;
344
+ }
345
+ return 1;
346
+ }
347
+
348
+ static int r_possessive(struct SN_env * z) {
349
+ int among_var;
350
+ { int mlimit; /* setlimit, line 69 */
351
+ int m1 = z->l - z->c; (void)m1;
352
+ if (z->c < z->I[0]) return 0;
353
+ z->c = z->I[0]; /* tomark, line 69 */
354
+ mlimit = z->lb; z->lb = z->c;
355
+ z->c = z->l - m1;
356
+ z->ket = z->c; /* [, line 69 */
357
+ among_var = find_among_b(z, a_4, 9); /* substring, line 69 */
358
+ if (!(among_var)) { z->lb = mlimit; return 0; }
359
+ z->bra = z->c; /* ], line 69 */
360
+ z->lb = mlimit;
361
+ }
362
+ switch(among_var) {
363
+ case 0: return 0;
364
+ case 1:
365
+ { int m2 = z->l - z->c; (void)m2; /* not, line 72 */
366
+ if (!(eq_s_b(z, 1, s_0))) goto lab0;
367
+ return 0;
368
+ lab0:
369
+ z->c = z->l - m2;
370
+ }
371
+ { int ret = slice_del(z); /* delete, line 72 */
372
+ if (ret < 0) return ret;
373
+ }
374
+ break;
375
+ case 2:
376
+ { int ret = slice_del(z); /* delete, line 74 */
377
+ if (ret < 0) return ret;
378
+ }
379
+ z->ket = z->c; /* [, line 74 */
380
+ if (!(eq_s_b(z, 3, s_1))) return 0;
381
+ z->bra = z->c; /* ], line 74 */
382
+ { int ret = slice_from_s(z, 3, s_2); /* <-, line 74 */
383
+ if (ret < 0) return ret;
384
+ }
385
+ break;
386
+ case 3:
387
+ { int ret = slice_del(z); /* delete, line 78 */
388
+ if (ret < 0) return ret;
389
+ }
390
+ break;
391
+ case 4:
392
+ if (z->c - 1 <= z->lb || z->p[z->c - 1] != 97) return 0;
393
+ if (!(find_among_b(z, a_1, 6))) return 0; /* among, line 81 */
394
+ { int ret = slice_del(z); /* delete, line 81 */
395
+ if (ret < 0) return ret;
396
+ }
397
+ break;
398
+ case 5:
399
+ if (z->c - 1 <= z->lb || z->p[z->c - 1] != 228) return 0;
400
+ if (!(find_among_b(z, a_2, 6))) return 0; /* among, line 83 */
401
+ { int ret = slice_del(z); /* delete, line 84 */
402
+ if (ret < 0) return ret;
403
+ }
404
+ break;
405
+ case 6:
406
+ if (z->c - 2 <= z->lb || z->p[z->c - 1] != 101) return 0;
407
+ if (!(find_among_b(z, a_3, 2))) return 0; /* among, line 86 */
408
+ { int ret = slice_del(z); /* delete, line 86 */
409
+ if (ret < 0) return ret;
410
+ }
411
+ break;
412
+ }
413
+ return 1;
414
+ }
415
+
416
+ static int r_LONG(struct SN_env * z) {
417
+ if (!(find_among_b(z, a_5, 7))) return 0; /* among, line 91 */
418
+ return 1;
419
+ }
420
+
421
+ static int r_VI(struct SN_env * z) {
422
+ if (!(eq_s_b(z, 1, s_3))) return 0;
423
+ if (in_grouping_b(z, g_V2, 97, 246, 0)) return 0;
424
+ return 1;
425
+ }
426
+
427
+ static int r_case_ending(struct SN_env * z) {
428
+ int among_var;
429
+ { int mlimit; /* setlimit, line 96 */
430
+ int m1 = z->l - z->c; (void)m1;
431
+ if (z->c < z->I[0]) return 0;
432
+ z->c = z->I[0]; /* tomark, line 96 */
433
+ mlimit = z->lb; z->lb = z->c;
434
+ z->c = z->l - m1;
435
+ z->ket = z->c; /* [, line 96 */
436
+ among_var = find_among_b(z, a_6, 30); /* substring, line 96 */
437
+ if (!(among_var)) { z->lb = mlimit; return 0; }
438
+ z->bra = z->c; /* ], line 96 */
439
+ z->lb = mlimit;
440
+ }
441
+ switch(among_var) {
442
+ case 0: return 0;
443
+ case 1:
444
+ if (!(eq_s_b(z, 1, s_4))) return 0;
445
+ break;
446
+ case 2:
447
+ if (!(eq_s_b(z, 1, s_5))) return 0;
448
+ break;
449
+ case 3:
450
+ if (!(eq_s_b(z, 1, s_6))) return 0;
451
+ break;
452
+ case 4:
453
+ if (!(eq_s_b(z, 1, s_7))) return 0;
454
+ break;
455
+ case 5:
456
+ if (!(eq_s_b(z, 1, s_8))) return 0;
457
+ break;
458
+ case 6:
459
+ if (!(eq_s_b(z, 1, s_9))) return 0;
460
+ break;
461
+ case 7:
462
+ { int m_keep = z->l - z->c;/* (void) m_keep;*/ /* try, line 111 */
463
+ { int m2 = z->l - z->c; (void)m2; /* and, line 113 */
464
+ { int m3 = z->l - z->c; (void)m3; /* or, line 112 */
465
+ { int ret = r_LONG(z);
466
+ if (ret == 0) goto lab2; /* call LONG, line 111 */
467
+ if (ret < 0) return ret;
468
+ }
469
+ goto lab1;
470
+ lab2:
471
+ z->c = z->l - m3;
472
+ if (!(eq_s_b(z, 2, s_10))) { z->c = z->l - m_keep; goto lab0; }
473
+ }
474
+ lab1:
475
+ z->c = z->l - m2;
476
+ if (z->c <= z->lb) { z->c = z->l - m_keep; goto lab0; }
477
+ z->c--; /* next, line 113 */
478
+ }
479
+ z->bra = z->c; /* ], line 113 */
480
+ lab0:
481
+ ;
482
+ }
483
+ break;
484
+ case 8:
485
+ if (in_grouping_b(z, g_V1, 97, 246, 0)) return 0;
486
+ if (out_grouping_b(z, g_V1, 97, 246, 0)) return 0;
487
+ break;
488
+ case 9:
489
+ if (!(eq_s_b(z, 1, s_11))) return 0;
490
+ break;
491
+ }
492
+ { int ret = slice_del(z); /* delete, line 138 */
493
+ if (ret < 0) return ret;
494
+ }
495
+ z->B[0] = 1; /* set ending_removed, line 139 */
496
+ return 1;
497
+ }
498
+
499
+ static int r_other_endings(struct SN_env * z) {
500
+ int among_var;
501
+ { int mlimit; /* setlimit, line 142 */
502
+ int m1 = z->l - z->c; (void)m1;
503
+ if (z->c < z->I[1]) return 0;
504
+ z->c = z->I[1]; /* tomark, line 142 */
505
+ mlimit = z->lb; z->lb = z->c;
506
+ z->c = z->l - m1;
507
+ z->ket = z->c; /* [, line 142 */
508
+ among_var = find_among_b(z, a_7, 14); /* substring, line 142 */
509
+ if (!(among_var)) { z->lb = mlimit; return 0; }
510
+ z->bra = z->c; /* ], line 142 */
511
+ z->lb = mlimit;
512
+ }
513
+ switch(among_var) {
514
+ case 0: return 0;
515
+ case 1:
516
+ { int m2 = z->l - z->c; (void)m2; /* not, line 146 */
517
+ if (!(eq_s_b(z, 2, s_12))) goto lab0;
518
+ return 0;
519
+ lab0:
520
+ z->c = z->l - m2;
521
+ }
522
+ break;
523
+ }
524
+ { int ret = slice_del(z); /* delete, line 151 */
525
+ if (ret < 0) return ret;
526
+ }
527
+ return 1;
528
+ }
529
+
530
+ static int r_i_plural(struct SN_env * z) {
531
+ { int mlimit; /* setlimit, line 154 */
532
+ int m1 = z->l - z->c; (void)m1;
533
+ if (z->c < z->I[0]) return 0;
534
+ z->c = z->I[0]; /* tomark, line 154 */
535
+ mlimit = z->lb; z->lb = z->c;
536
+ z->c = z->l - m1;
537
+ z->ket = z->c; /* [, line 154 */
538
+ if (z->c <= z->lb || (z->p[z->c - 1] != 105 && z->p[z->c - 1] != 106)) { z->lb = mlimit; return 0; }
539
+ if (!(find_among_b(z, a_8, 2))) { z->lb = mlimit; return 0; } /* substring, line 154 */
540
+ z->bra = z->c; /* ], line 154 */
541
+ z->lb = mlimit;
542
+ }
543
+ { int ret = slice_del(z); /* delete, line 158 */
544
+ if (ret < 0) return ret;
545
+ }
546
+ return 1;
547
+ }
548
+
549
+ static int r_t_plural(struct SN_env * z) {
550
+ int among_var;
551
+ { int mlimit; /* setlimit, line 161 */
552
+ int m1 = z->l - z->c; (void)m1;
553
+ if (z->c < z->I[0]) return 0;
554
+ z->c = z->I[0]; /* tomark, line 161 */
555
+ mlimit = z->lb; z->lb = z->c;
556
+ z->c = z->l - m1;
557
+ z->ket = z->c; /* [, line 162 */
558
+ if (!(eq_s_b(z, 1, s_13))) { z->lb = mlimit; return 0; }
559
+ z->bra = z->c; /* ], line 162 */
560
+ { int m_test = z->l - z->c; /* test, line 162 */
561
+ if (in_grouping_b(z, g_V1, 97, 246, 0)) { z->lb = mlimit; return 0; }
562
+ z->c = z->l - m_test;
563
+ }
564
+ { int ret = slice_del(z); /* delete, line 163 */
565
+ if (ret < 0) return ret;
566
+ }
567
+ z->lb = mlimit;
568
+ }
569
+ { int mlimit; /* setlimit, line 165 */
570
+ int m2 = z->l - z->c; (void)m2;
571
+ if (z->c < z->I[1]) return 0;
572
+ z->c = z->I[1]; /* tomark, line 165 */
573
+ mlimit = z->lb; z->lb = z->c;
574
+ z->c = z->l - m2;
575
+ z->ket = z->c; /* [, line 165 */
576
+ if (z->c - 2 <= z->lb || z->p[z->c - 1] != 97) { z->lb = mlimit; return 0; }
577
+ among_var = find_among_b(z, a_9, 2); /* substring, line 165 */
578
+ if (!(among_var)) { z->lb = mlimit; return 0; }
579
+ z->bra = z->c; /* ], line 165 */
580
+ z->lb = mlimit;
581
+ }
582
+ switch(among_var) {
583
+ case 0: return 0;
584
+ case 1:
585
+ { int m3 = z->l - z->c; (void)m3; /* not, line 167 */
586
+ if (!(eq_s_b(z, 2, s_14))) goto lab0;
587
+ return 0;
588
+ lab0:
589
+ z->c = z->l - m3;
590
+ }
591
+ break;
592
+ }
593
+ { int ret = slice_del(z); /* delete, line 170 */
594
+ if (ret < 0) return ret;
595
+ }
596
+ return 1;
597
+ }
598
+
599
+ static int r_tidy(struct SN_env * z) {
600
+ { int mlimit; /* setlimit, line 173 */
601
+ int m1 = z->l - z->c; (void)m1;
602
+ if (z->c < z->I[0]) return 0;
603
+ z->c = z->I[0]; /* tomark, line 173 */
604
+ mlimit = z->lb; z->lb = z->c;
605
+ z->c = z->l - m1;
606
+ { int m2 = z->l - z->c; (void)m2; /* do, line 174 */
607
+ { int m3 = z->l - z->c; (void)m3; /* and, line 174 */
608
+ { int ret = r_LONG(z);
609
+ if (ret == 0) goto lab0; /* call LONG, line 174 */
610
+ if (ret < 0) return ret;
611
+ }
612
+ z->c = z->l - m3;
613
+ z->ket = z->c; /* [, line 174 */
614
+ if (z->c <= z->lb) goto lab0;
615
+ z->c--; /* next, line 174 */
616
+ z->bra = z->c; /* ], line 174 */
617
+ { int ret = slice_del(z); /* delete, line 174 */
618
+ if (ret < 0) return ret;
619
+ }
620
+ }
621
+ lab0:
622
+ z->c = z->l - m2;
623
+ }
624
+ { int m4 = z->l - z->c; (void)m4; /* do, line 175 */
625
+ z->ket = z->c; /* [, line 175 */
626
+ if (in_grouping_b(z, g_AEI, 97, 228, 0)) goto lab1;
627
+ z->bra = z->c; /* ], line 175 */
628
+ if (out_grouping_b(z, g_V1, 97, 246, 0)) goto lab1;
629
+ { int ret = slice_del(z); /* delete, line 175 */
630
+ if (ret < 0) return ret;
631
+ }
632
+ lab1:
633
+ z->c = z->l - m4;
634
+ }
635
+ { int m5 = z->l - z->c; (void)m5; /* do, line 176 */
636
+ z->ket = z->c; /* [, line 176 */
637
+ if (!(eq_s_b(z, 1, s_15))) goto lab2;
638
+ z->bra = z->c; /* ], line 176 */
639
+ { int m6 = z->l - z->c; (void)m6; /* or, line 176 */
640
+ if (!(eq_s_b(z, 1, s_16))) goto lab4;
641
+ goto lab3;
642
+ lab4:
643
+ z->c = z->l - m6;
644
+ if (!(eq_s_b(z, 1, s_17))) goto lab2;
645
+ }
646
+ lab3:
647
+ { int ret = slice_del(z); /* delete, line 176 */
648
+ if (ret < 0) return ret;
649
+ }
650
+ lab2:
651
+ z->c = z->l - m5;
652
+ }
653
+ { int m7 = z->l - z->c; (void)m7; /* do, line 177 */
654
+ z->ket = z->c; /* [, line 177 */
655
+ if (!(eq_s_b(z, 1, s_18))) goto lab5;
656
+ z->bra = z->c; /* ], line 177 */
657
+ if (!(eq_s_b(z, 1, s_19))) goto lab5;
658
+ { int ret = slice_del(z); /* delete, line 177 */
659
+ if (ret < 0) return ret;
660
+ }
661
+ lab5:
662
+ z->c = z->l - m7;
663
+ }
664
+ z->lb = mlimit;
665
+ }
666
+ if (in_grouping_b(z, g_V1, 97, 246, 1) < 0) return 0; /* goto */ /* non V1, line 179 */
667
+ z->ket = z->c; /* [, line 179 */
668
+ if (z->c <= z->lb) return 0;
669
+ z->c--; /* next, line 179 */
670
+ z->bra = z->c; /* ], line 179 */
671
+ z->S[0] = slice_to(z, z->S[0]); /* -> x, line 179 */
672
+ if (z->S[0] == 0) return -1; /* -> x, line 179 */
673
+ if (!(eq_v_b(z, z->S[0]))) return 0; /* name x, line 179 */
674
+ { int ret = slice_del(z); /* delete, line 179 */
675
+ if (ret < 0) return ret;
676
+ }
677
+ return 1;
678
+ }
679
+
680
+ extern int finnish_ISO_8859_1_stem(struct SN_env * z) {
681
+ { int c1 = z->c; /* do, line 185 */
682
+ { int ret = r_mark_regions(z);
683
+ if (ret == 0) goto lab0; /* call mark_regions, line 185 */
684
+ if (ret < 0) return ret;
685
+ }
686
+ lab0:
687
+ z->c = c1;
688
+ }
689
+ z->B[0] = 0; /* unset ending_removed, line 186 */
690
+ z->lb = z->c; z->c = z->l; /* backwards, line 187 */
691
+
692
+ { int m2 = z->l - z->c; (void)m2; /* do, line 188 */
693
+ { int ret = r_particle_etc(z);
694
+ if (ret == 0) goto lab1; /* call particle_etc, line 188 */
695
+ if (ret < 0) return ret;
696
+ }
697
+ lab1:
698
+ z->c = z->l - m2;
699
+ }
700
+ { int m3 = z->l - z->c; (void)m3; /* do, line 189 */
701
+ { int ret = r_possessive(z);
702
+ if (ret == 0) goto lab2; /* call possessive, line 189 */
703
+ if (ret < 0) return ret;
704
+ }
705
+ lab2:
706
+ z->c = z->l - m3;
707
+ }
708
+ { int m4 = z->l - z->c; (void)m4; /* do, line 190 */
709
+ { int ret = r_case_ending(z);
710
+ if (ret == 0) goto lab3; /* call case_ending, line 190 */
711
+ if (ret < 0) return ret;
712
+ }
713
+ lab3:
714
+ z->c = z->l - m4;
715
+ }
716
+ { int m5 = z->l - z->c; (void)m5; /* do, line 191 */
717
+ { int ret = r_other_endings(z);
718
+ if (ret == 0) goto lab4; /* call other_endings, line 191 */
719
+ if (ret < 0) return ret;
720
+ }
721
+ lab4:
722
+ z->c = z->l - m5;
723
+ }
724
+ { int m6 = z->l - z->c; (void)m6; /* or, line 192 */
725
+ if (!(z->B[0])) goto lab6; /* Boolean test ending_removed, line 192 */
726
+ { int m7 = z->l - z->c; (void)m7; /* do, line 192 */
727
+ { int ret = r_i_plural(z);
728
+ if (ret == 0) goto lab7; /* call i_plural, line 192 */
729
+ if (ret < 0) return ret;
730
+ }
731
+ lab7:
732
+ z->c = z->l - m7;
733
+ }
734
+ goto lab5;
735
+ lab6:
736
+ z->c = z->l - m6;
737
+ { int m8 = z->l - z->c; (void)m8; /* do, line 192 */
738
+ { int ret = r_t_plural(z);
739
+ if (ret == 0) goto lab8; /* call t_plural, line 192 */
740
+ if (ret < 0) return ret;
741
+ }
742
+ lab8:
743
+ z->c = z->l - m8;
744
+ }
745
+ }
746
+ lab5:
747
+ { int m9 = z->l - z->c; (void)m9; /* do, line 193 */
748
+ { int ret = r_tidy(z);
749
+ if (ret == 0) goto lab9; /* call tidy, line 193 */
750
+ if (ret < 0) return ret;
751
+ }
752
+ lab9:
753
+ z->c = z->l - m9;
754
+ }
755
+ z->c = z->lb;
756
+ return 1;
757
+ }
758
+
759
+ extern struct SN_env * finnish_ISO_8859_1_create_env(void) { return SN_create_env(1, 2, 1); }
760
+
761
+ extern void finnish_ISO_8859_1_close_env(struct SN_env * z) { SN_close_env(z, 1); }
762
+