ruby-stemmer-dimelo 0.9.3.dimelo1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (95) hide show
  1. checksums.yaml +7 -0
  2. data/MIT-LICENSE +21 -0
  3. data/README.rdoc +117 -0
  4. data/Rakefile +70 -0
  5. data/VERSION +1 -0
  6. data/ext/lingua/extconf.rb +40 -0
  7. data/ext/lingua/stemmer.c +115 -0
  8. data/lib/lingua/stemmer.rb +60 -0
  9. data/libstemmer_c/MANIFEST +72 -0
  10. data/libstemmer_c/Makefile +9 -0
  11. data/libstemmer_c/Makefile.windows +15 -0
  12. data/libstemmer_c/README +125 -0
  13. data/libstemmer_c/examples/stemwords.c +209 -0
  14. data/libstemmer_c/include/libstemmer.h +79 -0
  15. data/libstemmer_c/libstemmer/libstemmer.c +93 -0
  16. data/libstemmer_c/libstemmer/libstemmer_utf8.c +93 -0
  17. data/libstemmer_c/libstemmer/modules.h +195 -0
  18. data/libstemmer_c/libstemmer/modules.txt +51 -0
  19. data/libstemmer_c/libstemmer/modules_utf8.h +123 -0
  20. data/libstemmer_c/libstemmer/modules_utf8.txt +50 -0
  21. data/libstemmer_c/mkinc.mak +86 -0
  22. data/libstemmer_c/mkinc_utf8.mak +54 -0
  23. data/libstemmer_c/runtime/api.c +66 -0
  24. data/libstemmer_c/runtime/api.h +26 -0
  25. data/libstemmer_c/runtime/header.h +58 -0
  26. data/libstemmer_c/runtime/utilities.c +478 -0
  27. data/libstemmer_c/src_c/stem_ISO_8859_1_danish.c +337 -0
  28. data/libstemmer_c/src_c/stem_ISO_8859_1_danish.h +16 -0
  29. data/libstemmer_c/src_c/stem_ISO_8859_1_dutch.c +624 -0
  30. data/libstemmer_c/src_c/stem_ISO_8859_1_dutch.h +16 -0
  31. data/libstemmer_c/src_c/stem_ISO_8859_1_english.c +1117 -0
  32. data/libstemmer_c/src_c/stem_ISO_8859_1_english.h +16 -0
  33. data/libstemmer_c/src_c/stem_ISO_8859_1_finnish.c +762 -0
  34. data/libstemmer_c/src_c/stem_ISO_8859_1_finnish.h +16 -0
  35. data/libstemmer_c/src_c/stem_ISO_8859_1_french.c +1230 -0
  36. data/libstemmer_c/src_c/stem_ISO_8859_1_french.h +16 -0
  37. data/libstemmer_c/src_c/stem_ISO_8859_1_german.c +503 -0
  38. data/libstemmer_c/src_c/stem_ISO_8859_1_german.h +16 -0
  39. data/libstemmer_c/src_c/stem_ISO_8859_1_hungarian.c +1230 -0
  40. data/libstemmer_c/src_c/stem_ISO_8859_1_hungarian.h +16 -0
  41. data/libstemmer_c/src_c/stem_ISO_8859_1_italian.c +1065 -0
  42. data/libstemmer_c/src_c/stem_ISO_8859_1_italian.h +16 -0
  43. data/libstemmer_c/src_c/stem_ISO_8859_1_latin.c +443 -0
  44. data/libstemmer_c/src_c/stem_ISO_8859_1_latin.h +16 -0
  45. data/libstemmer_c/src_c/stem_ISO_8859_1_norwegian.c +297 -0
  46. data/libstemmer_c/src_c/stem_ISO_8859_1_norwegian.h +16 -0
  47. data/libstemmer_c/src_c/stem_ISO_8859_1_porter.c +749 -0
  48. data/libstemmer_c/src_c/stem_ISO_8859_1_porter.h +16 -0
  49. data/libstemmer_c/src_c/stem_ISO_8859_1_portuguese.c +1017 -0
  50. data/libstemmer_c/src_c/stem_ISO_8859_1_portuguese.h +16 -0
  51. data/libstemmer_c/src_c/stem_ISO_8859_1_spanish.c +1093 -0
  52. data/libstemmer_c/src_c/stem_ISO_8859_1_spanish.h +16 -0
  53. data/libstemmer_c/src_c/stem_ISO_8859_1_swedish.c +307 -0
  54. data/libstemmer_c/src_c/stem_ISO_8859_1_swedish.h +16 -0
  55. data/libstemmer_c/src_c/stem_ISO_8859_2_romanian.c +998 -0
  56. data/libstemmer_c/src_c/stem_ISO_8859_2_romanian.h +16 -0
  57. data/libstemmer_c/src_c/stem_KOI8_R_russian.c +700 -0
  58. data/libstemmer_c/src_c/stem_KOI8_R_russian.h +16 -0
  59. data/libstemmer_c/src_c/stem_UTF_8_danish.c +339 -0
  60. data/libstemmer_c/src_c/stem_UTF_8_danish.h +16 -0
  61. data/libstemmer_c/src_c/stem_UTF_8_dutch.c +634 -0
  62. data/libstemmer_c/src_c/stem_UTF_8_dutch.h +16 -0
  63. data/libstemmer_c/src_c/stem_UTF_8_english.c +1125 -0
  64. data/libstemmer_c/src_c/stem_UTF_8_english.h +16 -0
  65. data/libstemmer_c/src_c/stem_UTF_8_finnish.c +768 -0
  66. data/libstemmer_c/src_c/stem_UTF_8_finnish.h +16 -0
  67. data/libstemmer_c/src_c/stem_UTF_8_french.c +1230 -0
  68. data/libstemmer_c/src_c/stem_UTF_8_french.h +16 -0
  69. data/libstemmer_c/src_c/stem_UTF_8_german.c +509 -0
  70. data/libstemmer_c/src_c/stem_UTF_8_german.h +16 -0
  71. data/libstemmer_c/src_c/stem_UTF_8_hungarian.c +1234 -0
  72. data/libstemmer_c/src_c/stem_UTF_8_hungarian.h +16 -0
  73. data/libstemmer_c/src_c/stem_UTF_8_italian.c +1073 -0
  74. data/libstemmer_c/src_c/stem_UTF_8_italian.h +16 -0
  75. data/libstemmer_c/src_c/stem_UTF_8_latin.c +443 -0
  76. data/libstemmer_c/src_c/stem_UTF_8_latin.h +16 -0
  77. data/libstemmer_c/src_c/stem_UTF_8_norwegian.c +299 -0
  78. data/libstemmer_c/src_c/stem_UTF_8_norwegian.h +16 -0
  79. data/libstemmer_c/src_c/stem_UTF_8_porter.c +755 -0
  80. data/libstemmer_c/src_c/stem_UTF_8_porter.h +16 -0
  81. data/libstemmer_c/src_c/stem_UTF_8_portuguese.c +1023 -0
  82. data/libstemmer_c/src_c/stem_UTF_8_portuguese.h +16 -0
  83. data/libstemmer_c/src_c/stem_UTF_8_romanian.c +1004 -0
  84. data/libstemmer_c/src_c/stem_UTF_8_romanian.h +16 -0
  85. data/libstemmer_c/src_c/stem_UTF_8_russian.c +694 -0
  86. data/libstemmer_c/src_c/stem_UTF_8_russian.h +16 -0
  87. data/libstemmer_c/src_c/stem_UTF_8_spanish.c +1097 -0
  88. data/libstemmer_c/src_c/stem_UTF_8_spanish.h +16 -0
  89. data/libstemmer_c/src_c/stem_UTF_8_swedish.c +309 -0
  90. data/libstemmer_c/src_c/stem_UTF_8_swedish.h +16 -0
  91. data/libstemmer_c/src_c/stem_UTF_8_turkish.c +2205 -0
  92. data/libstemmer_c/src_c/stem_UTF_8_turkish.h +16 -0
  93. data/test/helper.rb +3 -0
  94. data/test/lingua/test_stemmer.rb +99 -0
  95. metadata +141 -0
@@ -0,0 +1,16 @@
1
+
2
+ /* This file was generated automatically by the Snowball to ANSI C compiler */
3
+
4
+ #ifdef __cplusplus
5
+ extern "C" {
6
+ #endif
7
+
8
+ extern struct SN_env * english_ISO_8859_1_create_env(void);
9
+ extern void english_ISO_8859_1_close_env(struct SN_env * z);
10
+
11
+ extern int english_ISO_8859_1_stem(struct SN_env * z);
12
+
13
+ #ifdef __cplusplus
14
+ }
15
+ #endif
16
+
@@ -0,0 +1,762 @@
1
+
2
+ /* This file was generated automatically by the Snowball to ANSI C compiler */
3
+
4
+ #include "../runtime/header.h"
5
+
6
+ #ifdef __cplusplus
7
+ extern "C" {
8
+ #endif
9
+ extern int finnish_ISO_8859_1_stem(struct SN_env * z);
10
+ #ifdef __cplusplus
11
+ }
12
+ #endif
13
+ static int r_tidy(struct SN_env * z);
14
+ static int r_other_endings(struct SN_env * z);
15
+ static int r_t_plural(struct SN_env * z);
16
+ static int r_i_plural(struct SN_env * z);
17
+ static int r_case_ending(struct SN_env * z);
18
+ static int r_VI(struct SN_env * z);
19
+ static int r_LONG(struct SN_env * z);
20
+ static int r_possessive(struct SN_env * z);
21
+ static int r_particle_etc(struct SN_env * z);
22
+ static int r_R2(struct SN_env * z);
23
+ static int r_mark_regions(struct SN_env * z);
24
+ #ifdef __cplusplus
25
+ extern "C" {
26
+ #endif
27
+
28
+
29
+ extern struct SN_env * finnish_ISO_8859_1_create_env(void);
30
+ extern void finnish_ISO_8859_1_close_env(struct SN_env * z);
31
+
32
+
33
+ #ifdef __cplusplus
34
+ }
35
+ #endif
36
+ static const symbol s_0_0[2] = { 'p', 'a' };
37
+ static const symbol s_0_1[3] = { 's', 't', 'i' };
38
+ static const symbol s_0_2[4] = { 'k', 'a', 'a', 'n' };
39
+ static const symbol s_0_3[3] = { 'h', 'a', 'n' };
40
+ static const symbol s_0_4[3] = { 'k', 'i', 'n' };
41
+ static const symbol s_0_5[3] = { 'h', 0xE4, 'n' };
42
+ static const symbol s_0_6[4] = { 'k', 0xE4, 0xE4, 'n' };
43
+ static const symbol s_0_7[2] = { 'k', 'o' };
44
+ static const symbol s_0_8[2] = { 'p', 0xE4 };
45
+ static const symbol s_0_9[2] = { 'k', 0xF6 };
46
+
47
+ static const struct among a_0[10] =
48
+ {
49
+ /* 0 */ { 2, s_0_0, -1, 1, 0},
50
+ /* 1 */ { 3, s_0_1, -1, 2, 0},
51
+ /* 2 */ { 4, s_0_2, -1, 1, 0},
52
+ /* 3 */ { 3, s_0_3, -1, 1, 0},
53
+ /* 4 */ { 3, s_0_4, -1, 1, 0},
54
+ /* 5 */ { 3, s_0_5, -1, 1, 0},
55
+ /* 6 */ { 4, s_0_6, -1, 1, 0},
56
+ /* 7 */ { 2, s_0_7, -1, 1, 0},
57
+ /* 8 */ { 2, s_0_8, -1, 1, 0},
58
+ /* 9 */ { 2, s_0_9, -1, 1, 0}
59
+ };
60
+
61
+ static const symbol s_1_0[3] = { 'l', 'l', 'a' };
62
+ static const symbol s_1_1[2] = { 'n', 'a' };
63
+ static const symbol s_1_2[3] = { 's', 's', 'a' };
64
+ static const symbol s_1_3[2] = { 't', 'a' };
65
+ static const symbol s_1_4[3] = { 'l', 't', 'a' };
66
+ static const symbol s_1_5[3] = { 's', 't', 'a' };
67
+
68
+ static const struct among a_1[6] =
69
+ {
70
+ /* 0 */ { 3, s_1_0, -1, -1, 0},
71
+ /* 1 */ { 2, s_1_1, -1, -1, 0},
72
+ /* 2 */ { 3, s_1_2, -1, -1, 0},
73
+ /* 3 */ { 2, s_1_3, -1, -1, 0},
74
+ /* 4 */ { 3, s_1_4, 3, -1, 0},
75
+ /* 5 */ { 3, s_1_5, 3, -1, 0}
76
+ };
77
+
78
+ static const symbol s_2_0[3] = { 'l', 'l', 0xE4 };
79
+ static const symbol s_2_1[2] = { 'n', 0xE4 };
80
+ static const symbol s_2_2[3] = { 's', 's', 0xE4 };
81
+ static const symbol s_2_3[2] = { 't', 0xE4 };
82
+ static const symbol s_2_4[3] = { 'l', 't', 0xE4 };
83
+ static const symbol s_2_5[3] = { 's', 't', 0xE4 };
84
+
85
+ static const struct among a_2[6] =
86
+ {
87
+ /* 0 */ { 3, s_2_0, -1, -1, 0},
88
+ /* 1 */ { 2, s_2_1, -1, -1, 0},
89
+ /* 2 */ { 3, s_2_2, -1, -1, 0},
90
+ /* 3 */ { 2, s_2_3, -1, -1, 0},
91
+ /* 4 */ { 3, s_2_4, 3, -1, 0},
92
+ /* 5 */ { 3, s_2_5, 3, -1, 0}
93
+ };
94
+
95
+ static const symbol s_3_0[3] = { 'l', 'l', 'e' };
96
+ static const symbol s_3_1[3] = { 'i', 'n', 'e' };
97
+
98
+ static const struct among a_3[2] =
99
+ {
100
+ /* 0 */ { 3, s_3_0, -1, -1, 0},
101
+ /* 1 */ { 3, s_3_1, -1, -1, 0}
102
+ };
103
+
104
+ static const symbol s_4_0[3] = { 'n', 's', 'a' };
105
+ static const symbol s_4_1[3] = { 'm', 'm', 'e' };
106
+ static const symbol s_4_2[3] = { 'n', 'n', 'e' };
107
+ static const symbol s_4_3[2] = { 'n', 'i' };
108
+ static const symbol s_4_4[2] = { 's', 'i' };
109
+ static const symbol s_4_5[2] = { 'a', 'n' };
110
+ static const symbol s_4_6[2] = { 'e', 'n' };
111
+ static const symbol s_4_7[2] = { 0xE4, 'n' };
112
+ static const symbol s_4_8[3] = { 'n', 's', 0xE4 };
113
+
114
+ static const struct among a_4[9] =
115
+ {
116
+ /* 0 */ { 3, s_4_0, -1, 3, 0},
117
+ /* 1 */ { 3, s_4_1, -1, 3, 0},
118
+ /* 2 */ { 3, s_4_2, -1, 3, 0},
119
+ /* 3 */ { 2, s_4_3, -1, 2, 0},
120
+ /* 4 */ { 2, s_4_4, -1, 1, 0},
121
+ /* 5 */ { 2, s_4_5, -1, 4, 0},
122
+ /* 6 */ { 2, s_4_6, -1, 6, 0},
123
+ /* 7 */ { 2, s_4_7, -1, 5, 0},
124
+ /* 8 */ { 3, s_4_8, -1, 3, 0}
125
+ };
126
+
127
+ static const symbol s_5_0[2] = { 'a', 'a' };
128
+ static const symbol s_5_1[2] = { 'e', 'e' };
129
+ static const symbol s_5_2[2] = { 'i', 'i' };
130
+ static const symbol s_5_3[2] = { 'o', 'o' };
131
+ static const symbol s_5_4[2] = { 'u', 'u' };
132
+ static const symbol s_5_5[2] = { 0xE4, 0xE4 };
133
+ static const symbol s_5_6[2] = { 0xF6, 0xF6 };
134
+
135
+ static const struct among a_5[7] =
136
+ {
137
+ /* 0 */ { 2, s_5_0, -1, -1, 0},
138
+ /* 1 */ { 2, s_5_1, -1, -1, 0},
139
+ /* 2 */ { 2, s_5_2, -1, -1, 0},
140
+ /* 3 */ { 2, s_5_3, -1, -1, 0},
141
+ /* 4 */ { 2, s_5_4, -1, -1, 0},
142
+ /* 5 */ { 2, s_5_5, -1, -1, 0},
143
+ /* 6 */ { 2, s_5_6, -1, -1, 0}
144
+ };
145
+
146
+ static const symbol s_6_0[1] = { 'a' };
147
+ static const symbol s_6_1[3] = { 'l', 'l', 'a' };
148
+ static const symbol s_6_2[2] = { 'n', 'a' };
149
+ static const symbol s_6_3[3] = { 's', 's', 'a' };
150
+ static const symbol s_6_4[2] = { 't', 'a' };
151
+ static const symbol s_6_5[3] = { 'l', 't', 'a' };
152
+ static const symbol s_6_6[3] = { 's', 't', 'a' };
153
+ static const symbol s_6_7[3] = { 't', 't', 'a' };
154
+ static const symbol s_6_8[3] = { 'l', 'l', 'e' };
155
+ static const symbol s_6_9[3] = { 'i', 'n', 'e' };
156
+ static const symbol s_6_10[3] = { 'k', 's', 'i' };
157
+ static const symbol s_6_11[1] = { 'n' };
158
+ static const symbol s_6_12[3] = { 'h', 'a', 'n' };
159
+ static const symbol s_6_13[3] = { 'd', 'e', 'n' };
160
+ static const symbol s_6_14[4] = { 's', 'e', 'e', 'n' };
161
+ static const symbol s_6_15[3] = { 'h', 'e', 'n' };
162
+ static const symbol s_6_16[4] = { 't', 't', 'e', 'n' };
163
+ static const symbol s_6_17[3] = { 'h', 'i', 'n' };
164
+ static const symbol s_6_18[4] = { 's', 'i', 'i', 'n' };
165
+ static const symbol s_6_19[3] = { 'h', 'o', 'n' };
166
+ static const symbol s_6_20[3] = { 'h', 0xE4, 'n' };
167
+ static const symbol s_6_21[3] = { 'h', 0xF6, 'n' };
168
+ static const symbol s_6_22[1] = { 0xE4 };
169
+ static const symbol s_6_23[3] = { 'l', 'l', 0xE4 };
170
+ static const symbol s_6_24[2] = { 'n', 0xE4 };
171
+ static const symbol s_6_25[3] = { 's', 's', 0xE4 };
172
+ static const symbol s_6_26[2] = { 't', 0xE4 };
173
+ static const symbol s_6_27[3] = { 'l', 't', 0xE4 };
174
+ static const symbol s_6_28[3] = { 's', 't', 0xE4 };
175
+ static const symbol s_6_29[3] = { 't', 't', 0xE4 };
176
+
177
+ static const struct among a_6[30] =
178
+ {
179
+ /* 0 */ { 1, s_6_0, -1, 8, 0},
180
+ /* 1 */ { 3, s_6_1, 0, -1, 0},
181
+ /* 2 */ { 2, s_6_2, 0, -1, 0},
182
+ /* 3 */ { 3, s_6_3, 0, -1, 0},
183
+ /* 4 */ { 2, s_6_4, 0, -1, 0},
184
+ /* 5 */ { 3, s_6_5, 4, -1, 0},
185
+ /* 6 */ { 3, s_6_6, 4, -1, 0},
186
+ /* 7 */ { 3, s_6_7, 4, 9, 0},
187
+ /* 8 */ { 3, s_6_8, -1, -1, 0},
188
+ /* 9 */ { 3, s_6_9, -1, -1, 0},
189
+ /* 10 */ { 3, s_6_10, -1, -1, 0},
190
+ /* 11 */ { 1, s_6_11, -1, 7, 0},
191
+ /* 12 */ { 3, s_6_12, 11, 1, 0},
192
+ /* 13 */ { 3, s_6_13, 11, -1, r_VI},
193
+ /* 14 */ { 4, s_6_14, 11, -1, r_LONG},
194
+ /* 15 */ { 3, s_6_15, 11, 2, 0},
195
+ /* 16 */ { 4, s_6_16, 11, -1, r_VI},
196
+ /* 17 */ { 3, s_6_17, 11, 3, 0},
197
+ /* 18 */ { 4, s_6_18, 11, -1, r_VI},
198
+ /* 19 */ { 3, s_6_19, 11, 4, 0},
199
+ /* 20 */ { 3, s_6_20, 11, 5, 0},
200
+ /* 21 */ { 3, s_6_21, 11, 6, 0},
201
+ /* 22 */ { 1, s_6_22, -1, 8, 0},
202
+ /* 23 */ { 3, s_6_23, 22, -1, 0},
203
+ /* 24 */ { 2, s_6_24, 22, -1, 0},
204
+ /* 25 */ { 3, s_6_25, 22, -1, 0},
205
+ /* 26 */ { 2, s_6_26, 22, -1, 0},
206
+ /* 27 */ { 3, s_6_27, 26, -1, 0},
207
+ /* 28 */ { 3, s_6_28, 26, -1, 0},
208
+ /* 29 */ { 3, s_6_29, 26, 9, 0}
209
+ };
210
+
211
+ static const symbol s_7_0[3] = { 'e', 'j', 'a' };
212
+ static const symbol s_7_1[3] = { 'm', 'm', 'a' };
213
+ static const symbol s_7_2[4] = { 'i', 'm', 'm', 'a' };
214
+ static const symbol s_7_3[3] = { 'm', 'p', 'a' };
215
+ static const symbol s_7_4[4] = { 'i', 'm', 'p', 'a' };
216
+ static const symbol s_7_5[3] = { 'm', 'm', 'i' };
217
+ static const symbol s_7_6[4] = { 'i', 'm', 'm', 'i' };
218
+ static const symbol s_7_7[3] = { 'm', 'p', 'i' };
219
+ static const symbol s_7_8[4] = { 'i', 'm', 'p', 'i' };
220
+ static const symbol s_7_9[3] = { 'e', 'j', 0xE4 };
221
+ static const symbol s_7_10[3] = { 'm', 'm', 0xE4 };
222
+ static const symbol s_7_11[4] = { 'i', 'm', 'm', 0xE4 };
223
+ static const symbol s_7_12[3] = { 'm', 'p', 0xE4 };
224
+ static const symbol s_7_13[4] = { 'i', 'm', 'p', 0xE4 };
225
+
226
+ static const struct among a_7[14] =
227
+ {
228
+ /* 0 */ { 3, s_7_0, -1, -1, 0},
229
+ /* 1 */ { 3, s_7_1, -1, 1, 0},
230
+ /* 2 */ { 4, s_7_2, 1, -1, 0},
231
+ /* 3 */ { 3, s_7_3, -1, 1, 0},
232
+ /* 4 */ { 4, s_7_4, 3, -1, 0},
233
+ /* 5 */ { 3, s_7_5, -1, 1, 0},
234
+ /* 6 */ { 4, s_7_6, 5, -1, 0},
235
+ /* 7 */ { 3, s_7_7, -1, 1, 0},
236
+ /* 8 */ { 4, s_7_8, 7, -1, 0},
237
+ /* 9 */ { 3, s_7_9, -1, -1, 0},
238
+ /* 10 */ { 3, s_7_10, -1, 1, 0},
239
+ /* 11 */ { 4, s_7_11, 10, -1, 0},
240
+ /* 12 */ { 3, s_7_12, -1, 1, 0},
241
+ /* 13 */ { 4, s_7_13, 12, -1, 0}
242
+ };
243
+
244
+ static const symbol s_8_0[1] = { 'i' };
245
+ static const symbol s_8_1[1] = { 'j' };
246
+
247
+ static const struct among a_8[2] =
248
+ {
249
+ /* 0 */ { 1, s_8_0, -1, -1, 0},
250
+ /* 1 */ { 1, s_8_1, -1, -1, 0}
251
+ };
252
+
253
+ static const symbol s_9_0[3] = { 'm', 'm', 'a' };
254
+ static const symbol s_9_1[4] = { 'i', 'm', 'm', 'a' };
255
+
256
+ static const struct among a_9[2] =
257
+ {
258
+ /* 0 */ { 3, s_9_0, -1, 1, 0},
259
+ /* 1 */ { 4, s_9_1, 0, -1, 0}
260
+ };
261
+
262
+ static const unsigned char g_AEI[] = { 17, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 8 };
263
+
264
+ static const unsigned char g_V1[] = { 17, 65, 16, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 8, 0, 32 };
265
+
266
+ static const unsigned char g_V2[] = { 17, 65, 16, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 8, 0, 32 };
267
+
268
+ static const unsigned char g_particle_end[] = { 17, 97, 24, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 8, 0, 32 };
269
+
270
+ static const symbol s_0[] = { 'k' };
271
+ static const symbol s_1[] = { 'k', 's', 'e' };
272
+ static const symbol s_2[] = { 'k', 's', 'i' };
273
+ static const symbol s_3[] = { 'i' };
274
+ static const symbol s_4[] = { 'a' };
275
+ static const symbol s_5[] = { 'e' };
276
+ static const symbol s_6[] = { 'i' };
277
+ static const symbol s_7[] = { 'o' };
278
+ static const symbol s_8[] = { 0xE4 };
279
+ static const symbol s_9[] = { 0xF6 };
280
+ static const symbol s_10[] = { 'i', 'e' };
281
+ static const symbol s_11[] = { 'e' };
282
+ static const symbol s_12[] = { 'p', 'o' };
283
+ static const symbol s_13[] = { 't' };
284
+ static const symbol s_14[] = { 'p', 'o' };
285
+ static const symbol s_15[] = { 'j' };
286
+ static const symbol s_16[] = { 'o' };
287
+ static const symbol s_17[] = { 'u' };
288
+ static const symbol s_18[] = { 'o' };
289
+ static const symbol s_19[] = { 'j' };
290
+
291
+ static int r_mark_regions(struct SN_env * z) {
292
+ z->I[0] = z->l;
293
+ z->I[1] = z->l;
294
+ if (out_grouping(z, g_V1, 97, 246, 1) < 0) return 0; /* goto */ /* grouping V1, line 46 */
295
+ { /* gopast */ /* non V1, line 46 */
296
+ int ret = in_grouping(z, g_V1, 97, 246, 1);
297
+ if (ret < 0) return 0;
298
+ z->c += ret;
299
+ }
300
+ z->I[0] = z->c; /* setmark p1, line 46 */
301
+ if (out_grouping(z, g_V1, 97, 246, 1) < 0) return 0; /* goto */ /* grouping V1, line 47 */
302
+ { /* gopast */ /* non V1, line 47 */
303
+ int ret = in_grouping(z, g_V1, 97, 246, 1);
304
+ if (ret < 0) return 0;
305
+ z->c += ret;
306
+ }
307
+ z->I[1] = z->c; /* setmark p2, line 47 */
308
+ return 1;
309
+ }
310
+
311
+ static int r_R2(struct SN_env * z) {
312
+ if (!(z->I[1] <= z->c)) return 0;
313
+ return 1;
314
+ }
315
+
316
+ static int r_particle_etc(struct SN_env * z) {
317
+ int among_var;
318
+ { int mlimit; /* setlimit, line 55 */
319
+ int m1 = z->l - z->c; (void)m1;
320
+ if (z->c < z->I[0]) return 0;
321
+ z->c = z->I[0]; /* tomark, line 55 */
322
+ mlimit = z->lb; z->lb = z->c;
323
+ z->c = z->l - m1;
324
+ z->ket = z->c; /* [, line 55 */
325
+ among_var = find_among_b(z, a_0, 10); /* substring, line 55 */
326
+ if (!(among_var)) { z->lb = mlimit; return 0; }
327
+ z->bra = z->c; /* ], line 55 */
328
+ z->lb = mlimit;
329
+ }
330
+ switch(among_var) {
331
+ case 0: return 0;
332
+ case 1:
333
+ if (in_grouping_b(z, g_particle_end, 97, 246, 0)) return 0;
334
+ break;
335
+ case 2:
336
+ { int ret = r_R2(z);
337
+ if (ret == 0) return 0; /* call R2, line 64 */
338
+ if (ret < 0) return ret;
339
+ }
340
+ break;
341
+ }
342
+ { int ret = slice_del(z); /* delete, line 66 */
343
+ if (ret < 0) return ret;
344
+ }
345
+ return 1;
346
+ }
347
+
348
+ static int r_possessive(struct SN_env * z) {
349
+ int among_var;
350
+ { int mlimit; /* setlimit, line 69 */
351
+ int m1 = z->l - z->c; (void)m1;
352
+ if (z->c < z->I[0]) return 0;
353
+ z->c = z->I[0]; /* tomark, line 69 */
354
+ mlimit = z->lb; z->lb = z->c;
355
+ z->c = z->l - m1;
356
+ z->ket = z->c; /* [, line 69 */
357
+ among_var = find_among_b(z, a_4, 9); /* substring, line 69 */
358
+ if (!(among_var)) { z->lb = mlimit; return 0; }
359
+ z->bra = z->c; /* ], line 69 */
360
+ z->lb = mlimit;
361
+ }
362
+ switch(among_var) {
363
+ case 0: return 0;
364
+ case 1:
365
+ { int m2 = z->l - z->c; (void)m2; /* not, line 72 */
366
+ if (!(eq_s_b(z, 1, s_0))) goto lab0;
367
+ return 0;
368
+ lab0:
369
+ z->c = z->l - m2;
370
+ }
371
+ { int ret = slice_del(z); /* delete, line 72 */
372
+ if (ret < 0) return ret;
373
+ }
374
+ break;
375
+ case 2:
376
+ { int ret = slice_del(z); /* delete, line 74 */
377
+ if (ret < 0) return ret;
378
+ }
379
+ z->ket = z->c; /* [, line 74 */
380
+ if (!(eq_s_b(z, 3, s_1))) return 0;
381
+ z->bra = z->c; /* ], line 74 */
382
+ { int ret = slice_from_s(z, 3, s_2); /* <-, line 74 */
383
+ if (ret < 0) return ret;
384
+ }
385
+ break;
386
+ case 3:
387
+ { int ret = slice_del(z); /* delete, line 78 */
388
+ if (ret < 0) return ret;
389
+ }
390
+ break;
391
+ case 4:
392
+ if (z->c - 1 <= z->lb || z->p[z->c - 1] != 97) return 0;
393
+ if (!(find_among_b(z, a_1, 6))) return 0; /* among, line 81 */
394
+ { int ret = slice_del(z); /* delete, line 81 */
395
+ if (ret < 0) return ret;
396
+ }
397
+ break;
398
+ case 5:
399
+ if (z->c - 1 <= z->lb || z->p[z->c - 1] != 228) return 0;
400
+ if (!(find_among_b(z, a_2, 6))) return 0; /* among, line 83 */
401
+ { int ret = slice_del(z); /* delete, line 84 */
402
+ if (ret < 0) return ret;
403
+ }
404
+ break;
405
+ case 6:
406
+ if (z->c - 2 <= z->lb || z->p[z->c - 1] != 101) return 0;
407
+ if (!(find_among_b(z, a_3, 2))) return 0; /* among, line 86 */
408
+ { int ret = slice_del(z); /* delete, line 86 */
409
+ if (ret < 0) return ret;
410
+ }
411
+ break;
412
+ }
413
+ return 1;
414
+ }
415
+
416
+ static int r_LONG(struct SN_env * z) {
417
+ if (!(find_among_b(z, a_5, 7))) return 0; /* among, line 91 */
418
+ return 1;
419
+ }
420
+
421
+ static int r_VI(struct SN_env * z) {
422
+ if (!(eq_s_b(z, 1, s_3))) return 0;
423
+ if (in_grouping_b(z, g_V2, 97, 246, 0)) return 0;
424
+ return 1;
425
+ }
426
+
427
+ static int r_case_ending(struct SN_env * z) {
428
+ int among_var;
429
+ { int mlimit; /* setlimit, line 96 */
430
+ int m1 = z->l - z->c; (void)m1;
431
+ if (z->c < z->I[0]) return 0;
432
+ z->c = z->I[0]; /* tomark, line 96 */
433
+ mlimit = z->lb; z->lb = z->c;
434
+ z->c = z->l - m1;
435
+ z->ket = z->c; /* [, line 96 */
436
+ among_var = find_among_b(z, a_6, 30); /* substring, line 96 */
437
+ if (!(among_var)) { z->lb = mlimit; return 0; }
438
+ z->bra = z->c; /* ], line 96 */
439
+ z->lb = mlimit;
440
+ }
441
+ switch(among_var) {
442
+ case 0: return 0;
443
+ case 1:
444
+ if (!(eq_s_b(z, 1, s_4))) return 0;
445
+ break;
446
+ case 2:
447
+ if (!(eq_s_b(z, 1, s_5))) return 0;
448
+ break;
449
+ case 3:
450
+ if (!(eq_s_b(z, 1, s_6))) return 0;
451
+ break;
452
+ case 4:
453
+ if (!(eq_s_b(z, 1, s_7))) return 0;
454
+ break;
455
+ case 5:
456
+ if (!(eq_s_b(z, 1, s_8))) return 0;
457
+ break;
458
+ case 6:
459
+ if (!(eq_s_b(z, 1, s_9))) return 0;
460
+ break;
461
+ case 7:
462
+ { int m_keep = z->l - z->c;/* (void) m_keep;*/ /* try, line 111 */
463
+ { int m2 = z->l - z->c; (void)m2; /* and, line 113 */
464
+ { int m3 = z->l - z->c; (void)m3; /* or, line 112 */
465
+ { int ret = r_LONG(z);
466
+ if (ret == 0) goto lab2; /* call LONG, line 111 */
467
+ if (ret < 0) return ret;
468
+ }
469
+ goto lab1;
470
+ lab2:
471
+ z->c = z->l - m3;
472
+ if (!(eq_s_b(z, 2, s_10))) { z->c = z->l - m_keep; goto lab0; }
473
+ }
474
+ lab1:
475
+ z->c = z->l - m2;
476
+ if (z->c <= z->lb) { z->c = z->l - m_keep; goto lab0; }
477
+ z->c--; /* next, line 113 */
478
+ }
479
+ z->bra = z->c; /* ], line 113 */
480
+ lab0:
481
+ ;
482
+ }
483
+ break;
484
+ case 8:
485
+ if (in_grouping_b(z, g_V1, 97, 246, 0)) return 0;
486
+ if (out_grouping_b(z, g_V1, 97, 246, 0)) return 0;
487
+ break;
488
+ case 9:
489
+ if (!(eq_s_b(z, 1, s_11))) return 0;
490
+ break;
491
+ }
492
+ { int ret = slice_del(z); /* delete, line 138 */
493
+ if (ret < 0) return ret;
494
+ }
495
+ z->B[0] = 1; /* set ending_removed, line 139 */
496
+ return 1;
497
+ }
498
+
499
+ static int r_other_endings(struct SN_env * z) {
500
+ int among_var;
501
+ { int mlimit; /* setlimit, line 142 */
502
+ int m1 = z->l - z->c; (void)m1;
503
+ if (z->c < z->I[1]) return 0;
504
+ z->c = z->I[1]; /* tomark, line 142 */
505
+ mlimit = z->lb; z->lb = z->c;
506
+ z->c = z->l - m1;
507
+ z->ket = z->c; /* [, line 142 */
508
+ among_var = find_among_b(z, a_7, 14); /* substring, line 142 */
509
+ if (!(among_var)) { z->lb = mlimit; return 0; }
510
+ z->bra = z->c; /* ], line 142 */
511
+ z->lb = mlimit;
512
+ }
513
+ switch(among_var) {
514
+ case 0: return 0;
515
+ case 1:
516
+ { int m2 = z->l - z->c; (void)m2; /* not, line 146 */
517
+ if (!(eq_s_b(z, 2, s_12))) goto lab0;
518
+ return 0;
519
+ lab0:
520
+ z->c = z->l - m2;
521
+ }
522
+ break;
523
+ }
524
+ { int ret = slice_del(z); /* delete, line 151 */
525
+ if (ret < 0) return ret;
526
+ }
527
+ return 1;
528
+ }
529
+
530
+ static int r_i_plural(struct SN_env * z) {
531
+ { int mlimit; /* setlimit, line 154 */
532
+ int m1 = z->l - z->c; (void)m1;
533
+ if (z->c < z->I[0]) return 0;
534
+ z->c = z->I[0]; /* tomark, line 154 */
535
+ mlimit = z->lb; z->lb = z->c;
536
+ z->c = z->l - m1;
537
+ z->ket = z->c; /* [, line 154 */
538
+ if (z->c <= z->lb || (z->p[z->c - 1] != 105 && z->p[z->c - 1] != 106)) { z->lb = mlimit; return 0; }
539
+ if (!(find_among_b(z, a_8, 2))) { z->lb = mlimit; return 0; } /* substring, line 154 */
540
+ z->bra = z->c; /* ], line 154 */
541
+ z->lb = mlimit;
542
+ }
543
+ { int ret = slice_del(z); /* delete, line 158 */
544
+ if (ret < 0) return ret;
545
+ }
546
+ return 1;
547
+ }
548
+
549
+ static int r_t_plural(struct SN_env * z) {
550
+ int among_var;
551
+ { int mlimit; /* setlimit, line 161 */
552
+ int m1 = z->l - z->c; (void)m1;
553
+ if (z->c < z->I[0]) return 0;
554
+ z->c = z->I[0]; /* tomark, line 161 */
555
+ mlimit = z->lb; z->lb = z->c;
556
+ z->c = z->l - m1;
557
+ z->ket = z->c; /* [, line 162 */
558
+ if (!(eq_s_b(z, 1, s_13))) { z->lb = mlimit; return 0; }
559
+ z->bra = z->c; /* ], line 162 */
560
+ { int m_test = z->l - z->c; /* test, line 162 */
561
+ if (in_grouping_b(z, g_V1, 97, 246, 0)) { z->lb = mlimit; return 0; }
562
+ z->c = z->l - m_test;
563
+ }
564
+ { int ret = slice_del(z); /* delete, line 163 */
565
+ if (ret < 0) return ret;
566
+ }
567
+ z->lb = mlimit;
568
+ }
569
+ { int mlimit; /* setlimit, line 165 */
570
+ int m2 = z->l - z->c; (void)m2;
571
+ if (z->c < z->I[1]) return 0;
572
+ z->c = z->I[1]; /* tomark, line 165 */
573
+ mlimit = z->lb; z->lb = z->c;
574
+ z->c = z->l - m2;
575
+ z->ket = z->c; /* [, line 165 */
576
+ if (z->c - 2 <= z->lb || z->p[z->c - 1] != 97) { z->lb = mlimit; return 0; }
577
+ among_var = find_among_b(z, a_9, 2); /* substring, line 165 */
578
+ if (!(among_var)) { z->lb = mlimit; return 0; }
579
+ z->bra = z->c; /* ], line 165 */
580
+ z->lb = mlimit;
581
+ }
582
+ switch(among_var) {
583
+ case 0: return 0;
584
+ case 1:
585
+ { int m3 = z->l - z->c; (void)m3; /* not, line 167 */
586
+ if (!(eq_s_b(z, 2, s_14))) goto lab0;
587
+ return 0;
588
+ lab0:
589
+ z->c = z->l - m3;
590
+ }
591
+ break;
592
+ }
593
+ { int ret = slice_del(z); /* delete, line 170 */
594
+ if (ret < 0) return ret;
595
+ }
596
+ return 1;
597
+ }
598
+
599
+ static int r_tidy(struct SN_env * z) {
600
+ { int mlimit; /* setlimit, line 173 */
601
+ int m1 = z->l - z->c; (void)m1;
602
+ if (z->c < z->I[0]) return 0;
603
+ z->c = z->I[0]; /* tomark, line 173 */
604
+ mlimit = z->lb; z->lb = z->c;
605
+ z->c = z->l - m1;
606
+ { int m2 = z->l - z->c; (void)m2; /* do, line 174 */
607
+ { int m3 = z->l - z->c; (void)m3; /* and, line 174 */
608
+ { int ret = r_LONG(z);
609
+ if (ret == 0) goto lab0; /* call LONG, line 174 */
610
+ if (ret < 0) return ret;
611
+ }
612
+ z->c = z->l - m3;
613
+ z->ket = z->c; /* [, line 174 */
614
+ if (z->c <= z->lb) goto lab0;
615
+ z->c--; /* next, line 174 */
616
+ z->bra = z->c; /* ], line 174 */
617
+ { int ret = slice_del(z); /* delete, line 174 */
618
+ if (ret < 0) return ret;
619
+ }
620
+ }
621
+ lab0:
622
+ z->c = z->l - m2;
623
+ }
624
+ { int m4 = z->l - z->c; (void)m4; /* do, line 175 */
625
+ z->ket = z->c; /* [, line 175 */
626
+ if (in_grouping_b(z, g_AEI, 97, 228, 0)) goto lab1;
627
+ z->bra = z->c; /* ], line 175 */
628
+ if (out_grouping_b(z, g_V1, 97, 246, 0)) goto lab1;
629
+ { int ret = slice_del(z); /* delete, line 175 */
630
+ if (ret < 0) return ret;
631
+ }
632
+ lab1:
633
+ z->c = z->l - m4;
634
+ }
635
+ { int m5 = z->l - z->c; (void)m5; /* do, line 176 */
636
+ z->ket = z->c; /* [, line 176 */
637
+ if (!(eq_s_b(z, 1, s_15))) goto lab2;
638
+ z->bra = z->c; /* ], line 176 */
639
+ { int m6 = z->l - z->c; (void)m6; /* or, line 176 */
640
+ if (!(eq_s_b(z, 1, s_16))) goto lab4;
641
+ goto lab3;
642
+ lab4:
643
+ z->c = z->l - m6;
644
+ if (!(eq_s_b(z, 1, s_17))) goto lab2;
645
+ }
646
+ lab3:
647
+ { int ret = slice_del(z); /* delete, line 176 */
648
+ if (ret < 0) return ret;
649
+ }
650
+ lab2:
651
+ z->c = z->l - m5;
652
+ }
653
+ { int m7 = z->l - z->c; (void)m7; /* do, line 177 */
654
+ z->ket = z->c; /* [, line 177 */
655
+ if (!(eq_s_b(z, 1, s_18))) goto lab5;
656
+ z->bra = z->c; /* ], line 177 */
657
+ if (!(eq_s_b(z, 1, s_19))) goto lab5;
658
+ { int ret = slice_del(z); /* delete, line 177 */
659
+ if (ret < 0) return ret;
660
+ }
661
+ lab5:
662
+ z->c = z->l - m7;
663
+ }
664
+ z->lb = mlimit;
665
+ }
666
+ if (in_grouping_b(z, g_V1, 97, 246, 1) < 0) return 0; /* goto */ /* non V1, line 179 */
667
+ z->ket = z->c; /* [, line 179 */
668
+ if (z->c <= z->lb) return 0;
669
+ z->c--; /* next, line 179 */
670
+ z->bra = z->c; /* ], line 179 */
671
+ z->S[0] = slice_to(z, z->S[0]); /* -> x, line 179 */
672
+ if (z->S[0] == 0) return -1; /* -> x, line 179 */
673
+ if (!(eq_v_b(z, z->S[0]))) return 0; /* name x, line 179 */
674
+ { int ret = slice_del(z); /* delete, line 179 */
675
+ if (ret < 0) return ret;
676
+ }
677
+ return 1;
678
+ }
679
+
680
+ extern int finnish_ISO_8859_1_stem(struct SN_env * z) {
681
+ { int c1 = z->c; /* do, line 185 */
682
+ { int ret = r_mark_regions(z);
683
+ if (ret == 0) goto lab0; /* call mark_regions, line 185 */
684
+ if (ret < 0) return ret;
685
+ }
686
+ lab0:
687
+ z->c = c1;
688
+ }
689
+ z->B[0] = 0; /* unset ending_removed, line 186 */
690
+ z->lb = z->c; z->c = z->l; /* backwards, line 187 */
691
+
692
+ { int m2 = z->l - z->c; (void)m2; /* do, line 188 */
693
+ { int ret = r_particle_etc(z);
694
+ if (ret == 0) goto lab1; /* call particle_etc, line 188 */
695
+ if (ret < 0) return ret;
696
+ }
697
+ lab1:
698
+ z->c = z->l - m2;
699
+ }
700
+ { int m3 = z->l - z->c; (void)m3; /* do, line 189 */
701
+ { int ret = r_possessive(z);
702
+ if (ret == 0) goto lab2; /* call possessive, line 189 */
703
+ if (ret < 0) return ret;
704
+ }
705
+ lab2:
706
+ z->c = z->l - m3;
707
+ }
708
+ { int m4 = z->l - z->c; (void)m4; /* do, line 190 */
709
+ { int ret = r_case_ending(z);
710
+ if (ret == 0) goto lab3; /* call case_ending, line 190 */
711
+ if (ret < 0) return ret;
712
+ }
713
+ lab3:
714
+ z->c = z->l - m4;
715
+ }
716
+ { int m5 = z->l - z->c; (void)m5; /* do, line 191 */
717
+ { int ret = r_other_endings(z);
718
+ if (ret == 0) goto lab4; /* call other_endings, line 191 */
719
+ if (ret < 0) return ret;
720
+ }
721
+ lab4:
722
+ z->c = z->l - m5;
723
+ }
724
+ { int m6 = z->l - z->c; (void)m6; /* or, line 192 */
725
+ if (!(z->B[0])) goto lab6; /* Boolean test ending_removed, line 192 */
726
+ { int m7 = z->l - z->c; (void)m7; /* do, line 192 */
727
+ { int ret = r_i_plural(z);
728
+ if (ret == 0) goto lab7; /* call i_plural, line 192 */
729
+ if (ret < 0) return ret;
730
+ }
731
+ lab7:
732
+ z->c = z->l - m7;
733
+ }
734
+ goto lab5;
735
+ lab6:
736
+ z->c = z->l - m6;
737
+ { int m8 = z->l - z->c; (void)m8; /* do, line 192 */
738
+ { int ret = r_t_plural(z);
739
+ if (ret == 0) goto lab8; /* call t_plural, line 192 */
740
+ if (ret < 0) return ret;
741
+ }
742
+ lab8:
743
+ z->c = z->l - m8;
744
+ }
745
+ }
746
+ lab5:
747
+ { int m9 = z->l - z->c; (void)m9; /* do, line 193 */
748
+ { int ret = r_tidy(z);
749
+ if (ret == 0) goto lab9; /* call tidy, line 193 */
750
+ if (ret < 0) return ret;
751
+ }
752
+ lab9:
753
+ z->c = z->l - m9;
754
+ }
755
+ z->c = z->lb;
756
+ return 1;
757
+ }
758
+
759
+ extern struct SN_env * finnish_ISO_8859_1_create_env(void) { return SN_create_env(1, 2, 1); }
760
+
761
+ extern void finnish_ISO_8859_1_close_env(struct SN_env * z) { SN_close_env(z, 1); }
762
+