ruby-stemmer-dimelo 0.9.3.dimelo1

Sign up to get free protection for your applications and to get access to all the features.
Files changed (95) hide show
  1. checksums.yaml +7 -0
  2. data/MIT-LICENSE +21 -0
  3. data/README.rdoc +117 -0
  4. data/Rakefile +70 -0
  5. data/VERSION +1 -0
  6. data/ext/lingua/extconf.rb +40 -0
  7. data/ext/lingua/stemmer.c +115 -0
  8. data/lib/lingua/stemmer.rb +60 -0
  9. data/libstemmer_c/MANIFEST +72 -0
  10. data/libstemmer_c/Makefile +9 -0
  11. data/libstemmer_c/Makefile.windows +15 -0
  12. data/libstemmer_c/README +125 -0
  13. data/libstemmer_c/examples/stemwords.c +209 -0
  14. data/libstemmer_c/include/libstemmer.h +79 -0
  15. data/libstemmer_c/libstemmer/libstemmer.c +93 -0
  16. data/libstemmer_c/libstemmer/libstemmer_utf8.c +93 -0
  17. data/libstemmer_c/libstemmer/modules.h +195 -0
  18. data/libstemmer_c/libstemmer/modules.txt +51 -0
  19. data/libstemmer_c/libstemmer/modules_utf8.h +123 -0
  20. data/libstemmer_c/libstemmer/modules_utf8.txt +50 -0
  21. data/libstemmer_c/mkinc.mak +86 -0
  22. data/libstemmer_c/mkinc_utf8.mak +54 -0
  23. data/libstemmer_c/runtime/api.c +66 -0
  24. data/libstemmer_c/runtime/api.h +26 -0
  25. data/libstemmer_c/runtime/header.h +58 -0
  26. data/libstemmer_c/runtime/utilities.c +478 -0
  27. data/libstemmer_c/src_c/stem_ISO_8859_1_danish.c +337 -0
  28. data/libstemmer_c/src_c/stem_ISO_8859_1_danish.h +16 -0
  29. data/libstemmer_c/src_c/stem_ISO_8859_1_dutch.c +624 -0
  30. data/libstemmer_c/src_c/stem_ISO_8859_1_dutch.h +16 -0
  31. data/libstemmer_c/src_c/stem_ISO_8859_1_english.c +1117 -0
  32. data/libstemmer_c/src_c/stem_ISO_8859_1_english.h +16 -0
  33. data/libstemmer_c/src_c/stem_ISO_8859_1_finnish.c +762 -0
  34. data/libstemmer_c/src_c/stem_ISO_8859_1_finnish.h +16 -0
  35. data/libstemmer_c/src_c/stem_ISO_8859_1_french.c +1230 -0
  36. data/libstemmer_c/src_c/stem_ISO_8859_1_french.h +16 -0
  37. data/libstemmer_c/src_c/stem_ISO_8859_1_german.c +503 -0
  38. data/libstemmer_c/src_c/stem_ISO_8859_1_german.h +16 -0
  39. data/libstemmer_c/src_c/stem_ISO_8859_1_hungarian.c +1230 -0
  40. data/libstemmer_c/src_c/stem_ISO_8859_1_hungarian.h +16 -0
  41. data/libstemmer_c/src_c/stem_ISO_8859_1_italian.c +1065 -0
  42. data/libstemmer_c/src_c/stem_ISO_8859_1_italian.h +16 -0
  43. data/libstemmer_c/src_c/stem_ISO_8859_1_latin.c +443 -0
  44. data/libstemmer_c/src_c/stem_ISO_8859_1_latin.h +16 -0
  45. data/libstemmer_c/src_c/stem_ISO_8859_1_norwegian.c +297 -0
  46. data/libstemmer_c/src_c/stem_ISO_8859_1_norwegian.h +16 -0
  47. data/libstemmer_c/src_c/stem_ISO_8859_1_porter.c +749 -0
  48. data/libstemmer_c/src_c/stem_ISO_8859_1_porter.h +16 -0
  49. data/libstemmer_c/src_c/stem_ISO_8859_1_portuguese.c +1017 -0
  50. data/libstemmer_c/src_c/stem_ISO_8859_1_portuguese.h +16 -0
  51. data/libstemmer_c/src_c/stem_ISO_8859_1_spanish.c +1093 -0
  52. data/libstemmer_c/src_c/stem_ISO_8859_1_spanish.h +16 -0
  53. data/libstemmer_c/src_c/stem_ISO_8859_1_swedish.c +307 -0
  54. data/libstemmer_c/src_c/stem_ISO_8859_1_swedish.h +16 -0
  55. data/libstemmer_c/src_c/stem_ISO_8859_2_romanian.c +998 -0
  56. data/libstemmer_c/src_c/stem_ISO_8859_2_romanian.h +16 -0
  57. data/libstemmer_c/src_c/stem_KOI8_R_russian.c +700 -0
  58. data/libstemmer_c/src_c/stem_KOI8_R_russian.h +16 -0
  59. data/libstemmer_c/src_c/stem_UTF_8_danish.c +339 -0
  60. data/libstemmer_c/src_c/stem_UTF_8_danish.h +16 -0
  61. data/libstemmer_c/src_c/stem_UTF_8_dutch.c +634 -0
  62. data/libstemmer_c/src_c/stem_UTF_8_dutch.h +16 -0
  63. data/libstemmer_c/src_c/stem_UTF_8_english.c +1125 -0
  64. data/libstemmer_c/src_c/stem_UTF_8_english.h +16 -0
  65. data/libstemmer_c/src_c/stem_UTF_8_finnish.c +768 -0
  66. data/libstemmer_c/src_c/stem_UTF_8_finnish.h +16 -0
  67. data/libstemmer_c/src_c/stem_UTF_8_french.c +1230 -0
  68. data/libstemmer_c/src_c/stem_UTF_8_french.h +16 -0
  69. data/libstemmer_c/src_c/stem_UTF_8_german.c +509 -0
  70. data/libstemmer_c/src_c/stem_UTF_8_german.h +16 -0
  71. data/libstemmer_c/src_c/stem_UTF_8_hungarian.c +1234 -0
  72. data/libstemmer_c/src_c/stem_UTF_8_hungarian.h +16 -0
  73. data/libstemmer_c/src_c/stem_UTF_8_italian.c +1073 -0
  74. data/libstemmer_c/src_c/stem_UTF_8_italian.h +16 -0
  75. data/libstemmer_c/src_c/stem_UTF_8_latin.c +443 -0
  76. data/libstemmer_c/src_c/stem_UTF_8_latin.h +16 -0
  77. data/libstemmer_c/src_c/stem_UTF_8_norwegian.c +299 -0
  78. data/libstemmer_c/src_c/stem_UTF_8_norwegian.h +16 -0
  79. data/libstemmer_c/src_c/stem_UTF_8_porter.c +755 -0
  80. data/libstemmer_c/src_c/stem_UTF_8_porter.h +16 -0
  81. data/libstemmer_c/src_c/stem_UTF_8_portuguese.c +1023 -0
  82. data/libstemmer_c/src_c/stem_UTF_8_portuguese.h +16 -0
  83. data/libstemmer_c/src_c/stem_UTF_8_romanian.c +1004 -0
  84. data/libstemmer_c/src_c/stem_UTF_8_romanian.h +16 -0
  85. data/libstemmer_c/src_c/stem_UTF_8_russian.c +694 -0
  86. data/libstemmer_c/src_c/stem_UTF_8_russian.h +16 -0
  87. data/libstemmer_c/src_c/stem_UTF_8_spanish.c +1097 -0
  88. data/libstemmer_c/src_c/stem_UTF_8_spanish.h +16 -0
  89. data/libstemmer_c/src_c/stem_UTF_8_swedish.c +309 -0
  90. data/libstemmer_c/src_c/stem_UTF_8_swedish.h +16 -0
  91. data/libstemmer_c/src_c/stem_UTF_8_turkish.c +2205 -0
  92. data/libstemmer_c/src_c/stem_UTF_8_turkish.h +16 -0
  93. data/test/helper.rb +3 -0
  94. data/test/lingua/test_stemmer.rb +99 -0
  95. metadata +141 -0
@@ -0,0 +1,16 @@
1
+
2
+ /* This file was generated automatically by the Snowball to ANSI C compiler */
3
+
4
+ #ifdef __cplusplus
5
+ extern "C" {
6
+ #endif
7
+
8
+ extern struct SN_env * english_UTF_8_create_env(void);
9
+ extern void english_UTF_8_close_env(struct SN_env * z);
10
+
11
+ extern int english_UTF_8_stem(struct SN_env * z);
12
+
13
+ #ifdef __cplusplus
14
+ }
15
+ #endif
16
+
@@ -0,0 +1,768 @@
1
+
2
+ /* This file was generated automatically by the Snowball to ANSI C compiler */
3
+
4
+ #include "../runtime/header.h"
5
+
6
+ #ifdef __cplusplus
7
+ extern "C" {
8
+ #endif
9
+ extern int finnish_UTF_8_stem(struct SN_env * z);
10
+ #ifdef __cplusplus
11
+ }
12
+ #endif
13
+ static int r_tidy(struct SN_env * z);
14
+ static int r_other_endings(struct SN_env * z);
15
+ static int r_t_plural(struct SN_env * z);
16
+ static int r_i_plural(struct SN_env * z);
17
+ static int r_case_ending(struct SN_env * z);
18
+ static int r_VI(struct SN_env * z);
19
+ static int r_LONG(struct SN_env * z);
20
+ static int r_possessive(struct SN_env * z);
21
+ static int r_particle_etc(struct SN_env * z);
22
+ static int r_R2(struct SN_env * z);
23
+ static int r_mark_regions(struct SN_env * z);
24
+ #ifdef __cplusplus
25
+ extern "C" {
26
+ #endif
27
+
28
+
29
+ extern struct SN_env * finnish_UTF_8_create_env(void);
30
+ extern void finnish_UTF_8_close_env(struct SN_env * z);
31
+
32
+
33
+ #ifdef __cplusplus
34
+ }
35
+ #endif
36
+ static const symbol s_0_0[2] = { 'p', 'a' };
37
+ static const symbol s_0_1[3] = { 's', 't', 'i' };
38
+ static const symbol s_0_2[4] = { 'k', 'a', 'a', 'n' };
39
+ static const symbol s_0_3[3] = { 'h', 'a', 'n' };
40
+ static const symbol s_0_4[3] = { 'k', 'i', 'n' };
41
+ static const symbol s_0_5[4] = { 'h', 0xC3, 0xA4, 'n' };
42
+ static const symbol s_0_6[6] = { 'k', 0xC3, 0xA4, 0xC3, 0xA4, 'n' };
43
+ static const symbol s_0_7[2] = { 'k', 'o' };
44
+ static const symbol s_0_8[3] = { 'p', 0xC3, 0xA4 };
45
+ static const symbol s_0_9[3] = { 'k', 0xC3, 0xB6 };
46
+
47
+ static const struct among a_0[10] =
48
+ {
49
+ /* 0 */ { 2, s_0_0, -1, 1, 0},
50
+ /* 1 */ { 3, s_0_1, -1, 2, 0},
51
+ /* 2 */ { 4, s_0_2, -1, 1, 0},
52
+ /* 3 */ { 3, s_0_3, -1, 1, 0},
53
+ /* 4 */ { 3, s_0_4, -1, 1, 0},
54
+ /* 5 */ { 4, s_0_5, -1, 1, 0},
55
+ /* 6 */ { 6, s_0_6, -1, 1, 0},
56
+ /* 7 */ { 2, s_0_7, -1, 1, 0},
57
+ /* 8 */ { 3, s_0_8, -1, 1, 0},
58
+ /* 9 */ { 3, s_0_9, -1, 1, 0}
59
+ };
60
+
61
+ static const symbol s_1_0[3] = { 'l', 'l', 'a' };
62
+ static const symbol s_1_1[2] = { 'n', 'a' };
63
+ static const symbol s_1_2[3] = { 's', 's', 'a' };
64
+ static const symbol s_1_3[2] = { 't', 'a' };
65
+ static const symbol s_1_4[3] = { 'l', 't', 'a' };
66
+ static const symbol s_1_5[3] = { 's', 't', 'a' };
67
+
68
+ static const struct among a_1[6] =
69
+ {
70
+ /* 0 */ { 3, s_1_0, -1, -1, 0},
71
+ /* 1 */ { 2, s_1_1, -1, -1, 0},
72
+ /* 2 */ { 3, s_1_2, -1, -1, 0},
73
+ /* 3 */ { 2, s_1_3, -1, -1, 0},
74
+ /* 4 */ { 3, s_1_4, 3, -1, 0},
75
+ /* 5 */ { 3, s_1_5, 3, -1, 0}
76
+ };
77
+
78
+ static const symbol s_2_0[4] = { 'l', 'l', 0xC3, 0xA4 };
79
+ static const symbol s_2_1[3] = { 'n', 0xC3, 0xA4 };
80
+ static const symbol s_2_2[4] = { 's', 's', 0xC3, 0xA4 };
81
+ static const symbol s_2_3[3] = { 't', 0xC3, 0xA4 };
82
+ static const symbol s_2_4[4] = { 'l', 't', 0xC3, 0xA4 };
83
+ static const symbol s_2_5[4] = { 's', 't', 0xC3, 0xA4 };
84
+
85
+ static const struct among a_2[6] =
86
+ {
87
+ /* 0 */ { 4, s_2_0, -1, -1, 0},
88
+ /* 1 */ { 3, s_2_1, -1, -1, 0},
89
+ /* 2 */ { 4, s_2_2, -1, -1, 0},
90
+ /* 3 */ { 3, s_2_3, -1, -1, 0},
91
+ /* 4 */ { 4, s_2_4, 3, -1, 0},
92
+ /* 5 */ { 4, s_2_5, 3, -1, 0}
93
+ };
94
+
95
+ static const symbol s_3_0[3] = { 'l', 'l', 'e' };
96
+ static const symbol s_3_1[3] = { 'i', 'n', 'e' };
97
+
98
+ static const struct among a_3[2] =
99
+ {
100
+ /* 0 */ { 3, s_3_0, -1, -1, 0},
101
+ /* 1 */ { 3, s_3_1, -1, -1, 0}
102
+ };
103
+
104
+ static const symbol s_4_0[3] = { 'n', 's', 'a' };
105
+ static const symbol s_4_1[3] = { 'm', 'm', 'e' };
106
+ static const symbol s_4_2[3] = { 'n', 'n', 'e' };
107
+ static const symbol s_4_3[2] = { 'n', 'i' };
108
+ static const symbol s_4_4[2] = { 's', 'i' };
109
+ static const symbol s_4_5[2] = { 'a', 'n' };
110
+ static const symbol s_4_6[2] = { 'e', 'n' };
111
+ static const symbol s_4_7[3] = { 0xC3, 0xA4, 'n' };
112
+ static const symbol s_4_8[4] = { 'n', 's', 0xC3, 0xA4 };
113
+
114
+ static const struct among a_4[9] =
115
+ {
116
+ /* 0 */ { 3, s_4_0, -1, 3, 0},
117
+ /* 1 */ { 3, s_4_1, -1, 3, 0},
118
+ /* 2 */ { 3, s_4_2, -1, 3, 0},
119
+ /* 3 */ { 2, s_4_3, -1, 2, 0},
120
+ /* 4 */ { 2, s_4_4, -1, 1, 0},
121
+ /* 5 */ { 2, s_4_5, -1, 4, 0},
122
+ /* 6 */ { 2, s_4_6, -1, 6, 0},
123
+ /* 7 */ { 3, s_4_7, -1, 5, 0},
124
+ /* 8 */ { 4, s_4_8, -1, 3, 0}
125
+ };
126
+
127
+ static const symbol s_5_0[2] = { 'a', 'a' };
128
+ static const symbol s_5_1[2] = { 'e', 'e' };
129
+ static const symbol s_5_2[2] = { 'i', 'i' };
130
+ static const symbol s_5_3[2] = { 'o', 'o' };
131
+ static const symbol s_5_4[2] = { 'u', 'u' };
132
+ static const symbol s_5_5[4] = { 0xC3, 0xA4, 0xC3, 0xA4 };
133
+ static const symbol s_5_6[4] = { 0xC3, 0xB6, 0xC3, 0xB6 };
134
+
135
+ static const struct among a_5[7] =
136
+ {
137
+ /* 0 */ { 2, s_5_0, -1, -1, 0},
138
+ /* 1 */ { 2, s_5_1, -1, -1, 0},
139
+ /* 2 */ { 2, s_5_2, -1, -1, 0},
140
+ /* 3 */ { 2, s_5_3, -1, -1, 0},
141
+ /* 4 */ { 2, s_5_4, -1, -1, 0},
142
+ /* 5 */ { 4, s_5_5, -1, -1, 0},
143
+ /* 6 */ { 4, s_5_6, -1, -1, 0}
144
+ };
145
+
146
+ static const symbol s_6_0[1] = { 'a' };
147
+ static const symbol s_6_1[3] = { 'l', 'l', 'a' };
148
+ static const symbol s_6_2[2] = { 'n', 'a' };
149
+ static const symbol s_6_3[3] = { 's', 's', 'a' };
150
+ static const symbol s_6_4[2] = { 't', 'a' };
151
+ static const symbol s_6_5[3] = { 'l', 't', 'a' };
152
+ static const symbol s_6_6[3] = { 's', 't', 'a' };
153
+ static const symbol s_6_7[3] = { 't', 't', 'a' };
154
+ static const symbol s_6_8[3] = { 'l', 'l', 'e' };
155
+ static const symbol s_6_9[3] = { 'i', 'n', 'e' };
156
+ static const symbol s_6_10[3] = { 'k', 's', 'i' };
157
+ static const symbol s_6_11[1] = { 'n' };
158
+ static const symbol s_6_12[3] = { 'h', 'a', 'n' };
159
+ static const symbol s_6_13[3] = { 'd', 'e', 'n' };
160
+ static const symbol s_6_14[4] = { 's', 'e', 'e', 'n' };
161
+ static const symbol s_6_15[3] = { 'h', 'e', 'n' };
162
+ static const symbol s_6_16[4] = { 't', 't', 'e', 'n' };
163
+ static const symbol s_6_17[3] = { 'h', 'i', 'n' };
164
+ static const symbol s_6_18[4] = { 's', 'i', 'i', 'n' };
165
+ static const symbol s_6_19[3] = { 'h', 'o', 'n' };
166
+ static const symbol s_6_20[4] = { 'h', 0xC3, 0xA4, 'n' };
167
+ static const symbol s_6_21[4] = { 'h', 0xC3, 0xB6, 'n' };
168
+ static const symbol s_6_22[2] = { 0xC3, 0xA4 };
169
+ static const symbol s_6_23[4] = { 'l', 'l', 0xC3, 0xA4 };
170
+ static const symbol s_6_24[3] = { 'n', 0xC3, 0xA4 };
171
+ static const symbol s_6_25[4] = { 's', 's', 0xC3, 0xA4 };
172
+ static const symbol s_6_26[3] = { 't', 0xC3, 0xA4 };
173
+ static const symbol s_6_27[4] = { 'l', 't', 0xC3, 0xA4 };
174
+ static const symbol s_6_28[4] = { 's', 't', 0xC3, 0xA4 };
175
+ static const symbol s_6_29[4] = { 't', 't', 0xC3, 0xA4 };
176
+
177
+ static const struct among a_6[30] =
178
+ {
179
+ /* 0 */ { 1, s_6_0, -1, 8, 0},
180
+ /* 1 */ { 3, s_6_1, 0, -1, 0},
181
+ /* 2 */ { 2, s_6_2, 0, -1, 0},
182
+ /* 3 */ { 3, s_6_3, 0, -1, 0},
183
+ /* 4 */ { 2, s_6_4, 0, -1, 0},
184
+ /* 5 */ { 3, s_6_5, 4, -1, 0},
185
+ /* 6 */ { 3, s_6_6, 4, -1, 0},
186
+ /* 7 */ { 3, s_6_7, 4, 9, 0},
187
+ /* 8 */ { 3, s_6_8, -1, -1, 0},
188
+ /* 9 */ { 3, s_6_9, -1, -1, 0},
189
+ /* 10 */ { 3, s_6_10, -1, -1, 0},
190
+ /* 11 */ { 1, s_6_11, -1, 7, 0},
191
+ /* 12 */ { 3, s_6_12, 11, 1, 0},
192
+ /* 13 */ { 3, s_6_13, 11, -1, r_VI},
193
+ /* 14 */ { 4, s_6_14, 11, -1, r_LONG},
194
+ /* 15 */ { 3, s_6_15, 11, 2, 0},
195
+ /* 16 */ { 4, s_6_16, 11, -1, r_VI},
196
+ /* 17 */ { 3, s_6_17, 11, 3, 0},
197
+ /* 18 */ { 4, s_6_18, 11, -1, r_VI},
198
+ /* 19 */ { 3, s_6_19, 11, 4, 0},
199
+ /* 20 */ { 4, s_6_20, 11, 5, 0},
200
+ /* 21 */ { 4, s_6_21, 11, 6, 0},
201
+ /* 22 */ { 2, s_6_22, -1, 8, 0},
202
+ /* 23 */ { 4, s_6_23, 22, -1, 0},
203
+ /* 24 */ { 3, s_6_24, 22, -1, 0},
204
+ /* 25 */ { 4, s_6_25, 22, -1, 0},
205
+ /* 26 */ { 3, s_6_26, 22, -1, 0},
206
+ /* 27 */ { 4, s_6_27, 26, -1, 0},
207
+ /* 28 */ { 4, s_6_28, 26, -1, 0},
208
+ /* 29 */ { 4, s_6_29, 26, 9, 0}
209
+ };
210
+
211
+ static const symbol s_7_0[3] = { 'e', 'j', 'a' };
212
+ static const symbol s_7_1[3] = { 'm', 'm', 'a' };
213
+ static const symbol s_7_2[4] = { 'i', 'm', 'm', 'a' };
214
+ static const symbol s_7_3[3] = { 'm', 'p', 'a' };
215
+ static const symbol s_7_4[4] = { 'i', 'm', 'p', 'a' };
216
+ static const symbol s_7_5[3] = { 'm', 'm', 'i' };
217
+ static const symbol s_7_6[4] = { 'i', 'm', 'm', 'i' };
218
+ static const symbol s_7_7[3] = { 'm', 'p', 'i' };
219
+ static const symbol s_7_8[4] = { 'i', 'm', 'p', 'i' };
220
+ static const symbol s_7_9[4] = { 'e', 'j', 0xC3, 0xA4 };
221
+ static const symbol s_7_10[4] = { 'm', 'm', 0xC3, 0xA4 };
222
+ static const symbol s_7_11[5] = { 'i', 'm', 'm', 0xC3, 0xA4 };
223
+ static const symbol s_7_12[4] = { 'm', 'p', 0xC3, 0xA4 };
224
+ static const symbol s_7_13[5] = { 'i', 'm', 'p', 0xC3, 0xA4 };
225
+
226
+ static const struct among a_7[14] =
227
+ {
228
+ /* 0 */ { 3, s_7_0, -1, -1, 0},
229
+ /* 1 */ { 3, s_7_1, -1, 1, 0},
230
+ /* 2 */ { 4, s_7_2, 1, -1, 0},
231
+ /* 3 */ { 3, s_7_3, -1, 1, 0},
232
+ /* 4 */ { 4, s_7_4, 3, -1, 0},
233
+ /* 5 */ { 3, s_7_5, -1, 1, 0},
234
+ /* 6 */ { 4, s_7_6, 5, -1, 0},
235
+ /* 7 */ { 3, s_7_7, -1, 1, 0},
236
+ /* 8 */ { 4, s_7_8, 7, -1, 0},
237
+ /* 9 */ { 4, s_7_9, -1, -1, 0},
238
+ /* 10 */ { 4, s_7_10, -1, 1, 0},
239
+ /* 11 */ { 5, s_7_11, 10, -1, 0},
240
+ /* 12 */ { 4, s_7_12, -1, 1, 0},
241
+ /* 13 */ { 5, s_7_13, 12, -1, 0}
242
+ };
243
+
244
+ static const symbol s_8_0[1] = { 'i' };
245
+ static const symbol s_8_1[1] = { 'j' };
246
+
247
+ static const struct among a_8[2] =
248
+ {
249
+ /* 0 */ { 1, s_8_0, -1, -1, 0},
250
+ /* 1 */ { 1, s_8_1, -1, -1, 0}
251
+ };
252
+
253
+ static const symbol s_9_0[3] = { 'm', 'm', 'a' };
254
+ static const symbol s_9_1[4] = { 'i', 'm', 'm', 'a' };
255
+
256
+ static const struct among a_9[2] =
257
+ {
258
+ /* 0 */ { 3, s_9_0, -1, 1, 0},
259
+ /* 1 */ { 4, s_9_1, 0, -1, 0}
260
+ };
261
+
262
+ static const unsigned char g_AEI[] = { 17, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 8 };
263
+
264
+ static const unsigned char g_V1[] = { 17, 65, 16, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 8, 0, 32 };
265
+
266
+ static const unsigned char g_V2[] = { 17, 65, 16, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 8, 0, 32 };
267
+
268
+ static const unsigned char g_particle_end[] = { 17, 97, 24, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 8, 0, 32 };
269
+
270
+ static const symbol s_0[] = { 'k' };
271
+ static const symbol s_1[] = { 'k', 's', 'e' };
272
+ static const symbol s_2[] = { 'k', 's', 'i' };
273
+ static const symbol s_3[] = { 'i' };
274
+ static const symbol s_4[] = { 'a' };
275
+ static const symbol s_5[] = { 'e' };
276
+ static const symbol s_6[] = { 'i' };
277
+ static const symbol s_7[] = { 'o' };
278
+ static const symbol s_8[] = { 0xC3, 0xA4 };
279
+ static const symbol s_9[] = { 0xC3, 0xB6 };
280
+ static const symbol s_10[] = { 'i', 'e' };
281
+ static const symbol s_11[] = { 'e' };
282
+ static const symbol s_12[] = { 'p', 'o' };
283
+ static const symbol s_13[] = { 't' };
284
+ static const symbol s_14[] = { 'p', 'o' };
285
+ static const symbol s_15[] = { 'j' };
286
+ static const symbol s_16[] = { 'o' };
287
+ static const symbol s_17[] = { 'u' };
288
+ static const symbol s_18[] = { 'o' };
289
+ static const symbol s_19[] = { 'j' };
290
+
291
+ static int r_mark_regions(struct SN_env * z) {
292
+ z->I[0] = z->l;
293
+ z->I[1] = z->l;
294
+ if (out_grouping_U(z, g_V1, 97, 246, 1) < 0) return 0; /* goto */ /* grouping V1, line 46 */
295
+ { /* gopast */ /* non V1, line 46 */
296
+ int ret = in_grouping_U(z, g_V1, 97, 246, 1);
297
+ if (ret < 0) return 0;
298
+ z->c += ret;
299
+ }
300
+ z->I[0] = z->c; /* setmark p1, line 46 */
301
+ if (out_grouping_U(z, g_V1, 97, 246, 1) < 0) return 0; /* goto */ /* grouping V1, line 47 */
302
+ { /* gopast */ /* non V1, line 47 */
303
+ int ret = in_grouping_U(z, g_V1, 97, 246, 1);
304
+ if (ret < 0) return 0;
305
+ z->c += ret;
306
+ }
307
+ z->I[1] = z->c; /* setmark p2, line 47 */
308
+ return 1;
309
+ }
310
+
311
+ static int r_R2(struct SN_env * z) {
312
+ if (!(z->I[1] <= z->c)) return 0;
313
+ return 1;
314
+ }
315
+
316
+ static int r_particle_etc(struct SN_env * z) {
317
+ int among_var;
318
+ { int mlimit; /* setlimit, line 55 */
319
+ int m1 = z->l - z->c; (void)m1;
320
+ if (z->c < z->I[0]) return 0;
321
+ z->c = z->I[0]; /* tomark, line 55 */
322
+ mlimit = z->lb; z->lb = z->c;
323
+ z->c = z->l - m1;
324
+ z->ket = z->c; /* [, line 55 */
325
+ among_var = find_among_b(z, a_0, 10); /* substring, line 55 */
326
+ if (!(among_var)) { z->lb = mlimit; return 0; }
327
+ z->bra = z->c; /* ], line 55 */
328
+ z->lb = mlimit;
329
+ }
330
+ switch(among_var) {
331
+ case 0: return 0;
332
+ case 1:
333
+ if (in_grouping_b_U(z, g_particle_end, 97, 246, 0)) return 0;
334
+ break;
335
+ case 2:
336
+ { int ret = r_R2(z);
337
+ if (ret == 0) return 0; /* call R2, line 64 */
338
+ if (ret < 0) return ret;
339
+ }
340
+ break;
341
+ }
342
+ { int ret = slice_del(z); /* delete, line 66 */
343
+ if (ret < 0) return ret;
344
+ }
345
+ return 1;
346
+ }
347
+
348
+ static int r_possessive(struct SN_env * z) {
349
+ int among_var;
350
+ { int mlimit; /* setlimit, line 69 */
351
+ int m1 = z->l - z->c; (void)m1;
352
+ if (z->c < z->I[0]) return 0;
353
+ z->c = z->I[0]; /* tomark, line 69 */
354
+ mlimit = z->lb; z->lb = z->c;
355
+ z->c = z->l - m1;
356
+ z->ket = z->c; /* [, line 69 */
357
+ among_var = find_among_b(z, a_4, 9); /* substring, line 69 */
358
+ if (!(among_var)) { z->lb = mlimit; return 0; }
359
+ z->bra = z->c; /* ], line 69 */
360
+ z->lb = mlimit;
361
+ }
362
+ switch(among_var) {
363
+ case 0: return 0;
364
+ case 1:
365
+ { int m2 = z->l - z->c; (void)m2; /* not, line 72 */
366
+ if (!(eq_s_b(z, 1, s_0))) goto lab0;
367
+ return 0;
368
+ lab0:
369
+ z->c = z->l - m2;
370
+ }
371
+ { int ret = slice_del(z); /* delete, line 72 */
372
+ if (ret < 0) return ret;
373
+ }
374
+ break;
375
+ case 2:
376
+ { int ret = slice_del(z); /* delete, line 74 */
377
+ if (ret < 0) return ret;
378
+ }
379
+ z->ket = z->c; /* [, line 74 */
380
+ if (!(eq_s_b(z, 3, s_1))) return 0;
381
+ z->bra = z->c; /* ], line 74 */
382
+ { int ret = slice_from_s(z, 3, s_2); /* <-, line 74 */
383
+ if (ret < 0) return ret;
384
+ }
385
+ break;
386
+ case 3:
387
+ { int ret = slice_del(z); /* delete, line 78 */
388
+ if (ret < 0) return ret;
389
+ }
390
+ break;
391
+ case 4:
392
+ if (z->c - 1 <= z->lb || z->p[z->c - 1] != 97) return 0;
393
+ if (!(find_among_b(z, a_1, 6))) return 0; /* among, line 81 */
394
+ { int ret = slice_del(z); /* delete, line 81 */
395
+ if (ret < 0) return ret;
396
+ }
397
+ break;
398
+ case 5:
399
+ if (z->c - 2 <= z->lb || z->p[z->c - 1] != 164) return 0;
400
+ if (!(find_among_b(z, a_2, 6))) return 0; /* among, line 83 */
401
+ { int ret = slice_del(z); /* delete, line 84 */
402
+ if (ret < 0) return ret;
403
+ }
404
+ break;
405
+ case 6:
406
+ if (z->c - 2 <= z->lb || z->p[z->c - 1] != 101) return 0;
407
+ if (!(find_among_b(z, a_3, 2))) return 0; /* among, line 86 */
408
+ { int ret = slice_del(z); /* delete, line 86 */
409
+ if (ret < 0) return ret;
410
+ }
411
+ break;
412
+ }
413
+ return 1;
414
+ }
415
+
416
+ static int r_LONG(struct SN_env * z) {
417
+ if (!(find_among_b(z, a_5, 7))) return 0; /* among, line 91 */
418
+ return 1;
419
+ }
420
+
421
+ static int r_VI(struct SN_env * z) {
422
+ if (!(eq_s_b(z, 1, s_3))) return 0;
423
+ if (in_grouping_b_U(z, g_V2, 97, 246, 0)) return 0;
424
+ return 1;
425
+ }
426
+
427
+ static int r_case_ending(struct SN_env * z) {
428
+ int among_var;
429
+ { int mlimit; /* setlimit, line 96 */
430
+ int m1 = z->l - z->c; (void)m1;
431
+ if (z->c < z->I[0]) return 0;
432
+ z->c = z->I[0]; /* tomark, line 96 */
433
+ mlimit = z->lb; z->lb = z->c;
434
+ z->c = z->l - m1;
435
+ z->ket = z->c; /* [, line 96 */
436
+ among_var = find_among_b(z, a_6, 30); /* substring, line 96 */
437
+ if (!(among_var)) { z->lb = mlimit; return 0; }
438
+ z->bra = z->c; /* ], line 96 */
439
+ z->lb = mlimit;
440
+ }
441
+ switch(among_var) {
442
+ case 0: return 0;
443
+ case 1:
444
+ if (!(eq_s_b(z, 1, s_4))) return 0;
445
+ break;
446
+ case 2:
447
+ if (!(eq_s_b(z, 1, s_5))) return 0;
448
+ break;
449
+ case 3:
450
+ if (!(eq_s_b(z, 1, s_6))) return 0;
451
+ break;
452
+ case 4:
453
+ if (!(eq_s_b(z, 1, s_7))) return 0;
454
+ break;
455
+ case 5:
456
+ if (!(eq_s_b(z, 2, s_8))) return 0;
457
+ break;
458
+ case 6:
459
+ if (!(eq_s_b(z, 2, s_9))) return 0;
460
+ break;
461
+ case 7:
462
+ { int m_keep = z->l - z->c;/* (void) m_keep;*/ /* try, line 111 */
463
+ { int m2 = z->l - z->c; (void)m2; /* and, line 113 */
464
+ { int m3 = z->l - z->c; (void)m3; /* or, line 112 */
465
+ { int ret = r_LONG(z);
466
+ if (ret == 0) goto lab2; /* call LONG, line 111 */
467
+ if (ret < 0) return ret;
468
+ }
469
+ goto lab1;
470
+ lab2:
471
+ z->c = z->l - m3;
472
+ if (!(eq_s_b(z, 2, s_10))) { z->c = z->l - m_keep; goto lab0; }
473
+ }
474
+ lab1:
475
+ z->c = z->l - m2;
476
+ { int ret = skip_utf8(z->p, z->c, z->lb, 0, -1);
477
+ if (ret < 0) { z->c = z->l - m_keep; goto lab0; }
478
+ z->c = ret; /* next, line 113 */
479
+ }
480
+ }
481
+ z->bra = z->c; /* ], line 113 */
482
+ lab0:
483
+ ;
484
+ }
485
+ break;
486
+ case 8:
487
+ if (in_grouping_b_U(z, g_V1, 97, 246, 0)) return 0;
488
+ if (out_grouping_b_U(z, g_V1, 97, 246, 0)) return 0;
489
+ break;
490
+ case 9:
491
+ if (!(eq_s_b(z, 1, s_11))) return 0;
492
+ break;
493
+ }
494
+ { int ret = slice_del(z); /* delete, line 138 */
495
+ if (ret < 0) return ret;
496
+ }
497
+ z->B[0] = 1; /* set ending_removed, line 139 */
498
+ return 1;
499
+ }
500
+
501
+ static int r_other_endings(struct SN_env * z) {
502
+ int among_var;
503
+ { int mlimit; /* setlimit, line 142 */
504
+ int m1 = z->l - z->c; (void)m1;
505
+ if (z->c < z->I[1]) return 0;
506
+ z->c = z->I[1]; /* tomark, line 142 */
507
+ mlimit = z->lb; z->lb = z->c;
508
+ z->c = z->l - m1;
509
+ z->ket = z->c; /* [, line 142 */
510
+ among_var = find_among_b(z, a_7, 14); /* substring, line 142 */
511
+ if (!(among_var)) { z->lb = mlimit; return 0; }
512
+ z->bra = z->c; /* ], line 142 */
513
+ z->lb = mlimit;
514
+ }
515
+ switch(among_var) {
516
+ case 0: return 0;
517
+ case 1:
518
+ { int m2 = z->l - z->c; (void)m2; /* not, line 146 */
519
+ if (!(eq_s_b(z, 2, s_12))) goto lab0;
520
+ return 0;
521
+ lab0:
522
+ z->c = z->l - m2;
523
+ }
524
+ break;
525
+ }
526
+ { int ret = slice_del(z); /* delete, line 151 */
527
+ if (ret < 0) return ret;
528
+ }
529
+ return 1;
530
+ }
531
+
532
+ static int r_i_plural(struct SN_env * z) {
533
+ { int mlimit; /* setlimit, line 154 */
534
+ int m1 = z->l - z->c; (void)m1;
535
+ if (z->c < z->I[0]) return 0;
536
+ z->c = z->I[0]; /* tomark, line 154 */
537
+ mlimit = z->lb; z->lb = z->c;
538
+ z->c = z->l - m1;
539
+ z->ket = z->c; /* [, line 154 */
540
+ if (z->c <= z->lb || (z->p[z->c - 1] != 105 && z->p[z->c - 1] != 106)) { z->lb = mlimit; return 0; }
541
+ if (!(find_among_b(z, a_8, 2))) { z->lb = mlimit; return 0; } /* substring, line 154 */
542
+ z->bra = z->c; /* ], line 154 */
543
+ z->lb = mlimit;
544
+ }
545
+ { int ret = slice_del(z); /* delete, line 158 */
546
+ if (ret < 0) return ret;
547
+ }
548
+ return 1;
549
+ }
550
+
551
+ static int r_t_plural(struct SN_env * z) {
552
+ int among_var;
553
+ { int mlimit; /* setlimit, line 161 */
554
+ int m1 = z->l - z->c; (void)m1;
555
+ if (z->c < z->I[0]) return 0;
556
+ z->c = z->I[0]; /* tomark, line 161 */
557
+ mlimit = z->lb; z->lb = z->c;
558
+ z->c = z->l - m1;
559
+ z->ket = z->c; /* [, line 162 */
560
+ if (!(eq_s_b(z, 1, s_13))) { z->lb = mlimit; return 0; }
561
+ z->bra = z->c; /* ], line 162 */
562
+ { int m_test = z->l - z->c; /* test, line 162 */
563
+ if (in_grouping_b_U(z, g_V1, 97, 246, 0)) { z->lb = mlimit; return 0; }
564
+ z->c = z->l - m_test;
565
+ }
566
+ { int ret = slice_del(z); /* delete, line 163 */
567
+ if (ret < 0) return ret;
568
+ }
569
+ z->lb = mlimit;
570
+ }
571
+ { int mlimit; /* setlimit, line 165 */
572
+ int m2 = z->l - z->c; (void)m2;
573
+ if (z->c < z->I[1]) return 0;
574
+ z->c = z->I[1]; /* tomark, line 165 */
575
+ mlimit = z->lb; z->lb = z->c;
576
+ z->c = z->l - m2;
577
+ z->ket = z->c; /* [, line 165 */
578
+ if (z->c - 2 <= z->lb || z->p[z->c - 1] != 97) { z->lb = mlimit; return 0; }
579
+ among_var = find_among_b(z, a_9, 2); /* substring, line 165 */
580
+ if (!(among_var)) { z->lb = mlimit; return 0; }
581
+ z->bra = z->c; /* ], line 165 */
582
+ z->lb = mlimit;
583
+ }
584
+ switch(among_var) {
585
+ case 0: return 0;
586
+ case 1:
587
+ { int m3 = z->l - z->c; (void)m3; /* not, line 167 */
588
+ if (!(eq_s_b(z, 2, s_14))) goto lab0;
589
+ return 0;
590
+ lab0:
591
+ z->c = z->l - m3;
592
+ }
593
+ break;
594
+ }
595
+ { int ret = slice_del(z); /* delete, line 170 */
596
+ if (ret < 0) return ret;
597
+ }
598
+ return 1;
599
+ }
600
+
601
+ static int r_tidy(struct SN_env * z) {
602
+ { int mlimit; /* setlimit, line 173 */
603
+ int m1 = z->l - z->c; (void)m1;
604
+ if (z->c < z->I[0]) return 0;
605
+ z->c = z->I[0]; /* tomark, line 173 */
606
+ mlimit = z->lb; z->lb = z->c;
607
+ z->c = z->l - m1;
608
+ { int m2 = z->l - z->c; (void)m2; /* do, line 174 */
609
+ { int m3 = z->l - z->c; (void)m3; /* and, line 174 */
610
+ { int ret = r_LONG(z);
611
+ if (ret == 0) goto lab0; /* call LONG, line 174 */
612
+ if (ret < 0) return ret;
613
+ }
614
+ z->c = z->l - m3;
615
+ z->ket = z->c; /* [, line 174 */
616
+ { int ret = skip_utf8(z->p, z->c, z->lb, 0, -1);
617
+ if (ret < 0) goto lab0;
618
+ z->c = ret; /* next, line 174 */
619
+ }
620
+ z->bra = z->c; /* ], line 174 */
621
+ { int ret = slice_del(z); /* delete, line 174 */
622
+ if (ret < 0) return ret;
623
+ }
624
+ }
625
+ lab0:
626
+ z->c = z->l - m2;
627
+ }
628
+ { int m4 = z->l - z->c; (void)m4; /* do, line 175 */
629
+ z->ket = z->c; /* [, line 175 */
630
+ if (in_grouping_b_U(z, g_AEI, 97, 228, 0)) goto lab1;
631
+ z->bra = z->c; /* ], line 175 */
632
+ if (out_grouping_b_U(z, g_V1, 97, 246, 0)) goto lab1;
633
+ { int ret = slice_del(z); /* delete, line 175 */
634
+ if (ret < 0) return ret;
635
+ }
636
+ lab1:
637
+ z->c = z->l - m4;
638
+ }
639
+ { int m5 = z->l - z->c; (void)m5; /* do, line 176 */
640
+ z->ket = z->c; /* [, line 176 */
641
+ if (!(eq_s_b(z, 1, s_15))) goto lab2;
642
+ z->bra = z->c; /* ], line 176 */
643
+ { int m6 = z->l - z->c; (void)m6; /* or, line 176 */
644
+ if (!(eq_s_b(z, 1, s_16))) goto lab4;
645
+ goto lab3;
646
+ lab4:
647
+ z->c = z->l - m6;
648
+ if (!(eq_s_b(z, 1, s_17))) goto lab2;
649
+ }
650
+ lab3:
651
+ { int ret = slice_del(z); /* delete, line 176 */
652
+ if (ret < 0) return ret;
653
+ }
654
+ lab2:
655
+ z->c = z->l - m5;
656
+ }
657
+ { int m7 = z->l - z->c; (void)m7; /* do, line 177 */
658
+ z->ket = z->c; /* [, line 177 */
659
+ if (!(eq_s_b(z, 1, s_18))) goto lab5;
660
+ z->bra = z->c; /* ], line 177 */
661
+ if (!(eq_s_b(z, 1, s_19))) goto lab5;
662
+ { int ret = slice_del(z); /* delete, line 177 */
663
+ if (ret < 0) return ret;
664
+ }
665
+ lab5:
666
+ z->c = z->l - m7;
667
+ }
668
+ z->lb = mlimit;
669
+ }
670
+ if (in_grouping_b_U(z, g_V1, 97, 246, 1) < 0) return 0; /* goto */ /* non V1, line 179 */
671
+ z->ket = z->c; /* [, line 179 */
672
+ { int ret = skip_utf8(z->p, z->c, z->lb, 0, -1);
673
+ if (ret < 0) return 0;
674
+ z->c = ret; /* next, line 179 */
675
+ }
676
+ z->bra = z->c; /* ], line 179 */
677
+ z->S[0] = slice_to(z, z->S[0]); /* -> x, line 179 */
678
+ if (z->S[0] == 0) return -1; /* -> x, line 179 */
679
+ if (!(eq_v_b(z, z->S[0]))) return 0; /* name x, line 179 */
680
+ { int ret = slice_del(z); /* delete, line 179 */
681
+ if (ret < 0) return ret;
682
+ }
683
+ return 1;
684
+ }
685
+
686
+ extern int finnish_UTF_8_stem(struct SN_env * z) {
687
+ { int c1 = z->c; /* do, line 185 */
688
+ { int ret = r_mark_regions(z);
689
+ if (ret == 0) goto lab0; /* call mark_regions, line 185 */
690
+ if (ret < 0) return ret;
691
+ }
692
+ lab0:
693
+ z->c = c1;
694
+ }
695
+ z->B[0] = 0; /* unset ending_removed, line 186 */
696
+ z->lb = z->c; z->c = z->l; /* backwards, line 187 */
697
+
698
+ { int m2 = z->l - z->c; (void)m2; /* do, line 188 */
699
+ { int ret = r_particle_etc(z);
700
+ if (ret == 0) goto lab1; /* call particle_etc, line 188 */
701
+ if (ret < 0) return ret;
702
+ }
703
+ lab1:
704
+ z->c = z->l - m2;
705
+ }
706
+ { int m3 = z->l - z->c; (void)m3; /* do, line 189 */
707
+ { int ret = r_possessive(z);
708
+ if (ret == 0) goto lab2; /* call possessive, line 189 */
709
+ if (ret < 0) return ret;
710
+ }
711
+ lab2:
712
+ z->c = z->l - m3;
713
+ }
714
+ { int m4 = z->l - z->c; (void)m4; /* do, line 190 */
715
+ { int ret = r_case_ending(z);
716
+ if (ret == 0) goto lab3; /* call case_ending, line 190 */
717
+ if (ret < 0) return ret;
718
+ }
719
+ lab3:
720
+ z->c = z->l - m4;
721
+ }
722
+ { int m5 = z->l - z->c; (void)m5; /* do, line 191 */
723
+ { int ret = r_other_endings(z);
724
+ if (ret == 0) goto lab4; /* call other_endings, line 191 */
725
+ if (ret < 0) return ret;
726
+ }
727
+ lab4:
728
+ z->c = z->l - m5;
729
+ }
730
+ { int m6 = z->l - z->c; (void)m6; /* or, line 192 */
731
+ if (!(z->B[0])) goto lab6; /* Boolean test ending_removed, line 192 */
732
+ { int m7 = z->l - z->c; (void)m7; /* do, line 192 */
733
+ { int ret = r_i_plural(z);
734
+ if (ret == 0) goto lab7; /* call i_plural, line 192 */
735
+ if (ret < 0) return ret;
736
+ }
737
+ lab7:
738
+ z->c = z->l - m7;
739
+ }
740
+ goto lab5;
741
+ lab6:
742
+ z->c = z->l - m6;
743
+ { int m8 = z->l - z->c; (void)m8; /* do, line 192 */
744
+ { int ret = r_t_plural(z);
745
+ if (ret == 0) goto lab8; /* call t_plural, line 192 */
746
+ if (ret < 0) return ret;
747
+ }
748
+ lab8:
749
+ z->c = z->l - m8;
750
+ }
751
+ }
752
+ lab5:
753
+ { int m9 = z->l - z->c; (void)m9; /* do, line 193 */
754
+ { int ret = r_tidy(z);
755
+ if (ret == 0) goto lab9; /* call tidy, line 193 */
756
+ if (ret < 0) return ret;
757
+ }
758
+ lab9:
759
+ z->c = z->l - m9;
760
+ }
761
+ z->c = z->lb;
762
+ return 1;
763
+ }
764
+
765
+ extern struct SN_env * finnish_UTF_8_create_env(void) { return SN_create_env(1, 2, 1); }
766
+
767
+ extern void finnish_UTF_8_close_env(struct SN_env * z) { SN_close_env(z, 1); }
768
+