ferret 0.11.6 → 0.11.8.4
Sign up to get free protection for your applications and to get access to all the features.
- data/README +10 -22
- data/RELEASE_CHANGES +137 -0
- data/RELEASE_NOTES +60 -0
- data/Rakefile +379 -274
- data/TODO +100 -8
- data/bin/ferret-browser +0 -0
- data/ext/BZLIB_blocksort.c +1094 -0
- data/ext/BZLIB_bzlib.c +1578 -0
- data/ext/BZLIB_compress.c +672 -0
- data/ext/BZLIB_crctable.c +104 -0
- data/ext/BZLIB_decompress.c +626 -0
- data/ext/BZLIB_huffman.c +205 -0
- data/ext/BZLIB_randtable.c +84 -0
- data/ext/{api.c → STEMMER_api.c} +7 -10
- data/ext/{libstemmer.c → STEMMER_libstemmer.c} +3 -2
- data/ext/{stem_ISO_8859_1_danish.c → STEMMER_stem_ISO_8859_1_danish.c} +123 -124
- data/ext/{stem_ISO_8859_1_dutch.c → STEMMER_stem_ISO_8859_1_dutch.c} +177 -188
- data/ext/STEMMER_stem_ISO_8859_1_english.c +1117 -0
- data/ext/{stem_ISO_8859_1_finnish.c → STEMMER_stem_ISO_8859_1_finnish.c} +276 -306
- data/ext/STEMMER_stem_ISO_8859_1_french.c +1246 -0
- data/ext/{stem_ISO_8859_1_german.c → STEMMER_stem_ISO_8859_1_german.c} +161 -170
- data/ext/STEMMER_stem_ISO_8859_1_hungarian.c +1230 -0
- data/ext/STEMMER_stem_ISO_8859_1_italian.c +1065 -0
- data/ext/STEMMER_stem_ISO_8859_1_norwegian.c +297 -0
- data/ext/{stem_ISO_8859_1_porter.c → STEMMER_stem_ISO_8859_1_porter.c} +263 -290
- data/ext/{stem_ISO_8859_1_portuguese.c → STEMMER_stem_ISO_8859_1_portuguese.c} +362 -380
- data/ext/STEMMER_stem_ISO_8859_1_spanish.c +1093 -0
- data/ext/STEMMER_stem_ISO_8859_1_swedish.c +307 -0
- data/ext/STEMMER_stem_ISO_8859_2_romanian.c +998 -0
- data/ext/{stem_KOI8_R_russian.c → STEMMER_stem_KOI8_R_russian.c} +244 -245
- data/ext/STEMMER_stem_UTF_8_danish.c +339 -0
- data/ext/{stem_UTF_8_dutch.c → STEMMER_stem_UTF_8_dutch.c} +192 -211
- data/ext/STEMMER_stem_UTF_8_english.c +1125 -0
- data/ext/{stem_UTF_8_finnish.c → STEMMER_stem_UTF_8_finnish.c} +284 -324
- data/ext/STEMMER_stem_UTF_8_french.c +1256 -0
- data/ext/{stem_UTF_8_german.c → STEMMER_stem_UTF_8_german.c} +170 -187
- data/ext/STEMMER_stem_UTF_8_hungarian.c +1234 -0
- data/ext/STEMMER_stem_UTF_8_italian.c +1073 -0
- data/ext/STEMMER_stem_UTF_8_norwegian.c +299 -0
- data/ext/{stem_UTF_8_porter.c → STEMMER_stem_UTF_8_porter.c} +271 -310
- data/ext/STEMMER_stem_UTF_8_portuguese.c +1023 -0
- data/ext/STEMMER_stem_UTF_8_romanian.c +1004 -0
- data/ext/STEMMER_stem_UTF_8_russian.c +694 -0
- data/ext/STEMMER_stem_UTF_8_spanish.c +1097 -0
- data/ext/STEMMER_stem_UTF_8_swedish.c +309 -0
- data/ext/STEMMER_stem_UTF_8_turkish.c +2205 -0
- data/ext/{utilities.c → STEMMER_utilities.c} +100 -68
- data/ext/analysis.c +276 -121
- data/ext/analysis.h +190 -143
- data/ext/api.h +3 -4
- data/ext/array.c +5 -3
- data/ext/array.h +52 -43
- data/ext/bitvector.c +38 -482
- data/ext/bitvector.h +446 -124
- data/ext/bzlib.h +282 -0
- data/ext/bzlib_private.h +503 -0
- data/ext/compound_io.c +23 -22
- data/ext/config.h +21 -11
- data/ext/document.c +43 -40
- data/ext/document.h +31 -21
- data/ext/except.c +20 -38
- data/ext/except.h +89 -76
- data/ext/extconf.rb +3 -2
- data/ext/ferret.c +49 -35
- data/ext/ferret.h +14 -11
- data/ext/field_index.c +262 -0
- data/ext/field_index.h +52 -0
- data/ext/filter.c +11 -10
- data/ext/fs_store.c +65 -47
- data/ext/global.c +245 -165
- data/ext/global.h +252 -54
- data/ext/hash.c +200 -243
- data/ext/hash.h +205 -163
- data/ext/hashset.c +118 -96
- data/ext/hashset.h +110 -82
- data/ext/header.h +19 -19
- data/ext/helper.c +11 -10
- data/ext/helper.h +14 -6
- data/ext/index.c +745 -366
- data/ext/index.h +503 -529
- data/ext/internal.h +1020 -0
- data/ext/lang.c +10 -0
- data/ext/lang.h +35 -15
- data/ext/mempool.c +5 -4
- data/ext/mempool.h +30 -22
- data/ext/modules.h +35 -7
- data/ext/multimapper.c +43 -2
- data/ext/multimapper.h +32 -23
- data/ext/posh.c +0 -0
- data/ext/posh.h +4 -38
- data/ext/priorityqueue.c +10 -12
- data/ext/priorityqueue.h +33 -21
- data/ext/q_boolean.c +22 -9
- data/ext/q_const_score.c +3 -2
- data/ext/q_filtered_query.c +15 -12
- data/ext/q_fuzzy.c +147 -135
- data/ext/q_match_all.c +3 -2
- data/ext/q_multi_term.c +28 -32
- data/ext/q_parser.c +451 -173
- data/ext/q_phrase.c +158 -79
- data/ext/q_prefix.c +16 -18
- data/ext/q_range.c +363 -31
- data/ext/q_span.c +130 -141
- data/ext/q_term.c +21 -21
- data/ext/q_wildcard.c +19 -23
- data/ext/r_analysis.c +369 -242
- data/ext/r_index.c +421 -434
- data/ext/r_qparser.c +142 -92
- data/ext/r_search.c +790 -407
- data/ext/r_store.c +44 -44
- data/ext/r_utils.c +264 -96
- data/ext/ram_store.c +29 -23
- data/ext/scanner.c +895 -0
- data/ext/scanner.h +36 -0
- data/ext/scanner_mb.c +6701 -0
- data/ext/scanner_utf8.c +4415 -0
- data/ext/search.c +210 -87
- data/ext/search.h +556 -488
- data/ext/similarity.c +17 -16
- data/ext/similarity.h +51 -44
- data/ext/sort.c +157 -354
- data/ext/stem_ISO_8859_1_hungarian.h +16 -0
- data/ext/stem_ISO_8859_2_romanian.h +16 -0
- data/ext/stem_UTF_8_hungarian.h +16 -0
- data/ext/stem_UTF_8_romanian.h +16 -0
- data/ext/stem_UTF_8_turkish.h +16 -0
- data/ext/stopwords.c +287 -278
- data/ext/store.c +57 -51
- data/ext/store.h +308 -286
- data/ext/symbol.c +10 -0
- data/ext/symbol.h +23 -0
- data/ext/term_vectors.c +14 -293
- data/ext/threading.h +22 -22
- data/ext/win32.h +12 -4
- data/lib/ferret.rb +2 -1
- data/lib/ferret/browser.rb +1 -1
- data/lib/ferret/field_symbol.rb +94 -0
- data/lib/ferret/index.rb +221 -34
- data/lib/ferret/number_tools.rb +6 -6
- data/lib/ferret/version.rb +3 -0
- data/test/{unit → long_running}/largefile/tc_largefile.rb +1 -1
- data/test/test_helper.rb +7 -2
- data/test/test_installed.rb +1 -0
- data/test/threading/thread_safety_index_test.rb +10 -1
- data/test/threading/thread_safety_read_write_test.rb +4 -7
- data/test/threading/thread_safety_test.rb +0 -0
- data/test/unit/analysis/tc_analyzer.rb +29 -27
- data/test/unit/analysis/tc_token_stream.rb +23 -16
- data/test/unit/index/tc_index.rb +116 -11
- data/test/unit/index/tc_index_reader.rb +27 -27
- data/test/unit/index/tc_index_writer.rb +10 -0
- data/test/unit/index/th_doc.rb +38 -21
- data/test/unit/search/tc_filter.rb +31 -10
- data/test/unit/search/tc_index_searcher.rb +6 -0
- data/test/unit/search/tm_searcher.rb +53 -1
- data/test/unit/store/tc_fs_store.rb +40 -2
- data/test/unit/store/tc_ram_store.rb +0 -0
- data/test/unit/store/tm_store.rb +0 -0
- data/test/unit/store/tm_store_lock.rb +7 -6
- data/test/unit/tc_field_symbol.rb +26 -0
- data/test/unit/ts_analysis.rb +0 -0
- data/test/unit/ts_index.rb +0 -0
- data/test/unit/ts_store.rb +0 -0
- data/test/unit/ts_utils.rb +0 -0
- data/test/unit/utils/tc_number_tools.rb +0 -0
- data/test/utils/content_generator.rb +226 -0
- metadata +262 -221
- data/ext/inc/lang.h +0 -48
- data/ext/inc/threading.h +0 -31
- data/ext/stem_ISO_8859_1_english.c +0 -1156
- data/ext/stem_ISO_8859_1_french.c +0 -1276
- data/ext/stem_ISO_8859_1_italian.c +0 -1091
- data/ext/stem_ISO_8859_1_norwegian.c +0 -296
- data/ext/stem_ISO_8859_1_spanish.c +0 -1119
- data/ext/stem_ISO_8859_1_swedish.c +0 -307
- data/ext/stem_UTF_8_danish.c +0 -344
- data/ext/stem_UTF_8_english.c +0 -1176
- data/ext/stem_UTF_8_french.c +0 -1296
- data/ext/stem_UTF_8_italian.c +0 -1113
- data/ext/stem_UTF_8_norwegian.c +0 -302
- data/ext/stem_UTF_8_portuguese.c +0 -1055
- data/ext/stem_UTF_8_russian.c +0 -709
- data/ext/stem_UTF_8_spanish.c +0 -1137
- data/ext/stem_UTF_8_swedish.c +0 -313
- data/lib/ferret_version.rb +0 -3
@@ -0,0 +1,299 @@
|
|
1
|
+
|
2
|
+
/* This file was generated automatically by the Snowball to ANSI C compiler */
|
3
|
+
|
4
|
+
#include "header.h"
|
5
|
+
|
6
|
+
#ifdef __cplusplus
|
7
|
+
extern "C" {
|
8
|
+
#endif
|
9
|
+
extern int norwegian_UTF_8_stem(struct SN_env * z);
|
10
|
+
#ifdef __cplusplus
|
11
|
+
}
|
12
|
+
#endif
|
13
|
+
static int r_other_suffix(struct SN_env * z);
|
14
|
+
static int r_consonant_pair(struct SN_env * z);
|
15
|
+
static int r_main_suffix(struct SN_env * z);
|
16
|
+
static int r_mark_regions(struct SN_env * z);
|
17
|
+
#ifdef __cplusplus
|
18
|
+
extern "C" {
|
19
|
+
#endif
|
20
|
+
|
21
|
+
|
22
|
+
extern struct SN_env * norwegian_UTF_8_create_env(void);
|
23
|
+
extern void norwegian_UTF_8_close_env(struct SN_env * z);
|
24
|
+
|
25
|
+
|
26
|
+
#ifdef __cplusplus
|
27
|
+
}
|
28
|
+
#endif
|
29
|
+
static const symbol s_0_0[1] = { 'a' };
|
30
|
+
static const symbol s_0_1[1] = { 'e' };
|
31
|
+
static const symbol s_0_2[3] = { 'e', 'd', 'e' };
|
32
|
+
static const symbol s_0_3[4] = { 'a', 'n', 'd', 'e' };
|
33
|
+
static const symbol s_0_4[4] = { 'e', 'n', 'd', 'e' };
|
34
|
+
static const symbol s_0_5[3] = { 'a', 'n', 'e' };
|
35
|
+
static const symbol s_0_6[3] = { 'e', 'n', 'e' };
|
36
|
+
static const symbol s_0_7[6] = { 'h', 'e', 't', 'e', 'n', 'e' };
|
37
|
+
static const symbol s_0_8[4] = { 'e', 'r', 't', 'e' };
|
38
|
+
static const symbol s_0_9[2] = { 'e', 'n' };
|
39
|
+
static const symbol s_0_10[5] = { 'h', 'e', 't', 'e', 'n' };
|
40
|
+
static const symbol s_0_11[2] = { 'a', 'r' };
|
41
|
+
static const symbol s_0_12[2] = { 'e', 'r' };
|
42
|
+
static const symbol s_0_13[5] = { 'h', 'e', 't', 'e', 'r' };
|
43
|
+
static const symbol s_0_14[1] = { 's' };
|
44
|
+
static const symbol s_0_15[2] = { 'a', 's' };
|
45
|
+
static const symbol s_0_16[2] = { 'e', 's' };
|
46
|
+
static const symbol s_0_17[4] = { 'e', 'd', 'e', 's' };
|
47
|
+
static const symbol s_0_18[5] = { 'e', 'n', 'd', 'e', 's' };
|
48
|
+
static const symbol s_0_19[4] = { 'e', 'n', 'e', 's' };
|
49
|
+
static const symbol s_0_20[7] = { 'h', 'e', 't', 'e', 'n', 'e', 's' };
|
50
|
+
static const symbol s_0_21[3] = { 'e', 'n', 's' };
|
51
|
+
static const symbol s_0_22[6] = { 'h', 'e', 't', 'e', 'n', 's' };
|
52
|
+
static const symbol s_0_23[3] = { 'e', 'r', 's' };
|
53
|
+
static const symbol s_0_24[3] = { 'e', 't', 's' };
|
54
|
+
static const symbol s_0_25[2] = { 'e', 't' };
|
55
|
+
static const symbol s_0_26[3] = { 'h', 'e', 't' };
|
56
|
+
static const symbol s_0_27[3] = { 'e', 'r', 't' };
|
57
|
+
static const symbol s_0_28[3] = { 'a', 's', 't' };
|
58
|
+
|
59
|
+
static const struct among a_0[29] =
|
60
|
+
{
|
61
|
+
/* 0 */ { 1, s_0_0, -1, 1, 0},
|
62
|
+
/* 1 */ { 1, s_0_1, -1, 1, 0},
|
63
|
+
/* 2 */ { 3, s_0_2, 1, 1, 0},
|
64
|
+
/* 3 */ { 4, s_0_3, 1, 1, 0},
|
65
|
+
/* 4 */ { 4, s_0_4, 1, 1, 0},
|
66
|
+
/* 5 */ { 3, s_0_5, 1, 1, 0},
|
67
|
+
/* 6 */ { 3, s_0_6, 1, 1, 0},
|
68
|
+
/* 7 */ { 6, s_0_7, 6, 1, 0},
|
69
|
+
/* 8 */ { 4, s_0_8, 1, 3, 0},
|
70
|
+
/* 9 */ { 2, s_0_9, -1, 1, 0},
|
71
|
+
/* 10 */ { 5, s_0_10, 9, 1, 0},
|
72
|
+
/* 11 */ { 2, s_0_11, -1, 1, 0},
|
73
|
+
/* 12 */ { 2, s_0_12, -1, 1, 0},
|
74
|
+
/* 13 */ { 5, s_0_13, 12, 1, 0},
|
75
|
+
/* 14 */ { 1, s_0_14, -1, 2, 0},
|
76
|
+
/* 15 */ { 2, s_0_15, 14, 1, 0},
|
77
|
+
/* 16 */ { 2, s_0_16, 14, 1, 0},
|
78
|
+
/* 17 */ { 4, s_0_17, 16, 1, 0},
|
79
|
+
/* 18 */ { 5, s_0_18, 16, 1, 0},
|
80
|
+
/* 19 */ { 4, s_0_19, 16, 1, 0},
|
81
|
+
/* 20 */ { 7, s_0_20, 19, 1, 0},
|
82
|
+
/* 21 */ { 3, s_0_21, 14, 1, 0},
|
83
|
+
/* 22 */ { 6, s_0_22, 21, 1, 0},
|
84
|
+
/* 23 */ { 3, s_0_23, 14, 1, 0},
|
85
|
+
/* 24 */ { 3, s_0_24, 14, 1, 0},
|
86
|
+
/* 25 */ { 2, s_0_25, -1, 1, 0},
|
87
|
+
/* 26 */ { 3, s_0_26, 25, 1, 0},
|
88
|
+
/* 27 */ { 3, s_0_27, -1, 3, 0},
|
89
|
+
/* 28 */ { 3, s_0_28, -1, 1, 0}
|
90
|
+
};
|
91
|
+
|
92
|
+
static const symbol s_1_0[2] = { 'd', 't' };
|
93
|
+
static const symbol s_1_1[2] = { 'v', 't' };
|
94
|
+
|
95
|
+
static const struct among a_1[2] =
|
96
|
+
{
|
97
|
+
/* 0 */ { 2, s_1_0, -1, -1, 0},
|
98
|
+
/* 1 */ { 2, s_1_1, -1, -1, 0}
|
99
|
+
};
|
100
|
+
|
101
|
+
static const symbol s_2_0[3] = { 'l', 'e', 'g' };
|
102
|
+
static const symbol s_2_1[4] = { 'e', 'l', 'e', 'g' };
|
103
|
+
static const symbol s_2_2[2] = { 'i', 'g' };
|
104
|
+
static const symbol s_2_3[3] = { 'e', 'i', 'g' };
|
105
|
+
static const symbol s_2_4[3] = { 'l', 'i', 'g' };
|
106
|
+
static const symbol s_2_5[4] = { 'e', 'l', 'i', 'g' };
|
107
|
+
static const symbol s_2_6[3] = { 'e', 'l', 's' };
|
108
|
+
static const symbol s_2_7[3] = { 'l', 'o', 'v' };
|
109
|
+
static const symbol s_2_8[4] = { 'e', 'l', 'o', 'v' };
|
110
|
+
static const symbol s_2_9[4] = { 's', 'l', 'o', 'v' };
|
111
|
+
static const symbol s_2_10[7] = { 'h', 'e', 't', 's', 'l', 'o', 'v' };
|
112
|
+
|
113
|
+
static const struct among a_2[11] =
|
114
|
+
{
|
115
|
+
/* 0 */ { 3, s_2_0, -1, 1, 0},
|
116
|
+
/* 1 */ { 4, s_2_1, 0, 1, 0},
|
117
|
+
/* 2 */ { 2, s_2_2, -1, 1, 0},
|
118
|
+
/* 3 */ { 3, s_2_3, 2, 1, 0},
|
119
|
+
/* 4 */ { 3, s_2_4, 2, 1, 0},
|
120
|
+
/* 5 */ { 4, s_2_5, 4, 1, 0},
|
121
|
+
/* 6 */ { 3, s_2_6, -1, 1, 0},
|
122
|
+
/* 7 */ { 3, s_2_7, -1, 1, 0},
|
123
|
+
/* 8 */ { 4, s_2_8, 7, 1, 0},
|
124
|
+
/* 9 */ { 4, s_2_9, 7, 1, 0},
|
125
|
+
/* 10 */ { 7, s_2_10, 9, 1, 0}
|
126
|
+
};
|
127
|
+
|
128
|
+
static const unsigned char g_v[] = { 17, 65, 16, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 48, 0, 128 };
|
129
|
+
|
130
|
+
static const unsigned char g_s_ending[] = { 119, 125, 149, 1 };
|
131
|
+
|
132
|
+
static const symbol s_0[] = { 'k' };
|
133
|
+
static const symbol s_1[] = { 'e', 'r' };
|
134
|
+
|
135
|
+
static int r_mark_regions(struct SN_env * z) {
|
136
|
+
z->I[0] = z->l;
|
137
|
+
{ int c_test = z->c; /* test, line 30 */
|
138
|
+
{ int ret = skip_utf8(z->p, z->c, 0, z->l, + 3);
|
139
|
+
if (ret < 0) return 0;
|
140
|
+
z->c = ret; /* hop, line 30 */
|
141
|
+
}
|
142
|
+
z->I[1] = z->c; /* setmark x, line 30 */
|
143
|
+
z->c = c_test;
|
144
|
+
}
|
145
|
+
if (out_grouping_U(z, g_v, 97, 248, 1) < 0) return 0; /* goto */ /* grouping v, line 31 */
|
146
|
+
{ /* gopast */ /* non v, line 31 */
|
147
|
+
int ret = in_grouping_U(z, g_v, 97, 248, 1);
|
148
|
+
if (ret < 0) return 0;
|
149
|
+
z->c += ret;
|
150
|
+
}
|
151
|
+
z->I[0] = z->c; /* setmark p1, line 31 */
|
152
|
+
/* try, line 32 */
|
153
|
+
if (!(z->I[0] < z->I[1])) goto lab0;
|
154
|
+
z->I[0] = z->I[1];
|
155
|
+
lab0:
|
156
|
+
return 1;
|
157
|
+
}
|
158
|
+
|
159
|
+
static int r_main_suffix(struct SN_env * z) {
|
160
|
+
int among_var;
|
161
|
+
{ int mlimit; /* setlimit, line 38 */
|
162
|
+
int m1 = z->l - z->c; (void)m1;
|
163
|
+
if (z->c < z->I[0]) return 0;
|
164
|
+
z->c = z->I[0]; /* tomark, line 38 */
|
165
|
+
mlimit = z->lb; z->lb = z->c;
|
166
|
+
z->c = z->l - m1;
|
167
|
+
z->ket = z->c; /* [, line 38 */
|
168
|
+
if (z->c <= z->lb || z->p[z->c - 1] >> 5 != 3 || !((1851426 >> (z->p[z->c - 1] & 0x1f)) & 1)) { z->lb = mlimit; return 0; }
|
169
|
+
among_var = find_among_b(z, a_0, 29); /* substring, line 38 */
|
170
|
+
if (!(among_var)) { z->lb = mlimit; return 0; }
|
171
|
+
z->bra = z->c; /* ], line 38 */
|
172
|
+
z->lb = mlimit;
|
173
|
+
}
|
174
|
+
switch(among_var) {
|
175
|
+
case 0: return 0;
|
176
|
+
case 1:
|
177
|
+
{ int ret = slice_del(z); /* delete, line 44 */
|
178
|
+
if (ret < 0) return ret;
|
179
|
+
}
|
180
|
+
break;
|
181
|
+
case 2:
|
182
|
+
{ int m2 = z->l - z->c; (void)m2; /* or, line 46 */
|
183
|
+
if (in_grouping_b_U(z, g_s_ending, 98, 122, 0)) goto lab1;
|
184
|
+
goto lab0;
|
185
|
+
lab1:
|
186
|
+
z->c = z->l - m2;
|
187
|
+
if (!(eq_s_b(z, 1, s_0))) return 0;
|
188
|
+
if (out_grouping_b_U(z, g_v, 97, 248, 0)) return 0;
|
189
|
+
}
|
190
|
+
lab0:
|
191
|
+
{ int ret = slice_del(z); /* delete, line 46 */
|
192
|
+
if (ret < 0) return ret;
|
193
|
+
}
|
194
|
+
break;
|
195
|
+
case 3:
|
196
|
+
{ int ret = slice_from_s(z, 2, s_1); /* <-, line 48 */
|
197
|
+
if (ret < 0) return ret;
|
198
|
+
}
|
199
|
+
break;
|
200
|
+
}
|
201
|
+
return 1;
|
202
|
+
}
|
203
|
+
|
204
|
+
static int r_consonant_pair(struct SN_env * z) {
|
205
|
+
{ int m_test = z->l - z->c; /* test, line 53 */
|
206
|
+
{ int mlimit; /* setlimit, line 54 */
|
207
|
+
int m1 = z->l - z->c; (void)m1;
|
208
|
+
if (z->c < z->I[0]) return 0;
|
209
|
+
z->c = z->I[0]; /* tomark, line 54 */
|
210
|
+
mlimit = z->lb; z->lb = z->c;
|
211
|
+
z->c = z->l - m1;
|
212
|
+
z->ket = z->c; /* [, line 54 */
|
213
|
+
if (z->c - 1 <= z->lb || z->p[z->c - 1] != 116) { z->lb = mlimit; return 0; }
|
214
|
+
if (!(find_among_b(z, a_1, 2))) { z->lb = mlimit; return 0; } /* substring, line 54 */
|
215
|
+
z->bra = z->c; /* ], line 54 */
|
216
|
+
z->lb = mlimit;
|
217
|
+
}
|
218
|
+
z->c = z->l - m_test;
|
219
|
+
}
|
220
|
+
{ int ret = skip_utf8(z->p, z->c, z->lb, 0, -1);
|
221
|
+
if (ret < 0) return 0;
|
222
|
+
z->c = ret; /* next, line 59 */
|
223
|
+
}
|
224
|
+
z->bra = z->c; /* ], line 59 */
|
225
|
+
{ int ret = slice_del(z); /* delete, line 59 */
|
226
|
+
if (ret < 0) return ret;
|
227
|
+
}
|
228
|
+
return 1;
|
229
|
+
}
|
230
|
+
|
231
|
+
static int r_other_suffix(struct SN_env * z) {
|
232
|
+
int among_var;
|
233
|
+
{ int mlimit; /* setlimit, line 63 */
|
234
|
+
int m1 = z->l - z->c; (void)m1;
|
235
|
+
if (z->c < z->I[0]) return 0;
|
236
|
+
z->c = z->I[0]; /* tomark, line 63 */
|
237
|
+
mlimit = z->lb; z->lb = z->c;
|
238
|
+
z->c = z->l - m1;
|
239
|
+
z->ket = z->c; /* [, line 63 */
|
240
|
+
if (z->c - 1 <= z->lb || z->p[z->c - 1] >> 5 != 3 || !((4718720 >> (z->p[z->c - 1] & 0x1f)) & 1)) { z->lb = mlimit; return 0; }
|
241
|
+
among_var = find_among_b(z, a_2, 11); /* substring, line 63 */
|
242
|
+
if (!(among_var)) { z->lb = mlimit; return 0; }
|
243
|
+
z->bra = z->c; /* ], line 63 */
|
244
|
+
z->lb = mlimit;
|
245
|
+
}
|
246
|
+
switch(among_var) {
|
247
|
+
case 0: return 0;
|
248
|
+
case 1:
|
249
|
+
{ int ret = slice_del(z); /* delete, line 67 */
|
250
|
+
if (ret < 0) return ret;
|
251
|
+
}
|
252
|
+
break;
|
253
|
+
}
|
254
|
+
return 1;
|
255
|
+
}
|
256
|
+
|
257
|
+
extern int norwegian_UTF_8_stem(struct SN_env * z) {
|
258
|
+
{ int c1 = z->c; /* do, line 74 */
|
259
|
+
{ int ret = r_mark_regions(z);
|
260
|
+
if (ret == 0) goto lab0; /* call mark_regions, line 74 */
|
261
|
+
if (ret < 0) return ret;
|
262
|
+
}
|
263
|
+
lab0:
|
264
|
+
z->c = c1;
|
265
|
+
}
|
266
|
+
z->lb = z->c; z->c = z->l; /* backwards, line 75 */
|
267
|
+
|
268
|
+
{ int m2 = z->l - z->c; (void)m2; /* do, line 76 */
|
269
|
+
{ int ret = r_main_suffix(z);
|
270
|
+
if (ret == 0) goto lab1; /* call main_suffix, line 76 */
|
271
|
+
if (ret < 0) return ret;
|
272
|
+
}
|
273
|
+
lab1:
|
274
|
+
z->c = z->l - m2;
|
275
|
+
}
|
276
|
+
{ int m3 = z->l - z->c; (void)m3; /* do, line 77 */
|
277
|
+
{ int ret = r_consonant_pair(z);
|
278
|
+
if (ret == 0) goto lab2; /* call consonant_pair, line 77 */
|
279
|
+
if (ret < 0) return ret;
|
280
|
+
}
|
281
|
+
lab2:
|
282
|
+
z->c = z->l - m3;
|
283
|
+
}
|
284
|
+
{ int m4 = z->l - z->c; (void)m4; /* do, line 78 */
|
285
|
+
{ int ret = r_other_suffix(z);
|
286
|
+
if (ret == 0) goto lab3; /* call other_suffix, line 78 */
|
287
|
+
if (ret < 0) return ret;
|
288
|
+
}
|
289
|
+
lab3:
|
290
|
+
z->c = z->l - m4;
|
291
|
+
}
|
292
|
+
z->c = z->lb;
|
293
|
+
return 1;
|
294
|
+
}
|
295
|
+
|
296
|
+
extern struct SN_env * norwegian_UTF_8_create_env(void) { return SN_create_env(0, 2, 0); }
|
297
|
+
|
298
|
+
extern void norwegian_UTF_8_close_env(struct SN_env * z) { SN_close_env(z, 0); }
|
299
|
+
|
@@ -3,7 +3,13 @@
|
|
3
3
|
|
4
4
|
#include "header.h"
|
5
5
|
|
6
|
+
#ifdef __cplusplus
|
7
|
+
extern "C" {
|
8
|
+
#endif
|
6
9
|
extern int porter_UTF_8_stem(struct SN_env * z);
|
10
|
+
#ifdef __cplusplus
|
11
|
+
}
|
12
|
+
#endif
|
7
13
|
static int r_Step_5b(struct SN_env * z);
|
8
14
|
static int r_Step_5a(struct SN_env * z);
|
9
15
|
static int r_Step_4(struct SN_env * z);
|
@@ -15,16 +21,24 @@ static int r_Step_1a(struct SN_env * z);
|
|
15
21
|
static int r_R2(struct SN_env * z);
|
16
22
|
static int r_R1(struct SN_env * z);
|
17
23
|
static int r_shortv(struct SN_env * z);
|
24
|
+
#ifdef __cplusplus
|
25
|
+
extern "C" {
|
26
|
+
#endif
|
27
|
+
|
18
28
|
|
19
29
|
extern struct SN_env * porter_UTF_8_create_env(void);
|
20
30
|
extern void porter_UTF_8_close_env(struct SN_env * z);
|
21
31
|
|
22
|
-
static symbol s_0_0[1] = { 's' };
|
23
|
-
static symbol s_0_1[3] = { 'i', 'e', 's' };
|
24
|
-
static symbol s_0_2[4] = { 's', 's', 'e', 's' };
|
25
|
-
static symbol s_0_3[2] = { 's', 's' };
|
26
32
|
|
27
|
-
|
33
|
+
#ifdef __cplusplus
|
34
|
+
}
|
35
|
+
#endif
|
36
|
+
static const symbol s_0_0[1] = { 's' };
|
37
|
+
static const symbol s_0_1[3] = { 'i', 'e', 's' };
|
38
|
+
static const symbol s_0_2[4] = { 's', 's', 'e', 's' };
|
39
|
+
static const symbol s_0_3[2] = { 's', 's' };
|
40
|
+
|
41
|
+
static const struct among a_0[4] =
|
28
42
|
{
|
29
43
|
/* 0 */ { 1, s_0_0, -1, 3, 0},
|
30
44
|
/* 1 */ { 3, s_0_1, 0, 2, 0},
|
@@ -32,20 +46,20 @@ static struct among a_0[4] =
|
|
32
46
|
/* 3 */ { 2, s_0_3, 0, -1, 0}
|
33
47
|
};
|
34
48
|
|
35
|
-
static symbol s_1_1[2] = { 'b', 'b' };
|
36
|
-
static symbol s_1_2[2] = { 'd', 'd' };
|
37
|
-
static symbol s_1_3[2] = { 'f', 'f' };
|
38
|
-
static symbol s_1_4[2] = { 'g', 'g' };
|
39
|
-
static symbol s_1_5[2] = { 'b', 'l' };
|
40
|
-
static symbol s_1_6[2] = { 'm', 'm' };
|
41
|
-
static symbol s_1_7[2] = { 'n', 'n' };
|
42
|
-
static symbol s_1_8[2] = { 'p', 'p' };
|
43
|
-
static symbol s_1_9[2] = { 'r', 'r' };
|
44
|
-
static symbol s_1_10[2] = { 'a', 't' };
|
45
|
-
static symbol s_1_11[2] = { 't', 't' };
|
46
|
-
static symbol s_1_12[2] = { 'i', 'z' };
|
47
|
-
|
48
|
-
static struct among a_1[13] =
|
49
|
+
static const symbol s_1_1[2] = { 'b', 'b' };
|
50
|
+
static const symbol s_1_2[2] = { 'd', 'd' };
|
51
|
+
static const symbol s_1_3[2] = { 'f', 'f' };
|
52
|
+
static const symbol s_1_4[2] = { 'g', 'g' };
|
53
|
+
static const symbol s_1_5[2] = { 'b', 'l' };
|
54
|
+
static const symbol s_1_6[2] = { 'm', 'm' };
|
55
|
+
static const symbol s_1_7[2] = { 'n', 'n' };
|
56
|
+
static const symbol s_1_8[2] = { 'p', 'p' };
|
57
|
+
static const symbol s_1_9[2] = { 'r', 'r' };
|
58
|
+
static const symbol s_1_10[2] = { 'a', 't' };
|
59
|
+
static const symbol s_1_11[2] = { 't', 't' };
|
60
|
+
static const symbol s_1_12[2] = { 'i', 'z' };
|
61
|
+
|
62
|
+
static const struct among a_1[13] =
|
49
63
|
{
|
50
64
|
/* 0 */ { 0, 0, -1, 3, 0},
|
51
65
|
/* 1 */ { 2, s_1_1, 0, 2, 0},
|
@@ -62,39 +76,39 @@ static struct among a_1[13] =
|
|
62
76
|
/* 12 */ { 2, s_1_12, 0, 1, 0}
|
63
77
|
};
|
64
78
|
|
65
|
-
static symbol s_2_0[2] = { 'e', 'd' };
|
66
|
-
static symbol s_2_1[3] = { 'e', 'e', 'd' };
|
67
|
-
static symbol s_2_2[3] = { 'i', 'n', 'g' };
|
79
|
+
static const symbol s_2_0[2] = { 'e', 'd' };
|
80
|
+
static const symbol s_2_1[3] = { 'e', 'e', 'd' };
|
81
|
+
static const symbol s_2_2[3] = { 'i', 'n', 'g' };
|
68
82
|
|
69
|
-
static struct among a_2[3] =
|
83
|
+
static const struct among a_2[3] =
|
70
84
|
{
|
71
85
|
/* 0 */ { 2, s_2_0, -1, 2, 0},
|
72
86
|
/* 1 */ { 3, s_2_1, 0, 1, 0},
|
73
87
|
/* 2 */ { 3, s_2_2, -1, 2, 0}
|
74
88
|
};
|
75
89
|
|
76
|
-
static symbol s_3_0[4] = { 'a', 'n', 'c', 'i' };
|
77
|
-
static symbol s_3_1[4] = { 'e', 'n', 'c', 'i' };
|
78
|
-
static symbol s_3_2[4] = { 'a', 'b', 'l', 'i' };
|
79
|
-
static symbol s_3_3[3] = { 'e', 'l', 'i' };
|
80
|
-
static symbol s_3_4[4] = { 'a', 'l', 'l', 'i' };
|
81
|
-
static symbol s_3_5[5] = { 'o', 'u', 's', 'l', 'i' };
|
82
|
-
static symbol s_3_6[5] = { 'e', 'n', 't', 'l', 'i' };
|
83
|
-
static symbol s_3_7[5] = { 'a', 'l', 'i', 't', 'i' };
|
84
|
-
static symbol s_3_8[6] = { 'b', 'i', 'l', 'i', 't', 'i' };
|
85
|
-
static symbol s_3_9[5] = { 'i', 'v', 'i', 't', 'i' };
|
86
|
-
static symbol s_3_10[6] = { 't', 'i', 'o', 'n', 'a', 'l' };
|
87
|
-
static symbol s_3_11[7] = { 'a', 't', 'i', 'o', 'n', 'a', 'l' };
|
88
|
-
static symbol s_3_12[5] = { 'a', 'l', 'i', 's', 'm' };
|
89
|
-
static symbol s_3_13[5] = { 'a', 't', 'i', 'o', 'n' };
|
90
|
-
static symbol s_3_14[7] = { 'i', 'z', 'a', 't', 'i', 'o', 'n' };
|
91
|
-
static symbol s_3_15[4] = { 'i', 'z', 'e', 'r' };
|
92
|
-
static symbol s_3_16[4] = { 'a', 't', 'o', 'r' };
|
93
|
-
static symbol s_3_17[7] = { 'i', 'v', 'e', 'n', 'e', 's', 's' };
|
94
|
-
static symbol s_3_18[7] = { 'f', 'u', 'l', 'n', 'e', 's', 's' };
|
95
|
-
static symbol s_3_19[7] = { 'o', 'u', 's', 'n', 'e', 's', 's' };
|
96
|
-
|
97
|
-
static struct among a_3[20] =
|
90
|
+
static const symbol s_3_0[4] = { 'a', 'n', 'c', 'i' };
|
91
|
+
static const symbol s_3_1[4] = { 'e', 'n', 'c', 'i' };
|
92
|
+
static const symbol s_3_2[4] = { 'a', 'b', 'l', 'i' };
|
93
|
+
static const symbol s_3_3[3] = { 'e', 'l', 'i' };
|
94
|
+
static const symbol s_3_4[4] = { 'a', 'l', 'l', 'i' };
|
95
|
+
static const symbol s_3_5[5] = { 'o', 'u', 's', 'l', 'i' };
|
96
|
+
static const symbol s_3_6[5] = { 'e', 'n', 't', 'l', 'i' };
|
97
|
+
static const symbol s_3_7[5] = { 'a', 'l', 'i', 't', 'i' };
|
98
|
+
static const symbol s_3_8[6] = { 'b', 'i', 'l', 'i', 't', 'i' };
|
99
|
+
static const symbol s_3_9[5] = { 'i', 'v', 'i', 't', 'i' };
|
100
|
+
static const symbol s_3_10[6] = { 't', 'i', 'o', 'n', 'a', 'l' };
|
101
|
+
static const symbol s_3_11[7] = { 'a', 't', 'i', 'o', 'n', 'a', 'l' };
|
102
|
+
static const symbol s_3_12[5] = { 'a', 'l', 'i', 's', 'm' };
|
103
|
+
static const symbol s_3_13[5] = { 'a', 't', 'i', 'o', 'n' };
|
104
|
+
static const symbol s_3_14[7] = { 'i', 'z', 'a', 't', 'i', 'o', 'n' };
|
105
|
+
static const symbol s_3_15[4] = { 'i', 'z', 'e', 'r' };
|
106
|
+
static const symbol s_3_16[4] = { 'a', 't', 'o', 'r' };
|
107
|
+
static const symbol s_3_17[7] = { 'i', 'v', 'e', 'n', 'e', 's', 's' };
|
108
|
+
static const symbol s_3_18[7] = { 'f', 'u', 'l', 'n', 'e', 's', 's' };
|
109
|
+
static const symbol s_3_19[7] = { 'o', 'u', 's', 'n', 'e', 's', 's' };
|
110
|
+
|
111
|
+
static const struct among a_3[20] =
|
98
112
|
{
|
99
113
|
/* 0 */ { 4, s_3_0, -1, 3, 0},
|
100
114
|
/* 1 */ { 4, s_3_1, -1, 2, 0},
|
@@ -118,15 +132,15 @@ static struct among a_3[20] =
|
|
118
132
|
/* 19 */ { 7, s_3_19, -1, 12, 0}
|
119
133
|
};
|
120
134
|
|
121
|
-
static symbol s_4_0[5] = { 'i', 'c', 'a', 't', 'e' };
|
122
|
-
static symbol s_4_1[5] = { 'a', 't', 'i', 'v', 'e' };
|
123
|
-
static symbol s_4_2[5] = { 'a', 'l', 'i', 'z', 'e' };
|
124
|
-
static symbol s_4_3[5] = { 'i', 'c', 'i', 't', 'i' };
|
125
|
-
static symbol s_4_4[4] = { 'i', 'c', 'a', 'l' };
|
126
|
-
static symbol s_4_5[3] = { 'f', 'u', 'l' };
|
127
|
-
static symbol s_4_6[4] = { 'n', 'e', 's', 's' };
|
135
|
+
static const symbol s_4_0[5] = { 'i', 'c', 'a', 't', 'e' };
|
136
|
+
static const symbol s_4_1[5] = { 'a', 't', 'i', 'v', 'e' };
|
137
|
+
static const symbol s_4_2[5] = { 'a', 'l', 'i', 'z', 'e' };
|
138
|
+
static const symbol s_4_3[5] = { 'i', 'c', 'i', 't', 'i' };
|
139
|
+
static const symbol s_4_4[4] = { 'i', 'c', 'a', 'l' };
|
140
|
+
static const symbol s_4_5[3] = { 'f', 'u', 'l' };
|
141
|
+
static const symbol s_4_6[4] = { 'n', 'e', 's', 's' };
|
128
142
|
|
129
|
-
static struct among a_4[7] =
|
143
|
+
static const struct among a_4[7] =
|
130
144
|
{
|
131
145
|
/* 0 */ { 5, s_4_0, -1, 2, 0},
|
132
146
|
/* 1 */ { 5, s_4_1, -1, 3, 0},
|
@@ -137,27 +151,27 @@ static struct among a_4[7] =
|
|
137
151
|
/* 6 */ { 4, s_4_6, -1, 3, 0}
|
138
152
|
};
|
139
153
|
|
140
|
-
static symbol s_5_0[2] = { 'i', 'c' };
|
141
|
-
static symbol s_5_1[4] = { 'a', 'n', 'c', 'e' };
|
142
|
-
static symbol s_5_2[4] = { 'e', 'n', 'c', 'e' };
|
143
|
-
static symbol s_5_3[4] = { 'a', 'b', 'l', 'e' };
|
144
|
-
static symbol s_5_4[4] = { 'i', 'b', 'l', 'e' };
|
145
|
-
static symbol s_5_5[3] = { 'a', 't', 'e' };
|
146
|
-
static symbol s_5_6[3] = { 'i', 'v', 'e' };
|
147
|
-
static symbol s_5_7[3] = { 'i', 'z', 'e' };
|
148
|
-
static symbol s_5_8[3] = { 'i', 't', 'i' };
|
149
|
-
static symbol s_5_9[2] = { 'a', 'l' };
|
150
|
-
static symbol s_5_10[3] = { 'i', 's', 'm' };
|
151
|
-
static symbol s_5_11[3] = { 'i', 'o', 'n' };
|
152
|
-
static symbol s_5_12[2] = { 'e', 'r' };
|
153
|
-
static symbol s_5_13[3] = { 'o', 'u', 's' };
|
154
|
-
static symbol s_5_14[3] = { 'a', 'n', 't' };
|
155
|
-
static symbol s_5_15[3] = { 'e', 'n', 't' };
|
156
|
-
static symbol s_5_16[4] = { 'm', 'e', 'n', 't' };
|
157
|
-
static symbol s_5_17[5] = { 'e', 'm', 'e', 'n', 't' };
|
158
|
-
static symbol s_5_18[2] = { 'o', 'u' };
|
159
|
-
|
160
|
-
static struct among a_5[19] =
|
154
|
+
static const symbol s_5_0[2] = { 'i', 'c' };
|
155
|
+
static const symbol s_5_1[4] = { 'a', 'n', 'c', 'e' };
|
156
|
+
static const symbol s_5_2[4] = { 'e', 'n', 'c', 'e' };
|
157
|
+
static const symbol s_5_3[4] = { 'a', 'b', 'l', 'e' };
|
158
|
+
static const symbol s_5_4[4] = { 'i', 'b', 'l', 'e' };
|
159
|
+
static const symbol s_5_5[3] = { 'a', 't', 'e' };
|
160
|
+
static const symbol s_5_6[3] = { 'i', 'v', 'e' };
|
161
|
+
static const symbol s_5_7[3] = { 'i', 'z', 'e' };
|
162
|
+
static const symbol s_5_8[3] = { 'i', 't', 'i' };
|
163
|
+
static const symbol s_5_9[2] = { 'a', 'l' };
|
164
|
+
static const symbol s_5_10[3] = { 'i', 's', 'm' };
|
165
|
+
static const symbol s_5_11[3] = { 'i', 'o', 'n' };
|
166
|
+
static const symbol s_5_12[2] = { 'e', 'r' };
|
167
|
+
static const symbol s_5_13[3] = { 'o', 'u', 's' };
|
168
|
+
static const symbol s_5_14[3] = { 'a', 'n', 't' };
|
169
|
+
static const symbol s_5_15[3] = { 'e', 'n', 't' };
|
170
|
+
static const symbol s_5_16[4] = { 'm', 'e', 'n', 't' };
|
171
|
+
static const symbol s_5_17[5] = { 'e', 'm', 'e', 'n', 't' };
|
172
|
+
static const symbol s_5_18[2] = { 'o', 'u' };
|
173
|
+
|
174
|
+
static const struct among a_5[19] =
|
161
175
|
{
|
162
176
|
/* 0 */ { 2, s_5_0, -1, 1, 0},
|
163
177
|
/* 1 */ { 4, s_5_1, -1, 1, 0},
|
@@ -180,50 +194,50 @@ static struct among a_5[19] =
|
|
180
194
|
/* 18 */ { 2, s_5_18, -1, 1, 0}
|
181
195
|
};
|
182
196
|
|
183
|
-
static unsigned char g_v[] = { 17, 65, 16, 1 };
|
184
|
-
|
185
|
-
static unsigned char g_v_WXY[] = { 1, 17, 65, 208, 1 };
|
186
|
-
|
187
|
-
static symbol s_0[] = { 's', 's' };
|
188
|
-
static symbol s_1[] = { 'i' };
|
189
|
-
static symbol s_2[] = { 'e', 'e' };
|
190
|
-
static symbol s_3[] = { 'e' };
|
191
|
-
static symbol s_4[] = { 'e' };
|
192
|
-
static symbol s_5[] = { 'y' };
|
193
|
-
static symbol s_6[] = { 'Y' };
|
194
|
-
static symbol s_7[] = { 'i' };
|
195
|
-
static symbol s_8[] = { 't', 'i', 'o', 'n' };
|
196
|
-
static symbol s_9[] = { 'e', 'n', 'c', 'e' };
|
197
|
-
static symbol s_10[] = { 'a', 'n', 'c', 'e' };
|
198
|
-
static symbol s_11[] = { 'a', 'b', 'l', 'e' };
|
199
|
-
static symbol s_12[] = { 'e', 'n', 't' };
|
200
|
-
static symbol s_13[] = { 'e' };
|
201
|
-
static symbol s_14[] = { 'i', 'z', 'e' };
|
202
|
-
static symbol s_15[] = { 'a', 't', 'e' };
|
203
|
-
static symbol s_16[] = { 'a', 'l' };
|
204
|
-
static symbol s_17[] = { 'a', 'l' };
|
205
|
-
static symbol s_18[] = { 'f', 'u', 'l' };
|
206
|
-
static symbol s_19[] = { 'o', 'u', 's' };
|
207
|
-
static symbol s_20[] = { 'i', 'v', 'e' };
|
208
|
-
static symbol s_21[] = { 'b', 'l', 'e' };
|
209
|
-
static symbol s_22[] = { 'a', 'l' };
|
210
|
-
static symbol s_23[] = { 'i', 'c' };
|
211
|
-
static symbol s_24[] = { 's' };
|
212
|
-
static symbol s_25[] = { 't' };
|
213
|
-
static symbol s_26[] = { 'e' };
|
214
|
-
static symbol s_27[] = { 'l' };
|
215
|
-
static symbol s_28[] = { 'l' };
|
216
|
-
static symbol s_29[] = { 'y' };
|
217
|
-
static symbol s_30[] = { 'Y' };
|
218
|
-
static symbol s_31[] = { 'y' };
|
219
|
-
static symbol s_32[] = { 'Y' };
|
220
|
-
static symbol s_33[] = { 'Y' };
|
221
|
-
static symbol s_34[] = { 'y' };
|
197
|
+
static const unsigned char g_v[] = { 17, 65, 16, 1 };
|
198
|
+
|
199
|
+
static const unsigned char g_v_WXY[] = { 1, 17, 65, 208, 1 };
|
200
|
+
|
201
|
+
static const symbol s_0[] = { 's', 's' };
|
202
|
+
static const symbol s_1[] = { 'i' };
|
203
|
+
static const symbol s_2[] = { 'e', 'e' };
|
204
|
+
static const symbol s_3[] = { 'e' };
|
205
|
+
static const symbol s_4[] = { 'e' };
|
206
|
+
static const symbol s_5[] = { 'y' };
|
207
|
+
static const symbol s_6[] = { 'Y' };
|
208
|
+
static const symbol s_7[] = { 'i' };
|
209
|
+
static const symbol s_8[] = { 't', 'i', 'o', 'n' };
|
210
|
+
static const symbol s_9[] = { 'e', 'n', 'c', 'e' };
|
211
|
+
static const symbol s_10[] = { 'a', 'n', 'c', 'e' };
|
212
|
+
static const symbol s_11[] = { 'a', 'b', 'l', 'e' };
|
213
|
+
static const symbol s_12[] = { 'e', 'n', 't' };
|
214
|
+
static const symbol s_13[] = { 'e' };
|
215
|
+
static const symbol s_14[] = { 'i', 'z', 'e' };
|
216
|
+
static const symbol s_15[] = { 'a', 't', 'e' };
|
217
|
+
static const symbol s_16[] = { 'a', 'l' };
|
218
|
+
static const symbol s_17[] = { 'a', 'l' };
|
219
|
+
static const symbol s_18[] = { 'f', 'u', 'l' };
|
220
|
+
static const symbol s_19[] = { 'o', 'u', 's' };
|
221
|
+
static const symbol s_20[] = { 'i', 'v', 'e' };
|
222
|
+
static const symbol s_21[] = { 'b', 'l', 'e' };
|
223
|
+
static const symbol s_22[] = { 'a', 'l' };
|
224
|
+
static const symbol s_23[] = { 'i', 'c' };
|
225
|
+
static const symbol s_24[] = { 's' };
|
226
|
+
static const symbol s_25[] = { 't' };
|
227
|
+
static const symbol s_26[] = { 'e' };
|
228
|
+
static const symbol s_27[] = { 'l' };
|
229
|
+
static const symbol s_28[] = { 'l' };
|
230
|
+
static const symbol s_29[] = { 'y' };
|
231
|
+
static const symbol s_30[] = { 'Y' };
|
232
|
+
static const symbol s_31[] = { 'y' };
|
233
|
+
static const symbol s_32[] = { 'Y' };
|
234
|
+
static const symbol s_33[] = { 'Y' };
|
235
|
+
static const symbol s_34[] = { 'y' };
|
222
236
|
|
223
237
|
static int r_shortv(struct SN_env * z) {
|
224
|
-
if (
|
225
|
-
if (
|
226
|
-
if (
|
238
|
+
if (out_grouping_b_U(z, g_v_WXY, 89, 121, 0)) return 0;
|
239
|
+
if (in_grouping_b_U(z, g_v, 97, 121, 0)) return 0;
|
240
|
+
if (out_grouping_b_U(z, g_v, 97, 121, 0)) return 0;
|
227
241
|
return 1;
|
228
242
|
}
|
229
243
|
|
@@ -240,26 +254,24 @@ static int r_R2(struct SN_env * z) {
|
|
240
254
|
static int r_Step_1a(struct SN_env * z) {
|
241
255
|
int among_var;
|
242
256
|
z->ket = z->c; /* [, line 25 */
|
257
|
+
if (z->c <= z->lb || z->p[z->c - 1] != 115) return 0;
|
243
258
|
among_var = find_among_b(z, a_0, 4); /* substring, line 25 */
|
244
259
|
if (!(among_var)) return 0;
|
245
260
|
z->bra = z->c; /* ], line 25 */
|
246
261
|
switch(among_var) {
|
247
262
|
case 0: return 0;
|
248
263
|
case 1:
|
249
|
-
{ int ret;
|
250
|
-
ret = slice_from_s(z, 2, s_0); /* <-, line 26 */
|
264
|
+
{ int ret = slice_from_s(z, 2, s_0); /* <-, line 26 */
|
251
265
|
if (ret < 0) return ret;
|
252
266
|
}
|
253
267
|
break;
|
254
268
|
case 2:
|
255
|
-
{ int ret;
|
256
|
-
ret = slice_from_s(z, 1, s_1); /* <-, line 27 */
|
269
|
+
{ int ret = slice_from_s(z, 1, s_1); /* <-, line 27 */
|
257
270
|
if (ret < 0) return ret;
|
258
271
|
}
|
259
272
|
break;
|
260
273
|
case 3:
|
261
|
-
{ int ret;
|
262
|
-
ret = slice_del(z); /* delete, line 29 */
|
274
|
+
{ int ret = slice_del(z); /* delete, line 29 */
|
263
275
|
if (ret < 0) return ret;
|
264
276
|
}
|
265
277
|
break;
|
@@ -270,6 +282,7 @@ static int r_Step_1a(struct SN_env * z) {
|
|
270
282
|
static int r_Step_1b(struct SN_env * z) {
|
271
283
|
int among_var;
|
272
284
|
z->ket = z->c; /* [, line 34 */
|
285
|
+
if (z->c - 1 <= z->lb || (z->p[z->c - 1] != 100 && z->p[z->c - 1] != 103)) return 0;
|
273
286
|
among_var = find_among_b(z, a_2, 3); /* substring, line 34 */
|
274
287
|
if (!(among_var)) return 0;
|
275
288
|
z->bra = z->c; /* ], line 34 */
|
@@ -280,29 +293,24 @@ static int r_Step_1b(struct SN_env * z) {
|
|
280
293
|
if (ret == 0) return 0; /* call R1, line 35 */
|
281
294
|
if (ret < 0) return ret;
|
282
295
|
}
|
283
|
-
{ int ret;
|
284
|
-
ret = slice_from_s(z, 2, s_2); /* <-, line 35 */
|
296
|
+
{ int ret = slice_from_s(z, 2, s_2); /* <-, line 35 */
|
285
297
|
if (ret < 0) return ret;
|
286
298
|
}
|
287
299
|
break;
|
288
300
|
case 2:
|
289
301
|
{ int m_test = z->l - z->c; /* test, line 38 */
|
290
|
-
|
291
|
-
|
292
|
-
|
293
|
-
|
294
|
-
{ int c = skip_utf8(z->p, z->c, z->lb, 0, -1);
|
295
|
-
if (c < 0) return 0;
|
296
|
-
z->c = c; /* gopast, line 38 */
|
297
|
-
}
|
302
|
+
{ /* gopast */ /* grouping v, line 38 */
|
303
|
+
int ret = out_grouping_b_U(z, g_v, 97, 121, 1);
|
304
|
+
if (ret < 0) return 0;
|
305
|
+
z->c -= ret;
|
298
306
|
}
|
299
307
|
z->c = z->l - m_test;
|
300
308
|
}
|
301
|
-
{ int ret;
|
302
|
-
ret = slice_del(z); /* delete, line 38 */
|
309
|
+
{ int ret = slice_del(z); /* delete, line 38 */
|
303
310
|
if (ret < 0) return ret;
|
304
311
|
}
|
305
312
|
{ int m_test = z->l - z->c; /* test, line 39 */
|
313
|
+
if (z->c - 1 <= z->lb || z->p[z->c - 1] >> 5 != 3 || !((68514004 >> (z->p[z->c - 1] & 0x1f)) & 1)) among_var = 3; else
|
306
314
|
among_var = find_among_b(z, a_1, 13); /* substring, line 39 */
|
307
315
|
if (!(among_var)) return 0;
|
308
316
|
z->c = z->l - m_test;
|
@@ -310,23 +318,20 @@ static int r_Step_1b(struct SN_env * z) {
|
|
310
318
|
switch(among_var) {
|
311
319
|
case 0: return 0;
|
312
320
|
case 1:
|
313
|
-
{ int
|
314
|
-
|
315
|
-
|
316
|
-
z->c = c;
|
317
|
-
}
|
321
|
+
{ int c_keep = z->c;
|
322
|
+
int ret = insert_s(z, z->c, z->c, 1, s_3); /* <+, line 41 */
|
323
|
+
z->c = c_keep;
|
318
324
|
if (ret < 0) return ret;
|
319
325
|
}
|
320
326
|
break;
|
321
327
|
case 2:
|
322
328
|
z->ket = z->c; /* [, line 44 */
|
323
|
-
{ int
|
324
|
-
if (
|
325
|
-
z->c =
|
329
|
+
{ int ret = skip_utf8(z->p, z->c, z->lb, 0, -1);
|
330
|
+
if (ret < 0) return 0;
|
331
|
+
z->c = ret; /* next, line 44 */
|
326
332
|
}
|
327
333
|
z->bra = z->c; /* ], line 44 */
|
328
|
-
{ int ret;
|
329
|
-
ret = slice_del(z); /* delete, line 44 */
|
334
|
+
{ int ret = slice_del(z); /* delete, line 44 */
|
330
335
|
if (ret < 0) return ret;
|
331
336
|
}
|
332
337
|
break;
|
@@ -339,11 +344,9 @@ static int r_Step_1b(struct SN_env * z) {
|
|
339
344
|
}
|
340
345
|
z->c = z->l - m_test;
|
341
346
|
}
|
342
|
-
{ int
|
343
|
-
|
344
|
-
|
345
|
-
z->c = c;
|
346
|
-
}
|
347
|
+
{ int c_keep = z->c;
|
348
|
+
int ret = insert_s(z, z->c, z->c, 1, s_4); /* <+, line 45 */
|
349
|
+
z->c = c_keep;
|
347
350
|
if (ret < 0) return ret;
|
348
351
|
}
|
349
352
|
break;
|
@@ -355,26 +358,21 @@ static int r_Step_1b(struct SN_env * z) {
|
|
355
358
|
|
356
359
|
static int r_Step_1c(struct SN_env * z) {
|
357
360
|
z->ket = z->c; /* [, line 52 */
|
358
|
-
{ int
|
361
|
+
{ int m1 = z->l - z->c; (void)m1; /* or, line 52 */
|
359
362
|
if (!(eq_s_b(z, 1, s_5))) goto lab1;
|
360
363
|
goto lab0;
|
361
364
|
lab1:
|
362
|
-
z->c = z->l -
|
365
|
+
z->c = z->l - m1;
|
363
366
|
if (!(eq_s_b(z, 1, s_6))) return 0;
|
364
367
|
}
|
365
368
|
lab0:
|
366
369
|
z->bra = z->c; /* ], line 52 */
|
367
|
-
|
368
|
-
|
369
|
-
|
370
|
-
|
371
|
-
{ int c = skip_utf8(z->p, z->c, z->lb, 0, -1);
|
372
|
-
if (c < 0) return 0;
|
373
|
-
z->c = c; /* gopast, line 53 */
|
374
|
-
}
|
370
|
+
{ /* gopast */ /* grouping v, line 53 */
|
371
|
+
int ret = out_grouping_b_U(z, g_v, 97, 121, 1);
|
372
|
+
if (ret < 0) return 0;
|
373
|
+
z->c -= ret;
|
375
374
|
}
|
376
|
-
{ int ret;
|
377
|
-
ret = slice_from_s(z, 1, s_7); /* <-, line 54 */
|
375
|
+
{ int ret = slice_from_s(z, 1, s_7); /* <-, line 54 */
|
378
376
|
if (ret < 0) return ret;
|
379
377
|
}
|
380
378
|
return 1;
|
@@ -383,6 +381,7 @@ lab0:
|
|
383
381
|
static int r_Step_2(struct SN_env * z) {
|
384
382
|
int among_var;
|
385
383
|
z->ket = z->c; /* [, line 58 */
|
384
|
+
if (z->c - 2 <= z->lb || z->p[z->c - 1] >> 5 != 3 || !((815616 >> (z->p[z->c - 1] & 0x1f)) & 1)) return 0;
|
386
385
|
among_var = find_among_b(z, a_3, 20); /* substring, line 58 */
|
387
386
|
if (!(among_var)) return 0;
|
388
387
|
z->bra = z->c; /* ], line 58 */
|
@@ -393,86 +392,72 @@ static int r_Step_2(struct SN_env * z) {
|
|
393
392
|
switch(among_var) {
|
394
393
|
case 0: return 0;
|
395
394
|
case 1:
|
396
|
-
{ int ret;
|
397
|
-
ret = slice_from_s(z, 4, s_8); /* <-, line 59 */
|
395
|
+
{ int ret = slice_from_s(z, 4, s_8); /* <-, line 59 */
|
398
396
|
if (ret < 0) return ret;
|
399
397
|
}
|
400
398
|
break;
|
401
399
|
case 2:
|
402
|
-
{ int ret;
|
403
|
-
ret = slice_from_s(z, 4, s_9); /* <-, line 60 */
|
400
|
+
{ int ret = slice_from_s(z, 4, s_9); /* <-, line 60 */
|
404
401
|
if (ret < 0) return ret;
|
405
402
|
}
|
406
403
|
break;
|
407
404
|
case 3:
|
408
|
-
{ int ret;
|
409
|
-
ret = slice_from_s(z, 4, s_10); /* <-, line 61 */
|
405
|
+
{ int ret = slice_from_s(z, 4, s_10); /* <-, line 61 */
|
410
406
|
if (ret < 0) return ret;
|
411
407
|
}
|
412
408
|
break;
|
413
409
|
case 4:
|
414
|
-
{ int ret;
|
415
|
-
ret = slice_from_s(z, 4, s_11); /* <-, line 62 */
|
410
|
+
{ int ret = slice_from_s(z, 4, s_11); /* <-, line 62 */
|
416
411
|
if (ret < 0) return ret;
|
417
412
|
}
|
418
413
|
break;
|
419
414
|
case 5:
|
420
|
-
{ int ret;
|
421
|
-
ret = slice_from_s(z, 3, s_12); /* <-, line 63 */
|
415
|
+
{ int ret = slice_from_s(z, 3, s_12); /* <-, line 63 */
|
422
416
|
if (ret < 0) return ret;
|
423
417
|
}
|
424
418
|
break;
|
425
419
|
case 6:
|
426
|
-
{ int ret;
|
427
|
-
ret = slice_from_s(z, 1, s_13); /* <-, line 64 */
|
420
|
+
{ int ret = slice_from_s(z, 1, s_13); /* <-, line 64 */
|
428
421
|
if (ret < 0) return ret;
|
429
422
|
}
|
430
423
|
break;
|
431
424
|
case 7:
|
432
|
-
{ int ret;
|
433
|
-
ret = slice_from_s(z, 3, s_14); /* <-, line 66 */
|
425
|
+
{ int ret = slice_from_s(z, 3, s_14); /* <-, line 66 */
|
434
426
|
if (ret < 0) return ret;
|
435
427
|
}
|
436
428
|
break;
|
437
429
|
case 8:
|
438
|
-
{ int ret;
|
439
|
-
ret = slice_from_s(z, 3, s_15); /* <-, line 68 */
|
430
|
+
{ int ret = slice_from_s(z, 3, s_15); /* <-, line 68 */
|
440
431
|
if (ret < 0) return ret;
|
441
432
|
}
|
442
433
|
break;
|
443
434
|
case 9:
|
444
|
-
{ int ret;
|
445
|
-
ret = slice_from_s(z, 2, s_16); /* <-, line 69 */
|
435
|
+
{ int ret = slice_from_s(z, 2, s_16); /* <-, line 69 */
|
446
436
|
if (ret < 0) return ret;
|
447
437
|
}
|
448
438
|
break;
|
449
439
|
case 10:
|
450
|
-
{ int ret;
|
451
|
-
ret = slice_from_s(z, 2, s_17); /* <-, line 71 */
|
440
|
+
{ int ret = slice_from_s(z, 2, s_17); /* <-, line 71 */
|
452
441
|
if (ret < 0) return ret;
|
453
442
|
}
|
454
443
|
break;
|
455
444
|
case 11:
|
456
|
-
{ int ret;
|
457
|
-
ret = slice_from_s(z, 3, s_18); /* <-, line 72 */
|
445
|
+
{ int ret = slice_from_s(z, 3, s_18); /* <-, line 72 */
|
458
446
|
if (ret < 0) return ret;
|
459
447
|
}
|
460
448
|
break;
|
461
449
|
case 12:
|
462
|
-
{ int ret;
|
463
|
-
ret = slice_from_s(z, 3, s_19); /* <-, line 74 */
|
450
|
+
{ int ret = slice_from_s(z, 3, s_19); /* <-, line 74 */
|
464
451
|
if (ret < 0) return ret;
|
465
452
|
}
|
466
453
|
break;
|
467
454
|
case 13:
|
468
|
-
{ int ret;
|
469
|
-
ret = slice_from_s(z, 3, s_20); /* <-, line 76 */
|
455
|
+
{ int ret = slice_from_s(z, 3, s_20); /* <-, line 76 */
|
470
456
|
if (ret < 0) return ret;
|
471
457
|
}
|
472
458
|
break;
|
473
459
|
case 14:
|
474
|
-
{ int ret;
|
475
|
-
ret = slice_from_s(z, 3, s_21); /* <-, line 77 */
|
460
|
+
{ int ret = slice_from_s(z, 3, s_21); /* <-, line 77 */
|
476
461
|
if (ret < 0) return ret;
|
477
462
|
}
|
478
463
|
break;
|
@@ -483,6 +468,7 @@ static int r_Step_2(struct SN_env * z) {
|
|
483
468
|
static int r_Step_3(struct SN_env * z) {
|
484
469
|
int among_var;
|
485
470
|
z->ket = z->c; /* [, line 82 */
|
471
|
+
if (z->c - 2 <= z->lb || z->p[z->c - 1] >> 5 != 3 || !((528928 >> (z->p[z->c - 1] & 0x1f)) & 1)) return 0;
|
486
472
|
among_var = find_among_b(z, a_4, 7); /* substring, line 82 */
|
487
473
|
if (!(among_var)) return 0;
|
488
474
|
z->bra = z->c; /* ], line 82 */
|
@@ -493,20 +479,17 @@ static int r_Step_3(struct SN_env * z) {
|
|
493
479
|
switch(among_var) {
|
494
480
|
case 0: return 0;
|
495
481
|
case 1:
|
496
|
-
{ int ret;
|
497
|
-
ret = slice_from_s(z, 2, s_22); /* <-, line 83 */
|
482
|
+
{ int ret = slice_from_s(z, 2, s_22); /* <-, line 83 */
|
498
483
|
if (ret < 0) return ret;
|
499
484
|
}
|
500
485
|
break;
|
501
486
|
case 2:
|
502
|
-
{ int ret;
|
503
|
-
ret = slice_from_s(z, 2, s_23); /* <-, line 85 */
|
487
|
+
{ int ret = slice_from_s(z, 2, s_23); /* <-, line 85 */
|
504
488
|
if (ret < 0) return ret;
|
505
489
|
}
|
506
490
|
break;
|
507
491
|
case 3:
|
508
|
-
{ int ret;
|
509
|
-
ret = slice_del(z); /* delete, line 87 */
|
492
|
+
{ int ret = slice_del(z); /* delete, line 87 */
|
510
493
|
if (ret < 0) return ret;
|
511
494
|
}
|
512
495
|
break;
|
@@ -517,6 +500,7 @@ static int r_Step_3(struct SN_env * z) {
|
|
517
500
|
static int r_Step_4(struct SN_env * z) {
|
518
501
|
int among_var;
|
519
502
|
z->ket = z->c; /* [, line 92 */
|
503
|
+
if (z->c - 1 <= z->lb || z->p[z->c - 1] >> 5 != 3 || !((3961384 >> (z->p[z->c - 1] & 0x1f)) & 1)) return 0;
|
520
504
|
among_var = find_among_b(z, a_5, 19); /* substring, line 92 */
|
521
505
|
if (!(among_var)) return 0;
|
522
506
|
z->bra = z->c; /* ], line 92 */
|
@@ -527,22 +511,20 @@ static int r_Step_4(struct SN_env * z) {
|
|
527
511
|
switch(among_var) {
|
528
512
|
case 0: return 0;
|
529
513
|
case 1:
|
530
|
-
{ int ret;
|
531
|
-
ret = slice_del(z); /* delete, line 95 */
|
514
|
+
{ int ret = slice_del(z); /* delete, line 95 */
|
532
515
|
if (ret < 0) return ret;
|
533
516
|
}
|
534
517
|
break;
|
535
518
|
case 2:
|
536
|
-
{ int
|
519
|
+
{ int m1 = z->l - z->c; (void)m1; /* or, line 96 */
|
537
520
|
if (!(eq_s_b(z, 1, s_24))) goto lab1;
|
538
521
|
goto lab0;
|
539
522
|
lab1:
|
540
|
-
z->c = z->l -
|
523
|
+
z->c = z->l - m1;
|
541
524
|
if (!(eq_s_b(z, 1, s_25))) return 0;
|
542
525
|
}
|
543
526
|
lab0:
|
544
|
-
{ int ret;
|
545
|
-
ret = slice_del(z); /* delete, line 96 */
|
527
|
+
{ int ret = slice_del(z); /* delete, line 96 */
|
546
528
|
if (ret < 0) return ret;
|
547
529
|
}
|
548
530
|
break;
|
@@ -554,31 +536,30 @@ static int r_Step_5a(struct SN_env * z) {
|
|
554
536
|
z->ket = z->c; /* [, line 101 */
|
555
537
|
if (!(eq_s_b(z, 1, s_26))) return 0;
|
556
538
|
z->bra = z->c; /* ], line 101 */
|
557
|
-
{ int
|
539
|
+
{ int m1 = z->l - z->c; (void)m1; /* or, line 102 */
|
558
540
|
{ int ret = r_R2(z);
|
559
541
|
if (ret == 0) goto lab1; /* call R2, line 102 */
|
560
542
|
if (ret < 0) return ret;
|
561
543
|
}
|
562
544
|
goto lab0;
|
563
545
|
lab1:
|
564
|
-
z->c = z->l -
|
546
|
+
z->c = z->l - m1;
|
565
547
|
{ int ret = r_R1(z);
|
566
548
|
if (ret == 0) return 0; /* call R1, line 102 */
|
567
549
|
if (ret < 0) return ret;
|
568
550
|
}
|
569
|
-
{ int
|
551
|
+
{ int m2 = z->l - z->c; (void)m2; /* not, line 102 */
|
570
552
|
{ int ret = r_shortv(z);
|
571
553
|
if (ret == 0) goto lab2; /* call shortv, line 102 */
|
572
554
|
if (ret < 0) return ret;
|
573
555
|
}
|
574
556
|
return 0;
|
575
557
|
lab2:
|
576
|
-
z->c = z->l -
|
558
|
+
z->c = z->l - m2;
|
577
559
|
}
|
578
560
|
}
|
579
561
|
lab0:
|
580
|
-
{ int ret;
|
581
|
-
ret = slice_del(z); /* delete, line 103 */
|
562
|
+
{ int ret = slice_del(z); /* delete, line 103 */
|
582
563
|
if (ret < 0) return ret;
|
583
564
|
}
|
584
565
|
return 1;
|
@@ -593,8 +574,7 @@ static int r_Step_5b(struct SN_env * z) {
|
|
593
574
|
if (ret < 0) return ret;
|
594
575
|
}
|
595
576
|
if (!(eq_s_b(z, 1, s_28))) return 0;
|
596
|
-
{ int ret;
|
597
|
-
ret = slice_del(z); /* delete, line 109 */
|
577
|
+
{ int ret = slice_del(z); /* delete, line 109 */
|
598
578
|
if (ret < 0) return ret;
|
599
579
|
}
|
600
580
|
return 1;
|
@@ -602,193 +582,174 @@ static int r_Step_5b(struct SN_env * z) {
|
|
602
582
|
|
603
583
|
extern int porter_UTF_8_stem(struct SN_env * z) {
|
604
584
|
z->B[0] = 0; /* unset Y_found, line 115 */
|
605
|
-
{ int
|
585
|
+
{ int c1 = z->c; /* do, line 116 */
|
606
586
|
z->bra = z->c; /* [, line 116 */
|
607
587
|
if (!(eq_s(z, 1, s_29))) goto lab0;
|
608
588
|
z->ket = z->c; /* ], line 116 */
|
609
|
-
{ int ret;
|
610
|
-
ret = slice_from_s(z, 1, s_30); /* <-, line 116 */
|
589
|
+
{ int ret = slice_from_s(z, 1, s_30); /* <-, line 116 */
|
611
590
|
if (ret < 0) return ret;
|
612
591
|
}
|
613
592
|
z->B[0] = 1; /* set Y_found, line 116 */
|
614
593
|
lab0:
|
615
|
-
z->c =
|
594
|
+
z->c = c1;
|
616
595
|
}
|
617
|
-
{ int
|
596
|
+
{ int c2 = z->c; /* do, line 117 */
|
618
597
|
while(1) { /* repeat, line 117 */
|
619
|
-
int
|
598
|
+
int c3 = z->c;
|
620
599
|
while(1) { /* goto, line 117 */
|
621
|
-
int
|
622
|
-
if (
|
600
|
+
int c4 = z->c;
|
601
|
+
if (in_grouping_U(z, g_v, 97, 121, 0)) goto lab3;
|
623
602
|
z->bra = z->c; /* [, line 117 */
|
624
603
|
if (!(eq_s(z, 1, s_31))) goto lab3;
|
625
604
|
z->ket = z->c; /* ], line 117 */
|
626
|
-
z->c =
|
605
|
+
z->c = c4;
|
627
606
|
break;
|
628
607
|
lab3:
|
629
|
-
z->c =
|
630
|
-
{ int
|
631
|
-
if (
|
632
|
-
z->c =
|
608
|
+
z->c = c4;
|
609
|
+
{ int ret = skip_utf8(z->p, z->c, 0, z->l, 1);
|
610
|
+
if (ret < 0) goto lab2;
|
611
|
+
z->c = ret; /* goto, line 117 */
|
633
612
|
}
|
634
613
|
}
|
635
|
-
{ int ret;
|
636
|
-
ret = slice_from_s(z, 1, s_32); /* <-, line 117 */
|
614
|
+
{ int ret = slice_from_s(z, 1, s_32); /* <-, line 117 */
|
637
615
|
if (ret < 0) return ret;
|
638
616
|
}
|
639
617
|
z->B[0] = 1; /* set Y_found, line 117 */
|
640
618
|
continue;
|
641
619
|
lab2:
|
642
|
-
z->c =
|
620
|
+
z->c = c3;
|
643
621
|
break;
|
644
622
|
}
|
645
|
-
z->c =
|
623
|
+
z->c = c2;
|
646
624
|
}
|
647
625
|
z->I[0] = z->l;
|
648
626
|
z->I[1] = z->l;
|
649
|
-
{ int
|
650
|
-
|
651
|
-
|
652
|
-
|
653
|
-
|
654
|
-
{ int c = skip_utf8(z->p, z->c, 0, z->l, 1);
|
655
|
-
if (c < 0) goto lab4;
|
656
|
-
z->c = c; /* gopast, line 122 */
|
657
|
-
}
|
627
|
+
{ int c5 = z->c; /* do, line 121 */
|
628
|
+
{ /* gopast */ /* grouping v, line 122 */
|
629
|
+
int ret = out_grouping_U(z, g_v, 97, 121, 1);
|
630
|
+
if (ret < 0) goto lab4;
|
631
|
+
z->c += ret;
|
658
632
|
}
|
659
|
-
|
660
|
-
|
661
|
-
|
662
|
-
|
663
|
-
{ int c = skip_utf8(z->p, z->c, 0, z->l, 1);
|
664
|
-
if (c < 0) goto lab4;
|
665
|
-
z->c = c; /* gopast, line 122 */
|
666
|
-
}
|
633
|
+
{ /* gopast */ /* non v, line 122 */
|
634
|
+
int ret = in_grouping_U(z, g_v, 97, 121, 1);
|
635
|
+
if (ret < 0) goto lab4;
|
636
|
+
z->c += ret;
|
667
637
|
}
|
668
638
|
z->I[0] = z->c; /* setmark p1, line 122 */
|
669
|
-
|
670
|
-
|
671
|
-
|
672
|
-
|
673
|
-
{ int c = skip_utf8(z->p, z->c, 0, z->l, 1);
|
674
|
-
if (c < 0) goto lab4;
|
675
|
-
z->c = c; /* gopast, line 123 */
|
676
|
-
}
|
639
|
+
{ /* gopast */ /* grouping v, line 123 */
|
640
|
+
int ret = out_grouping_U(z, g_v, 97, 121, 1);
|
641
|
+
if (ret < 0) goto lab4;
|
642
|
+
z->c += ret;
|
677
643
|
}
|
678
|
-
|
679
|
-
|
680
|
-
|
681
|
-
|
682
|
-
{ int c = skip_utf8(z->p, z->c, 0, z->l, 1);
|
683
|
-
if (c < 0) goto lab4;
|
684
|
-
z->c = c; /* gopast, line 123 */
|
685
|
-
}
|
644
|
+
{ /* gopast */ /* non v, line 123 */
|
645
|
+
int ret = in_grouping_U(z, g_v, 97, 121, 1);
|
646
|
+
if (ret < 0) goto lab4;
|
647
|
+
z->c += ret;
|
686
648
|
}
|
687
649
|
z->I[1] = z->c; /* setmark p2, line 123 */
|
688
650
|
lab4:
|
689
|
-
z->c =
|
651
|
+
z->c = c5;
|
690
652
|
}
|
691
653
|
z->lb = z->c; z->c = z->l; /* backwards, line 126 */
|
692
654
|
|
693
|
-
{ int
|
655
|
+
{ int m6 = z->l - z->c; (void)m6; /* do, line 127 */
|
694
656
|
{ int ret = r_Step_1a(z);
|
695
|
-
if (ret == 0) goto
|
657
|
+
if (ret == 0) goto lab5; /* call Step_1a, line 127 */
|
696
658
|
if (ret < 0) return ret;
|
697
659
|
}
|
698
|
-
|
699
|
-
z->c = z->l -
|
660
|
+
lab5:
|
661
|
+
z->c = z->l - m6;
|
700
662
|
}
|
701
|
-
{ int
|
663
|
+
{ int m7 = z->l - z->c; (void)m7; /* do, line 128 */
|
702
664
|
{ int ret = r_Step_1b(z);
|
703
|
-
if (ret == 0) goto
|
665
|
+
if (ret == 0) goto lab6; /* call Step_1b, line 128 */
|
704
666
|
if (ret < 0) return ret;
|
705
667
|
}
|
706
|
-
|
707
|
-
z->c = z->l -
|
668
|
+
lab6:
|
669
|
+
z->c = z->l - m7;
|
708
670
|
}
|
709
|
-
{ int
|
671
|
+
{ int m8 = z->l - z->c; (void)m8; /* do, line 129 */
|
710
672
|
{ int ret = r_Step_1c(z);
|
711
|
-
if (ret == 0) goto
|
673
|
+
if (ret == 0) goto lab7; /* call Step_1c, line 129 */
|
712
674
|
if (ret < 0) return ret;
|
713
675
|
}
|
714
|
-
|
715
|
-
z->c = z->l -
|
676
|
+
lab7:
|
677
|
+
z->c = z->l - m8;
|
716
678
|
}
|
717
|
-
{ int
|
679
|
+
{ int m9 = z->l - z->c; (void)m9; /* do, line 130 */
|
718
680
|
{ int ret = r_Step_2(z);
|
719
|
-
if (ret == 0) goto
|
681
|
+
if (ret == 0) goto lab8; /* call Step_2, line 130 */
|
720
682
|
if (ret < 0) return ret;
|
721
683
|
}
|
722
|
-
|
723
|
-
z->c = z->l -
|
684
|
+
lab8:
|
685
|
+
z->c = z->l - m9;
|
724
686
|
}
|
725
|
-
{ int
|
687
|
+
{ int m10 = z->l - z->c; (void)m10; /* do, line 131 */
|
726
688
|
{ int ret = r_Step_3(z);
|
727
|
-
if (ret == 0) goto
|
689
|
+
if (ret == 0) goto lab9; /* call Step_3, line 131 */
|
728
690
|
if (ret < 0) return ret;
|
729
691
|
}
|
730
|
-
|
731
|
-
z->c = z->l -
|
692
|
+
lab9:
|
693
|
+
z->c = z->l - m10;
|
732
694
|
}
|
733
|
-
{ int
|
695
|
+
{ int m11 = z->l - z->c; (void)m11; /* do, line 132 */
|
734
696
|
{ int ret = r_Step_4(z);
|
735
|
-
if (ret == 0) goto
|
697
|
+
if (ret == 0) goto lab10; /* call Step_4, line 132 */
|
736
698
|
if (ret < 0) return ret;
|
737
699
|
}
|
738
|
-
|
739
|
-
z->c = z->l -
|
700
|
+
lab10:
|
701
|
+
z->c = z->l - m11;
|
740
702
|
}
|
741
|
-
{ int
|
703
|
+
{ int m12 = z->l - z->c; (void)m12; /* do, line 133 */
|
742
704
|
{ int ret = r_Step_5a(z);
|
743
|
-
if (ret == 0) goto
|
705
|
+
if (ret == 0) goto lab11; /* call Step_5a, line 133 */
|
744
706
|
if (ret < 0) return ret;
|
745
707
|
}
|
746
|
-
|
747
|
-
z->c = z->l -
|
708
|
+
lab11:
|
709
|
+
z->c = z->l - m12;
|
748
710
|
}
|
749
|
-
{ int
|
711
|
+
{ int m13 = z->l - z->c; (void)m13; /* do, line 134 */
|
750
712
|
{ int ret = r_Step_5b(z);
|
751
|
-
if (ret == 0) goto
|
713
|
+
if (ret == 0) goto lab12; /* call Step_5b, line 134 */
|
752
714
|
if (ret < 0) return ret;
|
753
715
|
}
|
754
|
-
|
755
|
-
z->c = z->l -
|
716
|
+
lab12:
|
717
|
+
z->c = z->l - m13;
|
756
718
|
}
|
757
719
|
z->c = z->lb;
|
758
|
-
{ int
|
759
|
-
if (!(z->B[0])) goto
|
720
|
+
{ int c14 = z->c; /* do, line 137 */
|
721
|
+
if (!(z->B[0])) goto lab13; /* Boolean test Y_found, line 137 */
|
760
722
|
while(1) { /* repeat, line 137 */
|
761
|
-
int
|
723
|
+
int c15 = z->c;
|
762
724
|
while(1) { /* goto, line 137 */
|
763
|
-
int
|
725
|
+
int c16 = z->c;
|
764
726
|
z->bra = z->c; /* [, line 137 */
|
765
|
-
if (!(eq_s(z, 1, s_33))) goto
|
727
|
+
if (!(eq_s(z, 1, s_33))) goto lab15;
|
766
728
|
z->ket = z->c; /* ], line 137 */
|
767
|
-
z->c =
|
729
|
+
z->c = c16;
|
768
730
|
break;
|
769
|
-
|
770
|
-
z->c =
|
771
|
-
{ int
|
772
|
-
if (
|
773
|
-
z->c =
|
731
|
+
lab15:
|
732
|
+
z->c = c16;
|
733
|
+
{ int ret = skip_utf8(z->p, z->c, 0, z->l, 1);
|
734
|
+
if (ret < 0) goto lab14;
|
735
|
+
z->c = ret; /* goto, line 137 */
|
774
736
|
}
|
775
737
|
}
|
776
|
-
{ int ret;
|
777
|
-
ret = slice_from_s(z, 1, s_34); /* <-, line 137 */
|
738
|
+
{ int ret = slice_from_s(z, 1, s_34); /* <-, line 137 */
|
778
739
|
if (ret < 0) return ret;
|
779
740
|
}
|
780
741
|
continue;
|
781
|
-
|
782
|
-
z->c =
|
742
|
+
lab14:
|
743
|
+
z->c = c15;
|
783
744
|
break;
|
784
745
|
}
|
785
|
-
|
786
|
-
z->c =
|
746
|
+
lab13:
|
747
|
+
z->c = c14;
|
787
748
|
}
|
788
749
|
return 1;
|
789
750
|
}
|
790
751
|
|
791
752
|
extern struct SN_env * porter_UTF_8_create_env(void) { return SN_create_env(0, 2, 1); }
|
792
753
|
|
793
|
-
extern void porter_UTF_8_close_env(struct SN_env * z) { SN_close_env(z); }
|
754
|
+
extern void porter_UTF_8_close_env(struct SN_env * z) { SN_close_env(z, 0); }
|
794
755
|
|