Line data Source code
1 : /* Generated by Snowball 2.2.0 - https://snowballstem.org/ */
2 :
3 : #include "header.h"
4 :
/* Public entry points of the Danish UTF-8 stemmer. They are given C linkage
 * when this translation unit is compiled as C++. */
#ifdef __cplusplus
extern "C" {
#endif

extern int danish_UTF_8_stem(struct SN_env * z);
extern struct SN_env * danish_UTF_8_create_env(void);
extern void danish_UTF_8_close_env(struct SN_env * z);

#ifdef __cplusplus
}
#endif

/* File-local routines, declared up front so they can be referenced
 * regardless of definition order. */
static int r_mark_regions(struct SN_env * z);
static int r_main_suffix(struct SN_env * z);
static int r_consonant_pair(struct SN_env * z);
static int r_other_suffix(struct SN_env * z);
static int r_undouble(struct SN_env * z);
29 : static const symbol s_0_0[3] = { 'h', 'e', 'd' };
30 : static const symbol s_0_1[5] = { 'e', 't', 'h', 'e', 'd' };
31 : static const symbol s_0_2[4] = { 'e', 'r', 'e', 'd' };
32 : static const symbol s_0_3[1] = { 'e' };
33 : static const symbol s_0_4[5] = { 'e', 'r', 'e', 'd', 'e' };
34 : static const symbol s_0_5[4] = { 'e', 'n', 'd', 'e' };
35 : static const symbol s_0_6[6] = { 'e', 'r', 'e', 'n', 'd', 'e' };
36 : static const symbol s_0_7[3] = { 'e', 'n', 'e' };
37 : static const symbol s_0_8[4] = { 'e', 'r', 'n', 'e' };
38 : static const symbol s_0_9[3] = { 'e', 'r', 'e' };
39 : static const symbol s_0_10[2] = { 'e', 'n' };
40 : static const symbol s_0_11[5] = { 'h', 'e', 'd', 'e', 'n' };
41 : static const symbol s_0_12[4] = { 'e', 'r', 'e', 'n' };
42 : static const symbol s_0_13[2] = { 'e', 'r' };
43 : static const symbol s_0_14[5] = { 'h', 'e', 'd', 'e', 'r' };
44 : static const symbol s_0_15[4] = { 'e', 'r', 'e', 'r' };
45 : static const symbol s_0_16[1] = { 's' };
46 : static const symbol s_0_17[4] = { 'h', 'e', 'd', 's' };
47 : static const symbol s_0_18[2] = { 'e', 's' };
48 : static const symbol s_0_19[5] = { 'e', 'n', 'd', 'e', 's' };
49 : static const symbol s_0_20[7] = { 'e', 'r', 'e', 'n', 'd', 'e', 's' };
50 : static const symbol s_0_21[4] = { 'e', 'n', 'e', 's' };
51 : static const symbol s_0_22[5] = { 'e', 'r', 'n', 'e', 's' };
52 : static const symbol s_0_23[4] = { 'e', 'r', 'e', 's' };
53 : static const symbol s_0_24[3] = { 'e', 'n', 's' };
54 : static const symbol s_0_25[6] = { 'h', 'e', 'd', 'e', 'n', 's' };
55 : static const symbol s_0_26[5] = { 'e', 'r', 'e', 'n', 's' };
56 : static const symbol s_0_27[3] = { 'e', 'r', 's' };
57 : static const symbol s_0_28[3] = { 'e', 't', 's' };
58 : static const symbol s_0_29[5] = { 'e', 'r', 'e', 't', 's' };
59 : static const symbol s_0_30[2] = { 'e', 't' };
60 : static const symbol s_0_31[4] = { 'e', 'r', 'e', 't' };
61 :
62 : static const struct among a_0[32] =
63 : {
64 : { 3, s_0_0, -1, 1, 0},
65 : { 5, s_0_1, 0, 1, 0},
66 : { 4, s_0_2, -1, 1, 0},
67 : { 1, s_0_3, -1, 1, 0},
68 : { 5, s_0_4, 3, 1, 0},
69 : { 4, s_0_5, 3, 1, 0},
70 : { 6, s_0_6, 5, 1, 0},
71 : { 3, s_0_7, 3, 1, 0},
72 : { 4, s_0_8, 3, 1, 0},
73 : { 3, s_0_9, 3, 1, 0},
74 : { 2, s_0_10, -1, 1, 0},
75 : { 5, s_0_11, 10, 1, 0},
76 : { 4, s_0_12, 10, 1, 0},
77 : { 2, s_0_13, -1, 1, 0},
78 : { 5, s_0_14, 13, 1, 0},
79 : { 4, s_0_15, 13, 1, 0},
80 : { 1, s_0_16, -1, 2, 0},
81 : { 4, s_0_17, 16, 1, 0},
82 : { 2, s_0_18, 16, 1, 0},
83 : { 5, s_0_19, 18, 1, 0},
84 : { 7, s_0_20, 19, 1, 0},
85 : { 4, s_0_21, 18, 1, 0},
86 : { 5, s_0_22, 18, 1, 0},
87 : { 4, s_0_23, 18, 1, 0},
88 : { 3, s_0_24, 16, 1, 0},
89 : { 6, s_0_25, 24, 1, 0},
90 : { 5, s_0_26, 24, 1, 0},
91 : { 3, s_0_27, 16, 1, 0},
92 : { 3, s_0_28, 16, 1, 0},
93 : { 5, s_0_29, 28, 1, 0},
94 : { 2, s_0_30, -1, 1, 0},
95 : { 4, s_0_31, 30, 1, 0}
96 : };
97 :
98 : static const symbol s_1_0[2] = { 'g', 'd' };
99 : static const symbol s_1_1[2] = { 'd', 't' };
100 : static const symbol s_1_2[2] = { 'g', 't' };
101 : static const symbol s_1_3[2] = { 'k', 't' };
102 :
103 : static const struct among a_1[4] =
104 : {
105 : { 2, s_1_0, -1, -1, 0},
106 : { 2, s_1_1, -1, -1, 0},
107 : { 2, s_1_2, -1, -1, 0},
108 : { 2, s_1_3, -1, -1, 0}
109 : };
110 :
111 : static const symbol s_2_0[2] = { 'i', 'g' };
112 : static const symbol s_2_1[3] = { 'l', 'i', 'g' };
113 : static const symbol s_2_2[4] = { 'e', 'l', 'i', 'g' };
114 : static const symbol s_2_3[3] = { 'e', 'l', 's' };
115 : static const symbol s_2_4[5] = { 'l', 0xC3, 0xB8, 's', 't' };
116 :
117 : static const struct among a_2[5] =
118 : {
119 : { 2, s_2_0, -1, 1, 0},
120 : { 3, s_2_1, 0, 1, 0},
121 : { 4, s_2_2, 1, 1, 0},
122 : { 3, s_2_3, -1, 1, 0},
123 : { 5, s_2_4, -1, 2, 0}
124 : };
125 :
/*
 * Character-class bitmaps passed to the in_/out_grouping helpers together
 * with the code-point range each one is used with in this file.
 *
 * NOTE(review): the letter lists below assume the usual layout where bit k
 * (least significant bit first, 8 bits per byte) stands for code point
 * (range minimum + k) -- confirm against the grouping helpers.
 */

/* Used with range 98..122: b c d f g h j k l m n p q r s t v w x z. */
static const unsigned char g_c[] = {
    119, 223, 119, 1
};

/* Used with range 97..248: a e i o u y, U+00E5, U+00E6, U+00F8. */
static const unsigned char g_v[] = {
    17, 65, 16, 1,
    0, 0, 0, 0,
    0, 0, 0, 0,
    0, 0, 0, 0,
    48, 0, 128
};

/* Used with range 97..229:
 * a b c d f g h j k l m n o p r t v y z, U+00E5. */
static const unsigned char g_s_ending[] = {
    239, 254, 42, 3,
    0, 0, 0, 0,
    0, 0, 0, 0,
    0, 0, 0, 0,
    16
};
131 :
132 : static const symbol s_0[] = { 's', 't' };
133 : static const symbol s_1[] = { 'i', 'g' };
134 : static const symbol s_2[] = { 'l', 0xC3, 0xB8, 's' };
135 :
136 0 : static int r_mark_regions(struct SN_env * z) {
137 0 : z->I[1] = z->l;
138 0 : { int c_test1 = z->c;
139 0 : { int ret = skip_utf8(z->p, z->c, z->l, 3);
140 0 : if (ret < 0) return 0;
141 0 : z->c = ret;
142 : }
143 0 : z->I[0] = z->c;
144 0 : z->c = c_test1;
145 : }
146 0 : if (out_grouping_U(z, g_v, 97, 248, 1) < 0) return 0;
147 : {
148 0 : int ret = in_grouping_U(z, g_v, 97, 248, 1);
149 0 : if (ret < 0) return 0;
150 0 : z->c += ret;
151 : }
152 0 : z->I[1] = z->c;
153 :
154 0 : if (!(z->I[1] < z->I[0])) goto lab0;
155 0 : z->I[1] = z->I[0];
156 0 : lab0:
157 0 : return 1;
158 : }
159 :
160 0 : static int r_main_suffix(struct SN_env * z) {
161 : int among_var;
162 :
163 : { int mlimit1;
164 0 : if (z->c < z->I[1]) return 0;
165 0 : mlimit1 = z->lb; z->lb = z->I[1];
166 0 : z->ket = z->c;
167 0 : if (z->c <= z->lb || z->p[z->c - 1] >> 5 != 3 || !((1851440 >> (z->p[z->c - 1] & 0x1f)) & 1)) { z->lb = mlimit1; return 0; }
168 0 : among_var = find_among_b(z, a_0, 32);
169 0 : if (!(among_var)) { z->lb = mlimit1; return 0; }
170 0 : z->bra = z->c;
171 0 : z->lb = mlimit1;
172 : }
173 0 : switch (among_var) {
174 0 : case 1:
175 0 : { int ret = slice_del(z);
176 0 : if (ret < 0) return ret;
177 : }
178 0 : break;
179 0 : case 2:
180 0 : if (in_grouping_b_U(z, g_s_ending, 97, 229, 0)) return 0;
181 0 : { int ret = slice_del(z);
182 0 : if (ret < 0) return ret;
183 : }
184 0 : break;
185 : }
186 0 : return 1;
187 : }
188 :
189 0 : static int r_consonant_pair(struct SN_env * z) {
190 0 : { int m_test1 = z->l - z->c;
191 :
192 : { int mlimit2;
193 0 : if (z->c < z->I[1]) return 0;
194 0 : mlimit2 = z->lb; z->lb = z->I[1];
195 0 : z->ket = z->c;
196 0 : if (z->c - 1 <= z->lb || (z->p[z->c - 1] != 100 && z->p[z->c - 1] != 116)) { z->lb = mlimit2; return 0; }
197 0 : if (!(find_among_b(z, a_1, 4))) { z->lb = mlimit2; return 0; }
198 0 : z->bra = z->c;
199 0 : z->lb = mlimit2;
200 : }
201 0 : z->c = z->l - m_test1;
202 : }
203 0 : { int ret = skip_b_utf8(z->p, z->c, z->lb, 1);
204 0 : if (ret < 0) return 0;
205 0 : z->c = ret;
206 : }
207 0 : z->bra = z->c;
208 0 : { int ret = slice_del(z);
209 0 : if (ret < 0) return ret;
210 : }
211 0 : return 1;
212 : }
213 :
214 0 : static int r_other_suffix(struct SN_env * z) {
215 : int among_var;
216 0 : { int m1 = z->l - z->c; (void)m1;
217 0 : z->ket = z->c;
218 0 : if (!(eq_s_b(z, 2, s_0))) goto lab0;
219 0 : z->bra = z->c;
220 0 : if (!(eq_s_b(z, 2, s_1))) goto lab0;
221 0 : { int ret = slice_del(z);
222 0 : if (ret < 0) return ret;
223 : }
224 0 : lab0:
225 0 : z->c = z->l - m1;
226 : }
227 :
228 : { int mlimit2;
229 0 : if (z->c < z->I[1]) return 0;
230 0 : mlimit2 = z->lb; z->lb = z->I[1];
231 0 : z->ket = z->c;
232 0 : if (z->c - 1 <= z->lb || z->p[z->c - 1] >> 5 != 3 || !((1572992 >> (z->p[z->c - 1] & 0x1f)) & 1)) { z->lb = mlimit2; return 0; }
233 0 : among_var = find_among_b(z, a_2, 5);
234 0 : if (!(among_var)) { z->lb = mlimit2; return 0; }
235 0 : z->bra = z->c;
236 0 : z->lb = mlimit2;
237 : }
238 0 : switch (among_var) {
239 0 : case 1:
240 0 : { int ret = slice_del(z);
241 0 : if (ret < 0) return ret;
242 : }
243 0 : { int m3 = z->l - z->c; (void)m3;
244 0 : { int ret = r_consonant_pair(z);
245 0 : if (ret < 0) return ret;
246 : }
247 0 : z->c = z->l - m3;
248 : }
249 0 : break;
250 0 : case 2:
251 0 : { int ret = slice_from_s(z, 4, s_2);
252 0 : if (ret < 0) return ret;
253 : }
254 0 : break;
255 : }
256 0 : return 1;
257 : }
258 :
259 0 : static int r_undouble(struct SN_env * z) {
260 :
261 : { int mlimit1;
262 0 : if (z->c < z->I[1]) return 0;
263 0 : mlimit1 = z->lb; z->lb = z->I[1];
264 0 : z->ket = z->c;
265 0 : if (in_grouping_b_U(z, g_c, 98, 122, 0)) { z->lb = mlimit1; return 0; }
266 0 : z->bra = z->c;
267 0 : z->S[0] = slice_to(z, z->S[0]);
268 0 : if (z->S[0] == 0) return -1;
269 0 : z->lb = mlimit1;
270 : }
271 0 : if (!(eq_v_b(z, z->S[0]))) return 0;
272 0 : { int ret = slice_del(z);
273 0 : if (ret < 0) return ret;
274 : }
275 0 : return 1;
276 : }
277 :
278 0 : extern int danish_UTF_8_stem(struct SN_env * z) {
279 0 : { int c1 = z->c;
280 0 : { int ret = r_mark_regions(z);
281 0 : if (ret < 0) return ret;
282 : }
283 0 : z->c = c1;
284 : }
285 0 : z->lb = z->c; z->c = z->l;
286 :
287 0 : { int m2 = z->l - z->c; (void)m2;
288 0 : { int ret = r_main_suffix(z);
289 0 : if (ret < 0) return ret;
290 : }
291 0 : z->c = z->l - m2;
292 : }
293 0 : { int m3 = z->l - z->c; (void)m3;
294 0 : { int ret = r_consonant_pair(z);
295 0 : if (ret < 0) return ret;
296 : }
297 0 : z->c = z->l - m3;
298 : }
299 0 : { int m4 = z->l - z->c; (void)m4;
300 0 : { int ret = r_other_suffix(z);
301 0 : if (ret < 0) return ret;
302 : }
303 0 : z->c = z->l - m4;
304 : }
305 0 : { int m5 = z->l - z->c; (void)m5;
306 0 : { int ret = r_undouble(z);
307 0 : if (ret < 0) return ret;
308 : }
309 0 : z->c = z->l - m5;
310 : }
311 0 : z->c = z->lb;
312 0 : return 1;
313 : }
314 :
/*
 * Create a stemmer environment for this algorithm by calling
 * SN_create_env(1, 2) and hand its result back unchanged.
 *
 * This file uses one string slot (z->S[0]) and two integer slots
 * (z->I[0], z->I[1]). NOTE(review): the arguments 1 and 2 presumably size
 * those arrays -- confirm against SN_create_env().
 */
extern struct SN_env * danish_UTF_8_create_env(void) {
    struct SN_env * env = SN_create_env(1, 2);
    return env;
}
316 :
/*
 * Release an environment obtained from danish_UTF_8_create_env() by
 * forwarding it to SN_close_env() with the same first argument (1) that
 * was given to SN_create_env().
 */
extern void danish_UTF_8_close_env(struct SN_env * z) {
    SN_close_env(z, 1);
}
318 :
|