Line data Source code
1 : /* Generated from danish.sbl by Snowball 3.0.0 - https://snowballstem.org/ */
2 :
3 : #include "stem_UTF_8_danish.h"
4 :
5 : #include <stddef.h>
6 :
7 : #include "snowball_runtime.h"
8 :
9 : struct SN_local {
10 : struct SN_env z;
11 : int i_p1;
12 : symbol * s_ch;
13 : };
14 :
15 : typedef struct SN_local SN_local;
16 :
/* Entry point; given C linkage when this file is compiled as C++. */
#ifdef __cplusplus
extern "C" {
#endif

extern int danish_UTF_8_stem(struct SN_env * z);

#ifdef __cplusplus
}
#endif

/* File-local routines, listed in the order danish_UTF_8_stem() runs them. */
static int r_mark_regions(struct SN_env * z);
static int r_main_suffix(struct SN_env * z);
static int r_consonant_pair(struct SN_env * z);
static int r_other_suffix(struct SN_env * z);
static int r_undouble(struct SN_env * z);
30 :
31 : static const symbol s_0[] = { 's', 't' };
32 : static const symbol s_1[] = { 'i', 'g' };
33 : static const symbol s_2[] = { 'l', 0xC3, 0xB8, 's' };
34 :
35 : static const symbol s_0_0[3] = { 'h', 'e', 'd' };
36 : static const symbol s_0_1[5] = { 'e', 't', 'h', 'e', 'd' };
37 : static const symbol s_0_2[4] = { 'e', 'r', 'e', 'd' };
38 : static const symbol s_0_3[1] = { 'e' };
39 : static const symbol s_0_4[5] = { 'e', 'r', 'e', 'd', 'e' };
40 : static const symbol s_0_5[4] = { 'e', 'n', 'd', 'e' };
41 : static const symbol s_0_6[6] = { 'e', 'r', 'e', 'n', 'd', 'e' };
42 : static const symbol s_0_7[3] = { 'e', 'n', 'e' };
43 : static const symbol s_0_8[4] = { 'e', 'r', 'n', 'e' };
44 : static const symbol s_0_9[3] = { 'e', 'r', 'e' };
45 : static const symbol s_0_10[2] = { 'e', 'n' };
46 : static const symbol s_0_11[5] = { 'h', 'e', 'd', 'e', 'n' };
47 : static const symbol s_0_12[4] = { 'e', 'r', 'e', 'n' };
48 : static const symbol s_0_13[2] = { 'e', 'r' };
49 : static const symbol s_0_14[5] = { 'h', 'e', 'd', 'e', 'r' };
50 : static const symbol s_0_15[4] = { 'e', 'r', 'e', 'r' };
51 : static const symbol s_0_16[1] = { 's' };
52 : static const symbol s_0_17[4] = { 'h', 'e', 'd', 's' };
53 : static const symbol s_0_18[2] = { 'e', 's' };
54 : static const symbol s_0_19[5] = { 'e', 'n', 'd', 'e', 's' };
55 : static const symbol s_0_20[7] = { 'e', 'r', 'e', 'n', 'd', 'e', 's' };
56 : static const symbol s_0_21[4] = { 'e', 'n', 'e', 's' };
57 : static const symbol s_0_22[5] = { 'e', 'r', 'n', 'e', 's' };
58 : static const symbol s_0_23[4] = { 'e', 'r', 'e', 's' };
59 : static const symbol s_0_24[3] = { 'e', 'n', 's' };
60 : static const symbol s_0_25[6] = { 'h', 'e', 'd', 'e', 'n', 's' };
61 : static const symbol s_0_26[5] = { 'e', 'r', 'e', 'n', 's' };
62 : static const symbol s_0_27[3] = { 'e', 'r', 's' };
63 : static const symbol s_0_28[3] = { 'e', 't', 's' };
64 : static const symbol s_0_29[5] = { 'e', 'r', 'e', 't', 's' };
65 : static const symbol s_0_30[2] = { 'e', 't' };
66 : static const symbol s_0_31[4] = { 'e', 'r', 'e', 't' };
67 : static const struct among a_0[32] = {
68 : { 3, s_0_0, 0, 1, 0},
69 : { 5, s_0_1, -1, 1, 0},
70 : { 4, s_0_2, 0, 1, 0},
71 : { 1, s_0_3, 0, 1, 0},
72 : { 5, s_0_4, -1, 1, 0},
73 : { 4, s_0_5, -2, 1, 0},
74 : { 6, s_0_6, -1, 1, 0},
75 : { 3, s_0_7, -4, 1, 0},
76 : { 4, s_0_8, -5, 1, 0},
77 : { 3, s_0_9, -6, 1, 0},
78 : { 2, s_0_10, 0, 1, 0},
79 : { 5, s_0_11, -1, 1, 0},
80 : { 4, s_0_12, -2, 1, 0},
81 : { 2, s_0_13, 0, 1, 0},
82 : { 5, s_0_14, -1, 1, 0},
83 : { 4, s_0_15, -2, 1, 0},
84 : { 1, s_0_16, 0, 2, 0},
85 : { 4, s_0_17, -1, 1, 0},
86 : { 2, s_0_18, -2, 1, 0},
87 : { 5, s_0_19, -1, 1, 0},
88 : { 7, s_0_20, -1, 1, 0},
89 : { 4, s_0_21, -3, 1, 0},
90 : { 5, s_0_22, -4, 1, 0},
91 : { 4, s_0_23, -5, 1, 0},
92 : { 3, s_0_24, -8, 1, 0},
93 : { 6, s_0_25, -1, 1, 0},
94 : { 5, s_0_26, -2, 1, 0},
95 : { 3, s_0_27, -11, 1, 0},
96 : { 3, s_0_28, -12, 1, 0},
97 : { 5, s_0_29, -1, 1, 0},
98 : { 2, s_0_30, 0, 1, 0},
99 : { 4, s_0_31, -1, 1, 0}
100 : };
101 :
102 : static const symbol s_1_0[2] = { 'g', 'd' };
103 : static const symbol s_1_1[2] = { 'd', 't' };
104 : static const symbol s_1_2[2] = { 'g', 't' };
105 : static const symbol s_1_3[2] = { 'k', 't' };
106 : static const struct among a_1[4] = {
107 : { 2, s_1_0, 0, -1, 0},
108 : { 2, s_1_1, 0, -1, 0},
109 : { 2, s_1_2, 0, -1, 0},
110 : { 2, s_1_3, 0, -1, 0}
111 : };
112 :
113 : static const symbol s_2_0[2] = { 'i', 'g' };
114 : static const symbol s_2_1[3] = { 'l', 'i', 'g' };
115 : static const symbol s_2_2[4] = { 'e', 'l', 'i', 'g' };
116 : static const symbol s_2_3[3] = { 'e', 'l', 's' };
117 : static const symbol s_2_4[5] = { 'l', 0xC3, 0xB8, 's', 't' };
118 : static const struct among a_2[5] = {
119 : { 2, s_2_0, 0, 1, 0},
120 : { 3, s_2_1, -1, 1, 0},
121 : { 4, s_2_2, -1, 1, 0},
122 : { 3, s_2_3, 0, 1, 0},
123 : { 5, s_2_4, 0, 2, 0}
124 : };
125 :
/*
 * Character-set bitmaps handed to the *_grouping_* runtime helpers together
 * with a [min, max] code point range.
 * NOTE(review): the member lists below assume bit i of the bitmap stands for
 * code point (min + i) -- confirm against the runtime implementation.
 */

/* Used with range 98..122; presumably b c d f g h j k l m n p q r s t v w x z. */
static const unsigned char g_c[] = { 119, 223, 119, 1 };

/* Used with range 97..248; presumably a e i o u y plus U+00E5, U+00E6, U+00F8. */
static const unsigned char g_v[] = {
    17, 65, 16, 1,
    0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
    48, 0, 128
};

/* Used with range 97..229; presumably a b c d f g h j k l m n o p r t v y z
 * plus U+00E5. */
static const unsigned char g_s_ending[] = {
    239, 254, 42, 3,
    0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
    16
};
131 :
132 0 : static int r_mark_regions(struct SN_env * z) {
133 : int i_x;
134 0 : ((SN_local *)z)->i_p1 = z->l;
135 : {
136 0 : int v_1 = z->c;
137 : {
138 0 : int ret = skip_utf8(z->p, z->c, z->l, 3);
139 0 : if (ret < 0) return 0;
140 0 : z->c = ret;
141 : }
142 0 : i_x = z->c;
143 0 : z->c = v_1;
144 : }
145 : {
146 0 : int ret = out_grouping_U(z, g_v, 97, 248, 1);
147 0 : if (ret < 0) return 0;
148 0 : z->c += ret;
149 : }
150 : {
151 0 : int ret = in_grouping_U(z, g_v, 97, 248, 1);
152 0 : if (ret < 0) return 0;
153 0 : z->c += ret;
154 : }
155 0 : ((SN_local *)z)->i_p1 = z->c;
156 0 : if (((SN_local *)z)->i_p1 >= i_x) goto lab0;
157 0 : ((SN_local *)z)->i_p1 = i_x;
158 0 : lab0:
159 0 : return 1;
160 : }
161 :
162 0 : static int r_main_suffix(struct SN_env * z) {
163 : int among_var;
164 : {
165 : int v_1;
166 0 : if (z->c < ((SN_local *)z)->i_p1) return 0;
167 0 : v_1 = z->lb; z->lb = ((SN_local *)z)->i_p1;
168 0 : z->ket = z->c;
169 0 : if (z->c <= z->lb || z->p[z->c - 1] >> 5 != 3 || !((1851440 >> (z->p[z->c - 1] & 0x1f)) & 1)) { z->lb = v_1; return 0; }
170 0 : among_var = find_among_b(z, a_0, 32, 0);
171 0 : if (!among_var) { z->lb = v_1; return 0; }
172 0 : z->bra = z->c;
173 0 : z->lb = v_1;
174 : }
175 0 : switch (among_var) {
176 0 : case 1:
177 : {
178 0 : int ret = slice_del(z);
179 0 : if (ret < 0) return ret;
180 : }
181 0 : break;
182 0 : case 2:
183 0 : if (in_grouping_b_U(z, g_s_ending, 97, 229, 0)) return 0;
184 : {
185 0 : int ret = slice_del(z);
186 0 : if (ret < 0) return ret;
187 : }
188 0 : break;
189 : }
190 0 : return 1;
191 : }
192 :
193 0 : static int r_consonant_pair(struct SN_env * z) {
194 : {
195 0 : int v_1 = z->l - z->c;
196 : {
197 : int v_2;
198 0 : if (z->c < ((SN_local *)z)->i_p1) return 0;
199 0 : v_2 = z->lb; z->lb = ((SN_local *)z)->i_p1;
200 0 : z->ket = z->c;
201 0 : if (z->c - 1 <= z->lb || (z->p[z->c - 1] != 100 && z->p[z->c - 1] != 116)) { z->lb = v_2; return 0; }
202 0 : if (!find_among_b(z, a_1, 4, 0)) { z->lb = v_2; return 0; }
203 0 : z->bra = z->c;
204 0 : z->lb = v_2;
205 : }
206 0 : z->c = z->l - v_1;
207 : }
208 : {
209 0 : int ret = skip_b_utf8(z->p, z->c, z->lb, 1);
210 0 : if (ret < 0) return 0;
211 0 : z->c = ret;
212 : }
213 0 : z->bra = z->c;
214 : {
215 0 : int ret = slice_del(z);
216 0 : if (ret < 0) return ret;
217 : }
218 0 : return 1;
219 : }
220 :
221 0 : static int r_other_suffix(struct SN_env * z) {
222 : int among_var;
223 : {
224 0 : int v_1 = z->l - z->c;
225 0 : z->ket = z->c;
226 0 : if (!(eq_s_b(z, 2, s_0))) goto lab0;
227 0 : z->bra = z->c;
228 0 : if (!(eq_s_b(z, 2, s_1))) goto lab0;
229 : {
230 0 : int ret = slice_del(z);
231 0 : if (ret < 0) return ret;
232 : }
233 0 : lab0:
234 0 : z->c = z->l - v_1;
235 : }
236 : {
237 : int v_2;
238 0 : if (z->c < ((SN_local *)z)->i_p1) return 0;
239 0 : v_2 = z->lb; z->lb = ((SN_local *)z)->i_p1;
240 0 : z->ket = z->c;
241 0 : if (z->c - 1 <= z->lb || z->p[z->c - 1] >> 5 != 3 || !((1572992 >> (z->p[z->c - 1] & 0x1f)) & 1)) { z->lb = v_2; return 0; }
242 0 : among_var = find_among_b(z, a_2, 5, 0);
243 0 : if (!among_var) { z->lb = v_2; return 0; }
244 0 : z->bra = z->c;
245 0 : z->lb = v_2;
246 : }
247 0 : switch (among_var) {
248 0 : case 1:
249 : {
250 0 : int ret = slice_del(z);
251 0 : if (ret < 0) return ret;
252 : }
253 : {
254 0 : int v_3 = z->l - z->c;
255 : {
256 0 : int ret = r_consonant_pair(z);
257 0 : if (ret < 0) return ret;
258 : }
259 0 : z->c = z->l - v_3;
260 : }
261 0 : break;
262 0 : case 2:
263 : {
264 0 : int ret = slice_from_s(z, 4, s_2);
265 0 : if (ret < 0) return ret;
266 : }
267 0 : break;
268 : }
269 0 : return 1;
270 : }
271 :
272 0 : static int r_undouble(struct SN_env * z) {
273 : {
274 : int v_1;
275 0 : if (z->c < ((SN_local *)z)->i_p1) return 0;
276 0 : v_1 = z->lb; z->lb = ((SN_local *)z)->i_p1;
277 0 : z->ket = z->c;
278 0 : if (in_grouping_b_U(z, g_c, 98, 122, 0)) { z->lb = v_1; return 0; }
279 0 : z->bra = z->c;
280 : {
281 0 : int ret = slice_to(z, &((SN_local *)z)->s_ch);
282 0 : if (ret < 0) return ret;
283 : }
284 0 : z->lb = v_1;
285 : }
286 0 : if (!(eq_v_b(z, ((SN_local *)z)->s_ch))) return 0;
287 : {
288 0 : int ret = slice_del(z);
289 0 : if (ret < 0) return ret;
290 : }
291 0 : return 1;
292 : }
293 :
294 0 : extern int danish_UTF_8_stem(struct SN_env * z) {
295 : {
296 0 : int v_1 = z->c;
297 : {
298 0 : int ret = r_mark_regions(z);
299 0 : if (ret < 0) return ret;
300 : }
301 0 : z->c = v_1;
302 : }
303 0 : z->lb = z->c; z->c = z->l;
304 : {
305 0 : int v_2 = z->l - z->c;
306 : {
307 0 : int ret = r_main_suffix(z);
308 0 : if (ret < 0) return ret;
309 : }
310 0 : z->c = z->l - v_2;
311 : }
312 : {
313 0 : int v_3 = z->l - z->c;
314 : {
315 0 : int ret = r_consonant_pair(z);
316 0 : if (ret < 0) return ret;
317 : }
318 0 : z->c = z->l - v_3;
319 : }
320 : {
321 0 : int v_4 = z->l - z->c;
322 : {
323 0 : int ret = r_other_suffix(z);
324 0 : if (ret < 0) return ret;
325 : }
326 0 : z->c = z->l - v_4;
327 : }
328 : {
329 0 : int v_5 = z->l - z->c;
330 : {
331 0 : int ret = r_undouble(z);
332 0 : if (ret < 0) return ret;
333 : }
334 0 : z->c = z->l - v_5;
335 : }
336 0 : z->c = z->lb;
337 0 : return 1;
338 : }
339 :
340 0 : extern struct SN_env * danish_UTF_8_create_env(void) {
341 0 : struct SN_env * z = SN_new_env(sizeof(SN_local));
342 0 : if (z) {
343 0 : ((SN_local *)z)->i_p1 = 0;
344 0 : ((SN_local *)z)->s_ch = NULL;
345 :
346 0 : if ((((SN_local *)z)->s_ch = create_s()) == NULL) {
347 0 : danish_UTF_8_close_env(z);
348 0 : return NULL;
349 : }
350 : }
351 0 : return z;
352 : }
353 :
354 0 : extern void danish_UTF_8_close_env(struct SN_env * z) {
355 0 : if (z) {
356 0 : lose_s(((SN_local *)z)->s_ch);
357 : }
358 0 : SN_delete_env(z);
359 0 : }
360 :
|