Initial import into git.
[galago.git] / cpp / galago / contrib / libstemmer_c / libstemmer / modules_utf8.h
blob73b80443a4d6c20d66b7cf0d9a013c2c8c757827
/* libstemmer/modules_utf8.h: List of stemming modules.
 *
 * This file is generated by mkmodules.pl from a list of module names.
 * Do not edit manually.
 *
 * Modules included by this file are: danish, dutch, english, finnish, french,
 * german, hungarian, italian, norwegian, porter, portuguese, russian,
 * spanish, swedish
 */
11 #include "../src_c/stem_UTF_8_danish.h"
12 #include "../src_c/stem_UTF_8_dutch.h"
13 #include "../src_c/stem_UTF_8_english.h"
14 #include "../src_c/stem_UTF_8_finnish.h"
15 #include "../src_c/stem_UTF_8_french.h"
16 #include "../src_c/stem_UTF_8_german.h"
17 #include "../src_c/stem_UTF_8_hungarian.h"
18 #include "../src_c/stem_UTF_8_italian.h"
19 #include "../src_c/stem_UTF_8_norwegian.h"
20 #include "../src_c/stem_UTF_8_porter.h"
21 #include "../src_c/stem_UTF_8_portuguese.h"
22 #include "../src_c/stem_UTF_8_russian.h"
23 #include "../src_c/stem_UTF_8_spanish.h"
24 #include "../src_c/stem_UTF_8_swedish.h"
/* Character encodings a stemming module can be registered under.
 *
 * ENC_UNKNOWN is fixed at 0 and is the value carried by the terminating
 * entries of the encodings[] and modules[] tables in this file.
 */
typedef enum {
  ENC_UNKNOWN = 0,
  ENC_UTF_8
} stemmer_encoding_t;
31 struct stemmer_encoding {
32 const char * name;
33 stemmer_encoding_t enc;
35 static struct stemmer_encoding encodings[] = {
36 {"UTF_8", ENC_UTF_8},
37 {0,ENC_UNKNOWN}
40 struct stemmer_modules {
41 const char * name;
42 stemmer_encoding_t enc;
43 struct SN_env * (*create)(void);
44 void (*close)(struct SN_env *);
45 int (*stem)(struct SN_env *);
47 static struct stemmer_modules modules[] = {
48 {"da", ENC_UTF_8, danish_UTF_8_create_env, danish_UTF_8_close_env, danish_UTF_8_stem},
49 {"dan", ENC_UTF_8, danish_UTF_8_create_env, danish_UTF_8_close_env, danish_UTF_8_stem},
50 {"danish", ENC_UTF_8, danish_UTF_8_create_env, danish_UTF_8_close_env, danish_UTF_8_stem},
51 {"de", ENC_UTF_8, german_UTF_8_create_env, german_UTF_8_close_env, german_UTF_8_stem},
52 {"deu", ENC_UTF_8, german_UTF_8_create_env, german_UTF_8_close_env, german_UTF_8_stem},
53 {"dut", ENC_UTF_8, dutch_UTF_8_create_env, dutch_UTF_8_close_env, dutch_UTF_8_stem},
54 {"dutch", ENC_UTF_8, dutch_UTF_8_create_env, dutch_UTF_8_close_env, dutch_UTF_8_stem},
55 {"en", ENC_UTF_8, english_UTF_8_create_env, english_UTF_8_close_env, english_UTF_8_stem},
56 {"eng", ENC_UTF_8, english_UTF_8_create_env, english_UTF_8_close_env, english_UTF_8_stem},
57 {"english", ENC_UTF_8, english_UTF_8_create_env, english_UTF_8_close_env, english_UTF_8_stem},
58 {"es", ENC_UTF_8, spanish_UTF_8_create_env, spanish_UTF_8_close_env, spanish_UTF_8_stem},
59 {"esl", ENC_UTF_8, spanish_UTF_8_create_env, spanish_UTF_8_close_env, spanish_UTF_8_stem},
60 {"fi", ENC_UTF_8, finnish_UTF_8_create_env, finnish_UTF_8_close_env, finnish_UTF_8_stem},
61 {"fin", ENC_UTF_8, finnish_UTF_8_create_env, finnish_UTF_8_close_env, finnish_UTF_8_stem},
62 {"finnish", ENC_UTF_8, finnish_UTF_8_create_env, finnish_UTF_8_close_env, finnish_UTF_8_stem},
63 {"fr", ENC_UTF_8, french_UTF_8_create_env, french_UTF_8_close_env, french_UTF_8_stem},
64 {"fra", ENC_UTF_8, french_UTF_8_create_env, french_UTF_8_close_env, french_UTF_8_stem},
65 {"fre", ENC_UTF_8, french_UTF_8_create_env, french_UTF_8_close_env, french_UTF_8_stem},
66 {"french", ENC_UTF_8, french_UTF_8_create_env, french_UTF_8_close_env, french_UTF_8_stem},
67 {"ger", ENC_UTF_8, german_UTF_8_create_env, german_UTF_8_close_env, german_UTF_8_stem},
68 {"german", ENC_UTF_8, german_UTF_8_create_env, german_UTF_8_close_env, german_UTF_8_stem},
69 {"hu", ENC_UTF_8, hungarian_UTF_8_create_env, hungarian_UTF_8_close_env, hungarian_UTF_8_stem},
70 {"hun", ENC_UTF_8, hungarian_UTF_8_create_env, hungarian_UTF_8_close_env, hungarian_UTF_8_stem},
71 {"hungarian", ENC_UTF_8, hungarian_UTF_8_create_env, hungarian_UTF_8_close_env, hungarian_UTF_8_stem},
72 {"it", ENC_UTF_8, italian_UTF_8_create_env, italian_UTF_8_close_env, italian_UTF_8_stem},
73 {"ita", ENC_UTF_8, italian_UTF_8_create_env, italian_UTF_8_close_env, italian_UTF_8_stem},
74 {"italian", ENC_UTF_8, italian_UTF_8_create_env, italian_UTF_8_close_env, italian_UTF_8_stem},
75 {"nl", ENC_UTF_8, dutch_UTF_8_create_env, dutch_UTF_8_close_env, dutch_UTF_8_stem},
76 {"nld", ENC_UTF_8, dutch_UTF_8_create_env, dutch_UTF_8_close_env, dutch_UTF_8_stem},
77 {"no", ENC_UTF_8, norwegian_UTF_8_create_env, norwegian_UTF_8_close_env, norwegian_UTF_8_stem},
78 {"nor", ENC_UTF_8, norwegian_UTF_8_create_env, norwegian_UTF_8_close_env, norwegian_UTF_8_stem},
79 {"norwegian", ENC_UTF_8, norwegian_UTF_8_create_env, norwegian_UTF_8_close_env, norwegian_UTF_8_stem},
80 {"por", ENC_UTF_8, portuguese_UTF_8_create_env, portuguese_UTF_8_close_env, portuguese_UTF_8_stem},
81 {"porter", ENC_UTF_8, porter_UTF_8_create_env, porter_UTF_8_close_env, porter_UTF_8_stem},
82 {"portuguese", ENC_UTF_8, portuguese_UTF_8_create_env, portuguese_UTF_8_close_env, portuguese_UTF_8_stem},
83 {"pt", ENC_UTF_8, portuguese_UTF_8_create_env, portuguese_UTF_8_close_env, portuguese_UTF_8_stem},
84 {"ru", ENC_UTF_8, russian_UTF_8_create_env, russian_UTF_8_close_env, russian_UTF_8_stem},
85 {"rus", ENC_UTF_8, russian_UTF_8_create_env, russian_UTF_8_close_env, russian_UTF_8_stem},
86 {"russian", ENC_UTF_8, russian_UTF_8_create_env, russian_UTF_8_close_env, russian_UTF_8_stem},
87 {"spa", ENC_UTF_8, spanish_UTF_8_create_env, spanish_UTF_8_close_env, spanish_UTF_8_stem},
88 {"spanish", ENC_UTF_8, spanish_UTF_8_create_env, spanish_UTF_8_close_env, spanish_UTF_8_stem},
89 {"sv", ENC_UTF_8, swedish_UTF_8_create_env, swedish_UTF_8_close_env, swedish_UTF_8_stem},
90 {"swe", ENC_UTF_8, swedish_UTF_8_create_env, swedish_UTF_8_close_env, swedish_UTF_8_stem},
91 {"swedish", ENC_UTF_8, swedish_UTF_8_create_env, swedish_UTF_8_close_env, swedish_UTF_8_stem},
92 {0,ENC_UNKNOWN,0,0,0}
94 static const char * algorithm_names[] = {
95 "danish",
96 "dutch",
97 "english",
98 "finnish",
99 "french",
100 "german",
101 "hungarian",
102 "italian",
103 "norwegian",
104 "porter",
105 "portuguese",
106 "russian",
107 "spanish",
108 "swedish",