Mercurial > hg > mpdl-group
comparison software/mpdl-services/mpiwg-mpdl-lt/src/de/mpg/mpiwg/berlin/mpdl/lt/text/norm/lang/MpdlNormalizerLexFR.java @ 23:e845310098ba
diverse Korrekturen
author | Josef Willenborg <jwillenborg@mpiwg-berlin.mpg.de> |
---|---|
date | Tue, 27 Nov 2012 12:35:19 +0100 |
parents | 4a3641ae14d2 |
children |
comparison
equal
deleted
inserted
replaced
22:6a45a982c333 | 23:e845310098ba |
---|---|
1 /* The following code was generated by JFlex 1.4.3 on 05.09.11 10:35 */ | 1 /* The following code was generated by JFlex 1.4.3 on 28.03.12 18:57 */ |
2 | 2 |
3 /* | 3 /* |
4 * Normalization rules for French text | 4 * Normalization rules for French text |
5 * [this is a JFlex specification] | 5 * [this is a JFlex specification] |
6 * | 6 * |
7 * Wolfgang Schmidle | 7 * Wolfgang Schmidle |
8 * version 2011-08-10 | 8 * version 2011-07-12 |
9 * | 9 * |
10 */ | 10 */ |
11 | 11 |
12 package de.mpg.mpiwg.berlin.mpdl.lt.text.norm.lang; | 12 package de.mpg.mpiwg.berlin.mpdl.lt.text.norm.lang; |
13 | 13 |
14 | 14 |
15 /** | 15 /** |
16 * This class is a scanner generated by | 16 * This class is a scanner generated by |
17 * <a href="http://www.jflex.de/">JFlex</a> 1.4.3 | 17 * <a href="http://www.jflex.de/">JFlex</a> 1.4.3 |
18 * on 05.09.11 10:35 from the specification file | 18 * on 28.03.12 18:57 from the specification file |
19 * <tt>MpdlNormalizerLexFR.lex</tt> | 19 * <tt>/Users/jwillenborg/test/jflexNew/MpdlNormalizerLexFR.lex</tt> |
20 */ | 20 */ |
21 public class MpdlNormalizerLexFR { | 21 public class MpdlNormalizerLexFR { |
22 | 22 |
23 /** This character denotes the end of file */ | 23 /** This character denotes the end of file */ |
24 public static final int YYEOF = -1; | 24 public static final int YYEOF = -1; |
25 | 25 |
26 /** initial size of the lookahead buffer */ | 26 /** initial size of the lookahead buffer */ |
27 private static final int ZZ_BUFFERSIZE = 16384; | 27 private static final int ZZ_BUFFERSIZE = 16384; |
28 | 28 |
29 /** lexical states */ | 29 /** lexical states */ |
30 public static final int DICT_ASCII = 8; | |
31 public static final int SEARCH = 6; | 30 public static final int SEARCH = 6; |
32 public static final int DICT = 4; | 31 public static final int DICT = 4; |
33 public static final int YYINITIAL = 0; | 32 public static final int YYINITIAL = 0; |
33 public static final int CELEX = 8; | |
34 public static final int DISP = 2; | 34 public static final int DISP = 2; |
35 | 35 |
36 /** | 36 /** |
37 * ZZ_LEXSTATE[l] is the state in the DFA for the lexical state l | 37 * ZZ_LEXSTATE[l] is the state in the DFA for the lexical state l |
38 * ZZ_LEXSTATE[l+1] is the state in the DFA for the lexical state l | 38 * ZZ_LEXSTATE[l+1] is the state in the DFA for the lexical state l |
45 | 45 |
46 /** | 46 /** |
47 * Translates characters to character classes | 47 * Translates characters to character classes |
48 */ | 48 */ |
49 private static final String ZZ_CMAP_PACKED = | 49 private static final String ZZ_CMAP_PACKED = |
50 "\12\0\1\3\25\0\1\2\14\0\1\1\2\0\1\1\17\0\1\20"+ | 50 "\12\0\1\3\25\0\1\2\14\0\1\11\1\0\1\10\1\1\13\0"+ |
51 "\32\4\6\0\1\5\2\4\1\5\20\4\1\5\5\4\1\1\1\0"+ | 51 "\1\6\1\0\1\7\1\0\1\24\32\4\6\0\1\5\2\4\1\5"+ |
52 "\1\1\141\0\1\7\3\12\3\0\1\10\1\0\3\13\1\0\3\14"+ | 52 "\20\4\1\5\5\4\1\1\1\0\1\1\141\0\1\13\3\16\3\0"+ |
53 "\3\0\3\15\4\0\3\16\126\0\2\11\53\0\1\6\u1e99\0\1\17"+ | 53 "\1\14\1\0\3\17\1\0\3\20\3\0\3\21\4\0\3\22\126\0"+ |
54 "\udfe6\0"; | 54 "\2\15\53\0\1\12\u1e99\0\1\23\udfe6\0"; |
55 | 55 |
56 /** | 56 /** |
57 * Translates characters to character classes | 57 * Translates characters to character classes |
58 */ | 58 */ |
59 private static final char [] ZZ_CMAP = zzUnpackCMap(ZZ_CMAP_PACKED); | 59 private static final char [] ZZ_CMAP = zzUnpackCMap(ZZ_CMAP_PACKED); |
62 * Translates DFA states to action switch labels. | 62 * Translates DFA states to action switch labels. |
63 */ | 63 */ |
64 private static final int [] ZZ_ACTION = zzUnpackAction(); | 64 private static final int [] ZZ_ACTION = zzUnpackAction(); |
65 | 65 |
66 private static final String ZZ_ACTION_PACKED_0 = | 66 private static final String ZZ_ACTION_PACKED_0 = |
67 "\5\0\2\1\1\2\1\3\1\4\1\5\1\6\1\7"+ | 67 "\5\0\4\1\1\2\1\3\1\4\1\5\1\6\1\7"+ |
68 "\1\10\1\2\1\11\1\12\1\13\1\14\1\15\1\16"+ | 68 "\1\10\3\2\1\11\1\12\1\13\1\14\1\15\1\16"+ |
69 "\1\17"; | 69 "\1\17\5\0\1\1\2\0"; |
70 | 70 |
71 private static int [] zzUnpackAction() { | 71 private static int [] zzUnpackAction() { |
72 int [] result = new int[22]; | 72 int [] result = new int[34]; |
73 int offset = 0; | 73 int offset = 0; |
74 offset = zzUnpackAction(ZZ_ACTION_PACKED_0, offset, result); | 74 offset = zzUnpackAction(ZZ_ACTION_PACKED_0, offset, result); |
75 return result; | 75 return result; |
76 } | 76 } |
77 | 77 |
92 * Translates a state to a row index in the transition table | 92 * Translates a state to a row index in the transition table |
93 */ | 93 */ |
94 private static final int [] ZZ_ROWMAP = zzUnpackRowMap(); | 94 private static final int [] ZZ_ROWMAP = zzUnpackRowMap(); |
95 | 95 |
96 private static final String ZZ_ROWMAP_PACKED_0 = | 96 private static final String ZZ_ROWMAP_PACKED_0 = |
97 "\0\0\0\21\0\42\0\63\0\104\0\125\0\146\0\125"+ | 97 "\0\0\0\25\0\52\0\77\0\124\0\151\0\176\0\223"+ |
98 "\0\125\0\125\0\125\0\125\0\125\0\125\0\146\0\125"+ | 98 "\0\250\0\151\0\151\0\151\0\151\0\151\0\151\0\151"+ |
99 "\0\125\0\125\0\125\0\125\0\125\0\125"; | 99 "\0\176\0\223\0\250\0\151\0\151\0\151\0\151\0\151"+ |
100 "\0\151\0\151\0\275\0\223\0\322\0\347\0\374\0\322"+ | |
101 "\0\u0111\0\u0126"; | |
100 | 102 |
101 private static int [] zzUnpackRowMap() { | 103 private static int [] zzUnpackRowMap() { |
102 int [] result = new int[22]; | 104 int [] result = new int[34]; |
103 int offset = 0; | 105 int offset = 0; |
104 offset = zzUnpackRowMap(ZZ_ROWMAP_PACKED_0, offset, result); | 106 offset = zzUnpackRowMap(ZZ_ROWMAP_PACKED_0, offset, result); |
105 return result; | 107 return result; |
106 } | 108 } |
107 | 109 |
120 * The transition table of the DFA | 122 * The transition table of the DFA |
121 */ | 123 */ |
122 private static final int [] ZZ_TRANS = zzUnpackTrans(); | 124 private static final int [] ZZ_TRANS = zzUnpackTrans(); |
123 | 125 |
124 private static final String ZZ_TRANS_PACKED_0 = | 126 private static final String ZZ_TRANS_PACKED_0 = |
125 "\1\6\1\7\1\6\1\0\1\6\1\7\12\6\1\10"+ | 127 "\1\6\1\7\1\6\1\0\1\6\1\7\1\10\2\6"+ |
126 "\1\6\1\7\1\6\1\11\1\6\1\7\1\12\1\13"+ | 128 "\1\11\12\6\1\12\1\6\1\7\1\6\1\13\1\6"+ |
127 "\1\14\7\6\1\10\1\6\1\7\1\6\1\15\1\6"+ | 129 "\1\7\1\10\2\6\1\11\1\14\1\15\1\16\7\6"+ |
128 "\1\7\1\12\1\13\1\14\7\6\1\10\1\6\1\7"+ | 130 "\1\12\1\6\1\7\1\6\1\17\1\6\1\7\1\10"+ |
129 "\1\6\1\16\1\6\1\7\1\12\1\13\1\14\7\6"+ | 131 "\2\6\1\11\1\14\1\15\1\16\7\6\1\12\1\6"+ |
130 "\2\10\1\17\1\10\1\15\1\6\1\7\1\12\1\13"+ | 132 "\1\7\1\6\1\20\1\6\1\7\1\10\2\6\1\11"+ |
131 "\1\14\1\20\1\21\1\22\1\23\1\24\1\25\1\26"+ | 133 "\1\14\1\15\1\16\7\6\2\12\1\21\1\12\1\17"+ |
132 "\1\10\23\0\1\6\16\0"; | 134 "\1\6\1\7\1\22\2\12\1\23\1\14\1\15\1\16"+ |
135 "\1\24\1\25\1\26\1\27\1\30\1\31\1\32\1\12"+ | |
136 "\27\0\1\6\22\0\6\33\2\0\15\33\2\0\1\6"+ | |
137 "\3\0\1\34\16\0\6\33\1\0\1\35\1\36\14\33"+ | |
138 "\6\0\1\37\16\0\6\33\1\0\1\40\1\36\14\33"+ | |
139 "\10\0\1\41\14\0\6\42\2\0\23\42\1\0\1\6"+ | |
140 "\15\42"; | |
133 | 141 |
134 private static int [] zzUnpackTrans() { | 142 private static int [] zzUnpackTrans() { |
135 int [] result = new int[119]; | 143 int [] result = new int[315]; |
136 int offset = 0; | 144 int offset = 0; |
137 offset = zzUnpackTrans(ZZ_TRANS_PACKED_0, offset, result); | 145 offset = zzUnpackTrans(ZZ_TRANS_PACKED_0, offset, result); |
138 return result; | 146 return result; |
139 } | 147 } |
140 | 148 |
168 * ZZ_ATTRIBUTE[aState] contains the attributes of state <code>aState</code> | 176 * ZZ_ATTRIBUTE[aState] contains the attributes of state <code>aState</code> |
169 */ | 177 */ |
170 private static final int [] ZZ_ATTRIBUTE = zzUnpackAttribute(); | 178 private static final int [] ZZ_ATTRIBUTE = zzUnpackAttribute(); |
171 | 179 |
172 private static final String ZZ_ATTRIBUTE_PACKED_0 = | 180 private static final String ZZ_ATTRIBUTE_PACKED_0 = |
173 "\5\0\1\11\1\1\7\11\1\1\7\11"; | 181 "\5\0\1\11\3\1\7\11\3\1\7\11\5\0\1\1"+ |
182 "\2\0"; | |
174 | 183 |
175 private static int [] zzUnpackAttribute() { | 184 private static int [] zzUnpackAttribute() { |
176 int [] result = new int[22]; | 185 int [] result = new int[34]; |
177 int offset = 0; | 186 int offset = 0; |
178 offset = zzUnpackAttribute(ZZ_ATTRIBUTE_PACKED_0, offset, result); | 187 offset = zzUnpackAttribute(ZZ_ATTRIBUTE_PACKED_0, offset, result); |
179 return result; | 188 return result; |
180 } | 189 } |
181 | 190 |
281 */ | 290 */ |
282 private static char [] zzUnpackCMap(String packed) { | 291 private static char [] zzUnpackCMap(String packed) { |
283 char [] map = new char[0x10000]; | 292 char [] map = new char[0x10000]; |
284 int i = 0; /* index in packed string */ | 293 int i = 0; /* index in packed string */ |
285 int j = 0; /* index in unpacked array */ | 294 int j = 0; /* index in unpacked array */ |
286 while (i < 82) { | 295 while (i < 92) { |
287 int count = packed.charAt(i++); | 296 int count = packed.charAt(i++); |
288 char value = packed.charAt(i++); | 297 char value = packed.charAt(i++); |
289 do map[j++] = value; while (--count > 0); | 298 do map[j++] = value; while (--count > 0); |
290 } | 299 } |
291 return map; | 300 return map; |