comparison software/mpdl-services/mpiwg-mpdl-lt/src/de/mpg/mpiwg/berlin/mpdl/lt/text/norm/lang/MpdlNormalizerLexEL.lex @ 23:e845310098ba

diverse Korrekturen
author Josef Willenborg <jwillenborg@mpiwg-berlin.mpg.de>
date Tue, 27 Nov 2012 12:35:19 +0100
parents 4a3641ae14d2
children
comparison
equal deleted inserted replaced
22:6a45a982c333 23:e845310098ba
5 * Wolfgang Schmidle 5 * Wolfgang Schmidle
6 * version 2011-08-03 6 * version 2011-08-03
7 * 7 *
8 */ 8 */
9 9
10 package de.mpg.mpiwg.berlin.mpdl.lt.analyzer.lang; 10 package de.mpg.mpiwg.berlin.mpdl.lt.text.norm.lang;
11 11
12 %% 12 %%
13 13
14 %public 14 %public
15 %class MpdlNormalizerLexEL 15 %class MpdlNormalizerLexEL
44 44
45 Latin = [abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ] 45 Latin = [abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ]
46 46
47 47
48 %% 48 %%
49
50 // jump over empty xml elements
51 "<"[^><]+"/>" { add(yytext()); }
52 "-<"[^><]+"/>" { add(yytext()); }
53 "<"[^><]+"></"[^><]+">" { add(yytext()); }
54 "-<"[^><]+"></"[^><]+">" { add(yytext()); }
49 55
50 56
51 // always replace tonos by oxia 57 // always replace tonos by oxia
52 // (although this should really be corrected in the text rather than normalized) 58 // (although this should really be corrected in the text rather than normalized)
53 ά { add("ά"); } 59 ά { add("ά"); }