Mercurial > hg > mpdl-group
comparison software/mpdl-services/mpiwg-mpdl-lt/src/de/mpg/mpiwg/berlin/mpdl/lt/text/norm/Normalizer.java @ 20:7d6d969b10cf
little corrections
author | Josef Willenborg <jwillenborg@mpiwg-berlin.mpg.de> |
---|---|
date | Wed, 14 Dec 2011 12:48:43 +0100 |
parents | 4a3641ae14d2 |
children | e845310098ba |
comparison
equal
deleted
inserted
replaced
19:4a3641ae14d2 | 20:7d6d969b10cf |
---|---|
17 import de.mpg.mpiwg.berlin.mpdl.lt.text.norm.lang.MpdlNormalizerLexZH; | 17 import de.mpg.mpiwg.berlin.mpdl.lt.text.norm.lang.MpdlNormalizerLexZH; |
18 import de.mpg.mpiwg.berlin.mpdl.lt.text.reg.Regularization; | 18 import de.mpg.mpiwg.berlin.mpdl.lt.text.reg.Regularization; |
19 import de.mpg.mpiwg.berlin.mpdl.lt.text.reg.RegularizationManager; | 19 import de.mpg.mpiwg.berlin.mpdl.lt.text.reg.RegularizationManager; |
20 | 20 |
21 public class Normalizer { | 21 public class Normalizer { |
22 public static int NONE = -1; // no normalization | |
22 public static int DISPLAY = 1; // normalization in DISPLAY mode | 23 public static int DISPLAY = 1; // normalization in DISPLAY mode |
23 public static int DICTIONARY = 2; // normalization in DICTIONARY mode | 24 public static int DICTIONARY = 2; // normalization in DICTIONARY mode |
24 public static int SEARCH = 3; // normalization in SEARCH mode; never used so far in indexing because it does not support the morph. lexicons such as CELEX (e.g. eingeschränkt would not be stemmed to eingeschraenkt) | 25 public static int SEARCH = 3; // normalization in SEARCH mode; never used so far in indexing because it does not support the morph. lexicons such as CELEX (e.g. eingeschränkt would not be stemmed to eingeschraenkt) |
25 private int normMode = DISPLAY; // Default e.g. for indexing and querying | 26 private int normMode = DISPLAY; // Default e.g. for indexing and querying |
26 private String[] normFunctions = {"norm"}; // default is to use the norm function | 27 private String[] normFunctions = {"norm"}; // default is to use the norm function |