--- cdli/cdliSplitter.py 2007/04/23 13:07:10 1.6 +++ cdli/cdliSplitter.py 2007/08/31 14:22:52 1.7 @@ -30,7 +30,7 @@ def getSupportedEncoding(encodings): """beta of a fulltext splitter for cdli """ -ignoreLines=['$','@','#','&'] +ignoreLines=['$','@','#','&','>'] separators=[''] komma_exception="([^sStThH])," # komma relevant for graphemes will not be deleted deleteGraphems="\{|\}|<|>|\(|\)|-|_|\#|,|\||\]|\[|\!|\?" # for graphems