Mercurial > hg > mpdl-group
comparison software/eXist/mpdl-modules/src/de/mpg/mpiwg/berlin/mpdl/util/StringUtilEscapeChars.java @ 12:fba5577e49d9
diverse Fehlerbehebungen
author | Josef Willenborg <jwillenborg@mpiwg-berlin.mpg.de> |
---|---|
date | Tue, 19 Apr 2011 16:51:26 +0200 |
parents | 408254cf2f1d |
children |
comparison
equal
deleted
inserted
replaced
11:d6f528ad5d96 | 12:fba5577e49d9 |
---|---|
6 import java.text.StringCharacterIterator; | 6 import java.text.StringCharacterIterator; |
7 import java.util.regex.Matcher; | 7 import java.util.regex.Matcher; |
8 import java.util.regex.Pattern; | 8 import java.util.regex.Pattern; |
9 | 9 |
10 public class StringUtilEscapeChars { | 10 public class StringUtilEscapeChars { |
11 | |
12 /** | |
13 * Puts a zwsp between two ideographic characters (e.g. in CJK Unified Ideographs) | |
14 * @param str | |
15 * @return | |
16 */ | |
17 public static String zwsp(String str) { | |
18 // based on Unicode 3.2 | |
19 String ideographic = "[\u3300-\u33ff\u3400-\u4dbf\u4e00-\u9fff\uf900-\ufaff]"; | |
20 String regex = "(" + ideographic + ")(" + ideographic + ")"; | |
21 String retStr = str.replaceAll(regex, "$1\u200b$2"); | |
22 retStr = retStr.replaceAll(regex, "$1\u200b$2"); | |
23 return retStr; | |
24 } | |
25 | |
26 | |
11 public static String deleteSpecialXmlEntities(String inputStr) { | 27 public static String deleteSpecialXmlEntities(String inputStr) { |
12 inputStr = inputStr.replaceAll("<", ""); | 28 inputStr = inputStr.replaceAll("<", ""); |
13 inputStr = inputStr.replaceAll(">", ""); | 29 inputStr = inputStr.replaceAll(">", ""); |
14 inputStr = inputStr.replaceAll("&lt;", ""); | 30 inputStr = inputStr.replaceAll("&lt;", ""); |
15 inputStr = inputStr.replaceAll("&gt;", ""); | 31 inputStr = inputStr.replaceAll("&gt;", ""); |