comparison software/eXist/mpdl-modules/src/de/mpg/mpiwg/berlin/mpdl/util/StringUtilEscapeChars.java @ 12:fba5577e49d9

diverse Fehlerbehebungen
author Josef Willenborg <jwillenborg@mpiwg-berlin.mpg.de>
date Tue, 19 Apr 2011 16:51:26 +0200
parents 408254cf2f1d
children
comparison
equal deleted inserted replaced
11:d6f528ad5d96 12:fba5577e49d9
6 import java.text.StringCharacterIterator; 6 import java.text.StringCharacterIterator;
7 import java.util.regex.Matcher; 7 import java.util.regex.Matcher;
8 import java.util.regex.Pattern; 8 import java.util.regex.Pattern;
9 9
10 public class StringUtilEscapeChars { 10 public class StringUtilEscapeChars {
11
12 /**
13 * Puts a zwsp between two ideographic characters (e.g. in CJK Unified Ideographs)
14 * @param str
15 * @return
16 */
17 public static String zwsp(String str) {
18 // based on Unicode 3.2
19 String ideographic = "[\u3300-\u33ff\u3400-\u4dbf\u4e00-\u9fff\uf900-\ufaff]";
20 String regex = "(" + ideographic + ")(" + ideographic + ")";
21 String retStr = str.replaceAll(regex, "$1\u200b$2");
22 retStr = retStr.replaceAll(regex, "$1\u200b$2");
23 return retStr;
24 }
25
26
11 public static String deleteSpecialXmlEntities(String inputStr) { 27 public static String deleteSpecialXmlEntities(String inputStr) {
12 inputStr = inputStr.replaceAll("&lt;", ""); 28 inputStr = inputStr.replaceAll("&lt;", "");
13 inputStr = inputStr.replaceAll("&gt;", ""); 29 inputStr = inputStr.replaceAll("&gt;", "");
14 inputStr = inputStr.replaceAll("&amp;lt;", ""); 30 inputStr = inputStr.replaceAll("&amp;lt;", "");
15 inputStr = inputStr.replaceAll("&amp;gt;", ""); 31 inputStr = inputStr.replaceAll("&amp;gt;", "");