1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148
|
/*
* Copyright (C) 2001-2013 Michael Fuchs
*
* This file is part of herold.
*
* herold is free software: you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* herold is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with herold. If not, see <http://www.gnu.org/licenses/>.
*/
package org.dbdoclet.service;
import java.util.regex.Matcher;
import java.util.regex.Pattern;
/**
* Die Klasse <code>UnicodeServices</code> stellt eine Sammlung statischer
* Methoden zur Bearbeitung von Unicode zur Verfügung.
*
* @author <a href="mailto:michael.fuchs@unico-group.com">Michael Fuchs</a>
* @version 1.0
*/
public class UnicodeServices {
private static Pattern pattern = Pattern.compile("\\\\u[0-9a-fA-F]{4}");
public static String escape(char c) {
char[] v = new char[1];
v[0] = c;
return escape(new String(v));
}
/**
* Die Methode <code>escape</code> wandelt die Zeichenkette
* <code>str</code> in eine 7-bit ASCII Darstellung um.
*
* @param str <code>String</code>
* @return <code>String</code>
*/
public static String escape(String str) {
if (str == null) {
return "";
}
StringBuffer buffer = new StringBuffer();
for (int i = 0; i < str.length(); i++) {
char c = str.charAt(i);
int n = c;
if (c == '\r') {
continue;
}
if (n >= 0 && n < 128 && c != '\n' && c != '\\') {
buffer.append(c);
} else {
buffer.append("\\u");
String hex = Integer.toHexString(n);
for (int j = 0; j < 4 - hex.length(); j++) {
buffer.append("0");
}
buffer.append(hex);
}
}
return buffer.toString();
}
public static String unescape(String str) {
Matcher matcher = pattern.matcher(str);
char[] c = new char[1];
String escape;
String buffer;
String part1;
String part2;
while (matcher.find()) {
escape = matcher.group();
c[0] = (char) Integer.parseInt(escape.substring(2), 16);
buffer = new String(c);
// System.out.println("buffer = " + buffer);
part1 = str.substring(0, matcher.start());
// System.out.println("part1 = " + part1);
part2 = str.substring(matcher.end());
// System.out.println("part2 = " + part2);
str = part1 + buffer + part2;
// System.out.println("str = " + str);
matcher.reset(str);
}
return str;
}
public static String removeUndefinedCharacters(String text) {
if (text == null || text.length() == 0) {
return "";
}
StringBuffer textBuffer = new StringBuffer(text);
StringBuffer buffer = new StringBuffer();
char c;
for (int i = 0; i < textBuffer.length(); i++) {
c = textBuffer.charAt(i);
if (c == '\n' || c == '\t') {
buffer.append(c);
continue;
}
if (Character.isISOControl(c) == false
&& Character.isDefined(c) == true) {
buffer.append(c);
}
}
return buffer.toString();
}
}
|