中国語をunicodeに変換し、unicodeを中国語に変換する方法
2440 ワード
import java.util.regex.Matcher;
import java.util.regex.Pattern;
/**
* @date 2013-8-27 02:05:38
*/
public class CodeChange {
/**
* @date 2013-8-27 02:05:38
*/
/*
19
20
* Unicode
21
22
*/
public static String stringToUnicode(String s) {
String str = "";
for (int i = 0; i < s.length(); i++) {
int ch = (int) s.charAt(i);
if (ch > 255)
str += "\\u" + Integer.toHexString(ch);
else
str += "\\" + Integer.toHexString(ch);
}
return str;
}
/*
39
40
* Unicode
41
42
*/
public static String unicodeToString(String str) {
Pattern pattern = Pattern.compile("(\\\\u(\\p{XDigit}{4}))");
Matcher matcher = pattern.matcher(str);
char ch;
while (matcher.find()) {
ch = (char) Integer.parseInt(matcher.group(2), 16);
str = str.replace(matcher.group(1), ch + "");
}
return str;
}
public static void main(String[] args) {
// Unicode ,
String s1 = "\\ \\ \\ \\ \\,\\ \\ \\ \\ \\ ";
System.out.println("s1: " + s1);
// Unicode
String s2 = " , ";
s2 = CodeChange.stringToUnicode(s2);
System.out.println("s2: " + s2);
// Unicode
String aaa ="\u4ec0\u4e48\u662f\u5b89\u5168\u63a7\u4ef6\uff1f###\u5b89\u5168\u63a7\u4ef6\u53ef\u4ee5\u4fdd\u8bc1\u7528\u6237\u7684\u5bc6\u7801\u4e0d\u88ab\u7a83\u53d6\uff0c\u4ece\u800c\u4fdd\u8bc1\u8d44\u91d1\u5b89\u5168";
String s3 = CodeChange.unicodeToString(aaa);
System.out.println("s3: " + s3);
}
}