中国語をunicodeに変換し、unicodeを中国語に変換する方法

2440 ワード


import java.util.regex.Matcher;
import java.util.regex.Pattern;

/**
 * @date 2013-8-27  02:05:38
 */
public class CodeChange {
	/**
	 * @date 2013-8-27  02:05:38
	 */
			/*
			19
			 
			20
			 *   Unicode 
			21
			 
			22
			 */
			    public static String stringToUnicode(String s) {
			
			        String str = "";
			
			        for (int i = 0; i < s.length(); i++) {
			
			            int ch = (int) s.charAt(i);
			
			            if (ch > 255)
			
			                str += "\\u" + Integer.toHexString(ch);
			
			            else
			
			                str += "\\" + Integer.toHexString(ch);
			
			        }
			
			        return str;
			
			    }
		
			/*
			39
			 
			40
			 *   Unicode 
			41
			 
			42
			 */
			    public static String unicodeToString(String str) {
			        Pattern pattern = Pattern.compile("(\\\\u(\\p{XDigit}{4}))");   
			
			        Matcher matcher = pattern.matcher(str);
		
			        char ch;
		
			        while (matcher.find()) {
		
			            ch = (char) Integer.parseInt(matcher.group(2), 16);
		
			            str = str.replace(matcher.group(1), ch + "");   
			        }
			        return str;
			    }
			    public static void main(String[] args) {
			        //  Unicode , 
		
			        String s1 = "\\ \\ \\ \\ \\,\\ \\ \\ \\ \\ ";
		
			        System.out.println("s1: " + s1);
	
			        // Unicode 
			        String s2 = " , ";
	
			        s2 = CodeChange.stringToUnicode(s2);

			        System.out.println("s2: " + s2);

			        // Unicode 
			        String aaa ="\u4ec0\u4e48\u662f\u5b89\u5168\u63a7\u4ef6\uff1f###\u5b89\u5168\u63a7\u4ef6\u53ef\u4ee5\u4fdd\u8bc1\u7528\u6237\u7684\u5bc6\u7801\u4e0d\u88ab\u7a83\u53d6\uff0c\u4ece\u800c\u4fdd\u8bc1\u8d44\u91d1\u5b89\u5168";
			        String s3 = CodeChange.unicodeToString(aaa);

			        System.out.println("s3: " + s3);
			    }
	}