Java中文字符串和Unicode编码互换

| 阅读数:--次| 作者:小豆豆
摘要:Java中文字符串和Unicode编码互换
java代码
public class Test {

	public static void main(String[] args) {
		// 把中文转成Unicode编码
		System.out.println(gbEncoding("测试中文"));
		// 把Unicode编码转成中文
		String tt=decodeUnicode("\\u6d4b\\u8bd5\\u4e2d\\u6587");
		System.out.println(tt);
	}

	/**
	 * 把中文转成Unicode编码
	 * 
	 * @param gbString
	 * @return
	 */
	public static String gbEncoding(final String gbString) {
		char[] utfBytes = gbString.toCharArray();
		String unicodeBytes = "";
		for (int byteIndex = 0; byteIndex < utfBytes.length; byteIndex++) {
			String hexB = Integer.toHexString(utfBytes[byteIndex]);
			if (hexB.length() <= 2) {
				hexB = "00" + hexB;
			}
			unicodeBytes = unicodeBytes + "\\u" + hexB;
		}
		//System.out.println("unicodeBytes is: " + unicodeBytes);
		return unicodeBytes;
	}

	/**
	 * 把Unicode编码转成中文
	 * 
	 * @param dataStr
	 * @return
	 */
	public static String decodeUnicode(final String dataStr) {
		int start = 0;
		int end = 0;
		final StringBuffer buffer = new StringBuffer();
		while (start > -1) {
			end = dataStr.indexOf("\\u", start + 2);
			String charStr = "";
			if (end == -1) {
				charStr = dataStr.substring(start + 2, dataStr.length());
			} else {
				charStr = dataStr.substring(start + 2, end);
			}
			char letter = (char) Integer.parseInt(charStr, 16); // 16进制parse整形字符串。
			buffer.append(new Character(letter).toString());
			start = end;
		}
		return buffer.toString();
	}

}
返回顶部
学到老代码浏览 关闭浏览