package data.test;

import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

public class UnicodeToUtf8 {
	
	private static final Logger logger = LoggerFactory.getLogger(UnicodeToUtf8.class);
	
	public static String decodeUnicode(String unicodeStr) {
		char aChar;
		int len = unicodeStr.length();
		StringBuffer outBuffer = new StringBuffer(len);
		for (int x = 0; x < len;) {
			aChar = unicodeStr.charAt(x++);
			if (aChar == '\\') {
				aChar = unicodeStr.charAt(x++);
				if (aChar == 'u') {
					// Read the xxxx
					int value = 0;
					for (int i = 0; i < 4; i++) {
						aChar = unicodeStr.charAt(x++);
						switch (aChar) {
						case '0':
						case '1':
						case '2':
						case '3':
						case '4':
						case '5':
						case '6':
						case '7':
						case '8':
						case '9':
							value = (value << 4) + aChar - '0';
							break;
						case 'a':
						case 'b':
						case 'c':
						case 'd':
						case 'e':
						case 'f':
							value = (value << 4) + 10 + aChar - 'a';
							break;
						case 'A':
						case 'B':
						case 'C':
						case 'D':
						case 'E':
						case 'F':
							value = (value << 4) + 10 + aChar - 'A';
							break;
						default:
							logger.warn("{}","UnicodeToUtf8 exception!");
							return "";
						}

					}
					outBuffer.append((char) value);
				} else {
					if (aChar == 't')
						aChar = '\t';
					else if (aChar == 'r')
						aChar = '\r';
					else if (aChar == 'n')
						aChar = '\n';
					else if (aChar == 'f')
						aChar = '\f';
					outBuffer.append(aChar);
				}
			} else
				outBuffer.append(aChar);
		}
		return outBuffer.toString();
	}
	
	public static void main(String[] args) {
		String str = "\u7acb\u767d_\u5168\u81ea\u52a8\u6d53\u7f29_\u6d17\u8863\u7c89_900g";
		str = decodeUnicode(str);
		System.out.println(str);
		
	}
	
}

Logo

技术共进,成长同行——讯飞AI开发者社区

更多推荐