热门标签 | HotTags
当前位置:  开发笔记 > 编程语言 > 正文

javagbk转机内码_Java实现的UTF8,GBK,Unicode编码相互转换的代码

java实现UTF-8,GBK,Unicode编码相互转换,代码如下:publicclassUTF2GBK{publicSt

java实现UTF-8,GBK,Unicode编码相互转换,代码如下:

public class UTF2GBK {

public String gbk2utf8(String gbk) {

String l_temp = GBK2Unicode(gbk);

l_temp = unicodeToUtf8(l_temp);

return l_temp;

}

public String utf82gbk(String utf) {

String l_temp = utf8ToUnicode(utf);

l_temp = Unicode2GBK(l_temp);

return l_temp;

}

/**

*

* @param str

* @return String

*/

public static String GBK2Unicode(String str) {

StringBuffer result = new StringBuffer();

for (int i = 0; i

char chr1 = (char) str.charAt(i);

if (!isNeedConvert(chr1)) {

result.append(chr1);

continue;

}

result.append("\\u" + Integer.toHexString((int) chr1));

}

return result.toString();

}

/**

*

* @param dataStr

* @return String

*/

public static String Unicode2GBK(String dataStr) {

int index = 0;

StringBuffer buffer = new StringBuffer();

int li_len = dataStr.length();

while (index

if (index >= li_len - 1

|| !"\\u".equals(dataStr.substring(index, index + 2))) {

buffer.append(dataStr.charAt(index));

index++;

continue;

}

String charStr = "";

charStr = dataStr.substring(index + 2, index + 6);

char letter = (char) Integer.parseInt(charStr, 16);

buffer.append(letter);

index += 6;

}

return buffer.toString();

}

public static boolean isNeedConvert(char para) {

return ((para & (0x00FF)) != para);

}

/**

* utf-8 转unicode

*

* @param inStr

* @return String

*/

public static String utf8ToUnicode(String inStr) {

char[] myBuffer = inStr.toCharArray();

StringBuffer sb = new StringBuffer();

for (int i = 0; i

UnicodeBlock ub = UnicodeBlock.of(myBuffer[i]);

if (ub == UnicodeBlock.BASIC_LATIN) {

sb.append(myBuffer[i]);

} else if (ub == UnicodeBlock.HALFWIDTH_AND_FULLWIDTH_FORMS) {

int j = (int) myBuffer[i] - 65248;

sb.append((char) j);

} else {

short s = (short) myBuffer[i];

String hexS = Integer.toHexString(s);

String unicode = "\\u" + hexS;

sb.append(unicode.toLowerCase());

}

}

return sb.toString();

}

/**

*

* @param theString

* @return String

*/

public static String unicodeToUtf8(String theString) {

char aChar;

int len = theString.length();

StringBuffer outBuffer = new StringBuffer(len);

for (int x = 0; x

aChar = theString.charAt(x++);

if (aChar == '\\') {

aChar = theString.charAt(x++);

if (aChar == 'u') {

// Read the xxxx

int value = 0;

for (int i &#61; 0; i <4; i&#43;&#43;) {

aChar &#61; theString.charAt(x&#43;&#43;);

switch (aChar) {

case &#39;0&#39;:

case &#39;1&#39;:

case &#39;2&#39;:

case &#39;3&#39;:

case &#39;4&#39;:

case &#39;5&#39;:

case &#39;6&#39;:

case &#39;7&#39;:

case &#39;8&#39;:

case &#39;9&#39;:

value &#61; (value <<4) &#43; aChar - &#39;0&#39;;

break;

case &#39;a&#39;:

case &#39;b&#39;:

case &#39;c&#39;:

case &#39;d&#39;:

case &#39;e&#39;:

case &#39;f&#39;:

value &#61; (value <<4) &#43; 10 &#43; aChar - &#39;a&#39;;

break;

case &#39;A&#39;:

case &#39;B&#39;:

case &#39;C&#39;:

case &#39;D&#39;:

case &#39;E&#39;:

case &#39;F&#39;:

value &#61; (value <<4) &#43; 10 &#43; aChar - &#39;A&#39;;

break;

default:

throw new IllegalArgumentException(

"Malformed \\uxxxx encoding.");

}

}

outBuffer.append((char) value);

} else {

if (aChar &#61;&#61; &#39;t&#39;)

aChar &#61; &#39;\t&#39;;

else if (aChar &#61;&#61; &#39;r&#39;)

aChar &#61; &#39;\r&#39;;

else if (aChar &#61;&#61; &#39;n&#39;)

aChar &#61; &#39;\n&#39;;

else if (aChar &#61;&#61; &#39;f&#39;)

aChar &#61; &#39;\f&#39;;

outBuffer.append(aChar);

}

} else

outBuffer.append(aChar);

}

return outBuffer.toString();

}

}



推荐阅读
author-avatar
LMS柳树_
这个家伙很懒,什么也没留下!
PHP1.CN | 中国最专业的PHP中文社区 | DevBox开发工具箱 | json解析格式化 |PHP资讯 | PHP教程 | 数据库技术 | 服务器技术 | 前端开发技术 | PHP框架 | 开发工具 | 在线工具
Copyright © 1998 - 2020 PHP1.CN. All Rights Reserved | 京公网安备 11010802041100号 | 京ICP备19059560号-4 | PHP1.CN 第一PHP社区 版权所有