java txt ansi_TXT文件编码为ANSI,怎么实现用JAVA程序转换为Uncoide

该博客提供了一个Java代码示例,实现了字符编码转换与判断功能。代码包含将汉字转Unicode、转16进制、16进制转区位码、Unicode转中文等方法,还提供了判断字符是否为中文和是否为乱码的方法。

摘要生成于 C知道 ,由 DeepSeek-R1 满血版支持, 前往体验 >

展开全部

package test;

import java.io.UnsupportedEncodingException;

import java.util.regex.Matcher;

import java.util.regex.Pattern;

public class CodeUtil { public static void main(String[] args) throws UnsupportedEncodingException {

String chinaString = "测试";

String unicode = convertToUnicode(chinaString);

System.out.println(unicode);

System.out.println(unicodeToChinese(unicode));

String _x16 = convertTo16Code(chinaString, "UTF-8").toLowerCase();

System.out.println(_x16);

String[] sby = convertToBitCode(_x16);

StringBuffer subf = new StringBuffer();

subf.append("byte[] bytes = {");

byte[] bytes = new byte[sby.length];

for (int i = 0; i < sby.length; i++) {

int icode = Integer.decode(sby[i]).intValue();

bytes[i] = (byte) icode;

subf.append("(byte)").append(sby[i]).append(",");

// System.out.println(sby[i]);

}

subf.deleteCharAt(subf.length() - 1);

subf.append("};");

System.out.println(subf.toString());

System.out.println(new String(bytes, "UTF-8"));

}

private final static String hexString = "0123456789ABCDEF";

/**

* 转e68a84323131333532363134313032313635333133333036376516进制,如果是中文,encoding-->>UTF-8

*/

public static String convertTo16Code(String str, String encoding)

throws UnsupportedEncodingException {

byte[] bytes = str.getBytes(encoding);

StringBuffer sb = new StringBuffer(bytes.length * 2);

for (int i = 0; i < bytes.length; i++) {

sb.append(hexString.charAt((bytes[i] & 0xf0) >> 4));

sb.append(hexString.charAt((bytes[i] & 0x0f) >> 0));

}

return sb.toString();

}

/**

* 将汉字转Unicode

*

* @param String

* s

* @return String sb.toString();

*/

public static String convertToUnicode(String s) {

if (s == null) {

return s;

}

char[] chars = s.toCharArray();

char c;

StringBuffer sb = new StringBuffer();

for (int i = 0; i < chars.length; i++) {

c = chars[i];

if (c > 0xff) {

sb.append("\\u").append(Integer.toHexString(c));

} else {

sb.append(c);

}

}

return sb.toString();

}

/**

* 将16进制转为区位码

*

* @param

*/

public static String[] convertToBitCode(String str_16) {

String[] result = null;

if (str_16 == null || str_16 == "" || str_16.length() % 2 != 0) {

return result;

}

result = new String[str_16.length() / 2];

for (int i = 0; i < str_16.length() / 2; i++) {

result[i] = "0x" + str_16.charAt(i * 2) + str_16.charAt(i * 2 + 1);

}

return result;

}

/**

*

*/

public static String unicodeToChinese(String unicodeStr) {

int start = 0;

int end = 0;

final StringBuffer buffer = new StringBuffer();

while (start > -1) {

end = unicodeStr.indexOf("\\u", start + 2);

String charStr = "";

if (end == -1) {

charStr = unicodeStr.substring(start + 2, unicodeStr.length());

} else {

charStr = unicodeStr.substring(start + 2, end);

}

char letter = (char) Integer.parseInt(charStr, 16);

buffer.append(new Character(letter).toString());

start = end;

}

return buffer.toString();

}

public static boolean isChinese(char c) {

Character.UnicodeBlock ub = Character.UnicodeBlock.of(c);

if (ub == Character.UnicodeBlock.CJK_UNIFIED_IDEOGRAPHS

|| ub == Character.UnicodeBlock.CJK_COMPATIBILITY_IDEOGRAPHS

|| ub == Character.UnicodeBlock.CJK_UNIFIED_IDEOGRAPHS_EXTENSION_A

|| ub == Character.UnicodeBlock.GENERAL_PUNCTUATION

|| ub == Character.UnicodeBlock.CJK_SYMBOLS_AND_PUNCTUATION

|| ub == Character.UnicodeBlock.HALFWIDTH_AND_FULLWIDTH_FORMS) {

return true;

}

return false;

}

public static boolean isMessyCode(String str) {

Pattern p = Pattern.compile("\\s*|\t*|\r*|\n*");

Matcher m = p.matcher(str);

String after = m.replaceAll("");

String temp = after.replaceAll("\\p{P}", "");

char[] ch = temp.trim().toCharArray();

float chLength = ch.length;

float count = 0;

for (int i = 0; i < ch.length; i++) {

char c = ch[i];

if (!Character.isLetterOrDigit(c)) {

if (!isChinese(c)) {

count = count + 1;

System.out.print(c);

}

}

}

float result = count / chLength;

if (result > 0.4) {

return true;

} else {

return false;

}

}

}

这个你懂了,解决你的问题就是小意思了

本回答由提问者推荐

2Q==

已赞过

已踩过<

你对这个回答的评价是?

评论

收起

评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值