Java 按字节截取字符串

最新推荐文章于 2024-05-07 09:19:13 发布

Aseveng

最新推荐文章于 2024-05-07 09:19:13 发布

阅读量502

点赞数

分类专栏： Java学习

本文链接：https://blog.csdn.net/aseveng/article/details/78255059

版权

Java学习专栏收录该内容

205 篇文章 0 订阅

订阅专栏

package io.p7.encoding;

import java.io.UnsupportedEncodingException;

/**
 * Demonstrates truncating a string to a maximum number of encoded bytes
 * without leaving a partially encoded character at the end.
 *
 * <p>In Java the strings "abcd" and "ab你好" both have a length of four
 * characters, but their encoded byte counts differ (in GBK a Chinese character
 * occupies two bytes, in UTF-8 it occupies three). When a byte limit falls in
 * the middle of a character, the incomplete character is dropped. For "ab你好"
 * in GBK: 3 bytes gives "ab", 4 bytes gives "ab你", and 5 bytes still gives
 * "ab你".
 */
public class Test {

	/**
	 * Prints the UTF-8 truncation of a sample string for every byte limit from
	 * 1 up to the full encoded length of that string.
	 *
	 * @param args unused
	 * @throws UnsupportedEncodingException if the "utf-8" charset name is not supported
	 */
	public static void main(String[] args) throws UnsupportedEncodingException {
		String str="ab你好cd谢谢";

		int len=str.getBytes("utf-8").length;
		for(int x=0;x<len;x++) {
			System.out.println("截取"+(x+1)+"个字节结果为："+curStringByU8Byte(str, x+1));
		}
	}

	/**
	 * Returns the longest prefix of {@code str} whose UTF-8 encoding is at most
	 * {@code len} bytes long and ends on a character boundary.
	 *
	 * @param str the string to truncate; must not be null
	 * @param len the maximum number of UTF-8 bytes to keep; values below zero
	 *            are treated as zero and values above the encoded length keep
	 *            the whole string
	 * @return the truncated string, never containing a partial character
	 * @throws UnsupportedEncodingException if the "utf-8" charset name is not supported
	 */
	private static String curStringByU8Byte(String str, int len) throws UnsupportedEncodingException {
		byte[] buf=str.getBytes("utf-8");

		// Clamp so that out-of-range limits neither index past the array nor go negative.
		int end=Math.max(0, Math.min(len, buf.length));

		// UTF-8 continuation bytes have the bit pattern 10xxxxxx. If the first
		// byte that would be cut off is a continuation byte, the cut falls inside
		// a multi-byte character, so back up to that character's lead byte.
		// This works for 2-, 3- and 4-byte sequences alike.
		while(end>0 && end<buf.length && (buf[end] & 0xC0)==0x80) {
			end--;
		}
		return new String(buf,0,end,"utf-8");
	}

	/**
	 * Returns the longest prefix of {@code str} whose GBK encoding is at most
	 * {@code len} bytes long and does not end with half of a two-byte character.
	 *
	 * @param str the string to truncate; must not be null
	 * @param len the maximum number of GBK bytes to keep; values below zero
	 *            are treated as zero and values above the encoded length keep
	 *            the whole string
	 * @return the truncated string, never containing a partial character
	 * @throws UnsupportedEncodingException if the "gbk" charset name is not supported
	 */
	public static String curStringByByte(String str,int len) throws UnsupportedEncodingException {
		byte[] buf=str.getBytes("gbk");

		// Clamp so that out-of-range limits neither index past the array nor go negative.
		int end=Math.max(0, Math.min(len, buf.length));

		// Count the run of negative (high-bit-set) bytes that ends at the cut.
		// A GBK lead byte always has the high bit set, so the first non-negative
		// byte found going backwards is the end of a complete character. The
		// negative run after it is then a sequence of two-byte pairs (assuming
		// the encoder emits no single-byte values >= 0x80), so an odd count
		// means the last byte kept is a lead byte without its trail byte.
		int count=0;
		for(int x=end-1;x>=0 && buf[x]<0;x--) {
			count++;
		}
		if(count%2!=0) {
			end--; // drop the dangling lead byte
		}
		return new String(buf,0,end,"gbk");
	}

}