UTF-8转换自写代码(1)
针对早上的代码做了一些美化,逻辑上更清楚一些。
主要用到通过二进制操作提取相应位的字节来实现。
package test;
import java.util.Scanner;
public class UnicodeTest {
public static void main(String[] args) {
// TODO Auto-generated method stub
System.out.println("Please input the Unicode:");
Scanner scanner=new Scanner(System.in);
String resultString=null;
int unicode=scanner.nextInt();
resultString=changeToUTF8(unicode);
resultString=formatString(resultString);
System.out.println(resultString);
}
public static String changeToUTF8(int unicode) {
String binary=Integer.toBinaryString(unicode);
int status=binary.length();
if(status>0&&status<8)
status=1;
if(status>7&&status<12)
status=2;
if(status>11&&status<17)
status=3;
if(status>16&&status<22)
status=4;
String result=null;
switch (status) {
case 1:
result=binary;
break;
case 2:
int part1=unicode>>6;
part1=192|part1; //2^7+2^6=192
result=Integer.toBinaryString(part1);
while(status-1!=0) {
part1=unicode>>(status-2)*6;
part1=part1&63;
part1=128|part1;
result=result+Integer.toBinaryString(part1);
status--;
}
break;
case 3:
part1=unicode>>12;
part1=224|part1; //2^7+2^6+2^5=224
result=Integer.toBinaryString(part1);
while(status-1!=0) {
part1=unicode>>(status-2)*6;
part1=part1&63;
part1=128|part1;
result=result+Integer.toBinaryString(part1);
status--;
}
break;
case 4:
part1=unicode>>18;
part1=240|part1; //2^7+2^6+2^5+2^4=240
result=Integer.toBinaryString(part1);
while(status-1!=0) {
part1=unicode>>(status-2)*6;
part1=part1&63;
part1=128|part1;
result=result+Integer.toBinaryString(part1);
status--;
}
break;
default:
result="Out of range!";
break;
}
return result;
}
public static String formatString(String resultString) {
String result=null;
int length=resultString.length();
result=resultString.substring(0, length%8);
for(int i=0;i<length/8;i++) {
result=result+" "+resultString.substring(length%8+8*i, length%8+8*(i+1));
}
return result;
}
}