在Java中,char采用UTF-16编码单元来表示Unicode字符,占两个字节、16个二进制位,取值范围为0x0000到0xFFFF。单个char只能表示基本多文种平面(BMP)内的字符;码点超过0xFFFF的补充字符(例如部分生僻汉字和emoji)需要用两个char组成的代理对(surrogate pair)来表示。
package com.sxu.cs.foundation;
/**
 * Small demonstration of how a Java {@code char} relates to its numeric
 * Unicode value.
 *
 * <p>The program prints, in order:
 * <ol>
 *   <li>the numeric value of the character U+4E2D (20013),</li>
 *   <li>the character obtained from the decimal literal 20013,</li>
 *   <li>whether the decimal and hexadecimal forms denote the same char,</li>
 *   <li>every character from {@link #RANGE_LOW} to {@link #RANGE_HIGH},
 *       both ends included, one per line.</li>
 * </ol>
 *
 * <p>Other ranges that can be substituted for the constants below:
 * <ul>
 *   <li>0000-007F: C0 controls and Basic Latin</li>
 *   <li>0080-00FF: C1 controls and Latin-1 Supplement</li>
 *   <li>0250-02AF: IPA Extensions</li>
 * </ul>
 */
public class Unicode {

    /** First character of the printed range (Chinese range 4E00-9FBF). */
    private static final int RANGE_LOW = 0x4E00;

    /** Last character of the printed range, inclusive. */
    private static final int RANGE_HIGH = 0x9FBF;

    /**
     * Runs the demonstration and writes its results to standard output.
     *
     * @param args command-line arguments; not used
     */
    public static void main(String[] args) {
        // U+4E2D written as an escape so the result does not depend on the
        // encoding the source file is compiled with.
        char ch1 = '\u4E2D';

        // Widening a char to int yields its UTF-16 code unit value.
        int i = ch1;
        System.out.println(i); // 20013

        // A constant int in the char range may be assigned to a char directly.
        char ch2 = 20013;
        System.out.println(ch2);

        // The same value written in hexadecimal denotes the same character.
        char ch3 = 0x4E2D;
        System.out.println(ch2 == ch3);

        char[] ch4 = charsInRange(RANGE_LOW, RANGE_HIGH);
        for (char c : ch4) {
            System.out.println(c);
        }
    }

    /**
     * Builds an array holding every char from {@code low} to {@code high}.
     *
     * <p>Both bounds are inclusive, so the array has
     * {@code high - low + 1} elements; sizing it as {@code high - low}
     * would silently drop the final character.
     *
     * @param low  value of the first char in the result
     * @param high value of the last char in the result; the caller is
     *             expected to pass {@code high >= low}, both within
     *             0x0000-0xFFFF
     * @return the chars {@code low, low + 1, ..., high} in ascending order
     */
    private static char[] charsInRange(int low, int high) {
        char[] result = new char[high - low + 1];
        for (int offset = 0; offset < result.length; offset++) {
            result[offset] = (char) (low + offset);
        }
        return result;
    }
}