// 引用 ("quote") -- stray page text, kept as a comment so the file compiles.
import net.sourceforge.pinyin4j.PinyinHelper;
import net.sourceforge.pinyin4j.format.HanyuPinyinOutputFormat;
import net.sourceforge.pinyin4j.format.HanyuPinyinToneType;
import java.util.regex.Matcher;
import java.util.regex.Pattern;
public class ChineseCharacterUtil {
// Characters that convertSingleHanZi2Pinyin answers with a fixed pinyin string
// before it consults pinyin4j.
// NOTE(review): presumably pinyin4j has no usable entry for these -- confirm.
/** Mapped to "gu". */
public static final char CHAR = '傦';
/** Mapped to "jin". */
public static final char CHAR1 = '琻';
/** Mapped to "zi". */
public static final char CHAR2 = '橴';
/** Mapped to "hai". */
public static final char CHAR3 = '塰';
/** Mapped to "me". */
public static final char CHAR4 = '嚒';
/** Mapped to "xing". */
public static final char CHAR5 = '哘';
/** Mapped to "yi". */
public static final char CHAR6 = '渏';
/**
 * Converts the Chinese characters of a string to pinyin and copies every other
 * character through unchanged.
 *
 * <p>A UTF-16 unit counts as Chinese when it lies in U+4E00..U+9FFF (simplified
 * and traditional characters). Such a unit is replaced by its full pinyin when
 * {@code full} is true, or by the first letter of its pinyin otherwise. A Chinese
 * character for which no pinyin can be found contributes nothing to the result in
 * either mode.
 *
 * @param hanZi text to convert; may be null
 * @param full  true for full pinyin, false for the first letter only
 * @return the converted text, or an empty string when {@code hanZi} is null or blank
 */
public static String convertHanZi2Pinyin(String hanZi, boolean full) {
    if (hanZi == null || "".equals(hanZi.trim())) {
        return "";
    }
    StringBuilder sb = new StringBuilder(hanZi.length());
    for (int i = 0; i < hanZi.length(); i++) {
        char unit = hanZi.charAt(i);
        // Plain range check: same result as matching the single character against
        // the U+4E00..U+9FFF character class, without compiling a regex per character.
        if (unit < '\u4E00' || unit > '\u9FFF') {
            sb.append(unit);
            continue;
        }
        String pinyin = convertSingleHanZi2Pinyin(unit);
        if (full) {
            sb.append(pinyin);
        } else if (!pinyin.isEmpty()) {
            // The lookup yields "" for characters it cannot resolve; taking
            // charAt(0) of that would throw StringIndexOutOfBoundsException.
            sb.append(pinyin.charAt(0));
        }
    }
    return sb.toString();
}
/**
 * Looks up the toneless pinyin of a single Chinese character.
 *
 * <p>The characters held in CHAR..CHAR6 have fixed answers; everything else is
 * resolved through pinyin4j. When a character has several readings, only the
 * first one is returned.
 *
 * @param hanZi the character to look up
 * @return the pinyin, or an empty string when the lookup returns null or throws
 */
private static String convertSingleHanZi2Pinyin(char hanZi) {
    // Fixed answers take precedence over the library lookup.
    switch (hanZi) {
        case CHAR:
            return "gu";
        case CHAR1:
            return "jin";
        case CHAR2:
            return "zi";
        case CHAR3:
            return "hai";
        case CHAR4:
            return "me";
        case CHAR5:
            return "xing";
        case CHAR6:
            return "yi";
        default:
            break;
    }

    HanyuPinyinOutputFormat toneless = new HanyuPinyinOutputFormat();
    toneless.setToneType(HanyuPinyinToneType.WITHOUT_TONE);
    try {
        String[] readings = PinyinHelper.toHanyuPinyinStringArray(hanZi, toneless);
        if (readings == null) {
            return "";
        }
        // Only the first reading is used. String.valueOf renders a null entry
        // the same way appending it to a StringBuilder would.
        return String.valueOf(readings[0]);
    } catch (Exception e) {
        e.printStackTrace();
        return "";
    }
}
/**
 * Reports whether a regular expression matches anywhere inside a string.
 *
 * @param str   the source string to search
 * @param regex the regular expression; it is compiled on every call
 * @return true if at least one match is found, false otherwise
 */
public static boolean match(String str, String regex) {
    return Pattern.compile(regex).matcher(str).find();
}
/**
 * Demo entry point: prints the first-letter conversion of one sample character.
 *
 * @param args command-line arguments (unused)
 */
public static void main(String[] args) {
    String initials = convertHanZi2Pinyin("渏", false);
    System.out.println(initials);
}