JDK自带的Collator包含的汉字太少,对一些生僻的姓氏不能进行排序。推荐使用:
com.ibm.icu.text.Collator
<dependency>
<groupId>com.ibm.icu</groupId>
<artifactId>icu4j</artifactId>
<version>57.1</version>
</dependency>
package com.chinaunicom.planning.util;
import com.alibaba.fastjson.JSON;
import com.ibm.icu.text.Collator;
import com.ibm.icu.util.ULocale;
import lombok.extern.slf4j.Slf4j;
import java.util.List;
import java.util.Map;
/**
* @author shilei
* @date 2022-11-09 9:33
*/
@Slf4j
public class PinyinConvert {
static Collator collator;
static {
collator = Collator.getInstance(ULocale.SIMPLIFIED_CHINESE);
}
/**
* 按第一个汉字首字母默认升序
*
* @param o1
* @param o2
* @param keyName
* @return
*/
public static int orderByPinyinHeadChar(Object o1, Object o2, String keyName) {
return orderByPinyinHeadChar(o1, o2, keyName, false);
}
/**
* 按第一个汉字首字母排序
*
* @param o1
* @param o2
* @param keyName
* @param desc
* @return
*/
public static int orderByPinyinHeadChar(Object o1, Object o2, String keyName, boolean desc) {
Map<String, Object> d1;
Map<String, Object> d2;
if (!(o1 instanceof Map))
d1 = JSON.parseObject(JSON.toJSONString(o1), Map.class);
else
d1 = (Map<String, Object>) o1;
if (!(o2 instanceof Map))
d2 = JSON.parseObject(JSON.toJSONString(o2), Map.class);
else
d2 = (Map<String, Object>) o2;
if (desc)
return collator.compare(d2.get(keyName), d1.get(keyName));
else
return collator.compare(d1.get(keyName), d2.get(keyName));
}
/**
* 按第一个汉字首字母默认升序
*
* @param list
* @param keyName
* @return
*/
public static void orderByPinyinHeadChar(List<Map<String, Object>> list, String keyName) {
orderByPinyinHeadChar(list, keyName, false);
}
/**
* 按第一个汉字首字母排序
*
* @param list
* @param keyName
* @param desc
* @return
*/
public static void orderByPinyinHeadChar(List<Map<String, Object>> list, String keyName, boolean desc) {
if (desc)
list.sort((o1, o2) -> collator.compare(o2.get(keyName), o1.get(keyName)));
else
list.sort((o1, o2) -> collator.compare(o1.get(keyName), o2.get(keyName)));
}
}
另一种方式则是可先利用 pinyin4j 将其转换为拼音全拼,再取首字母进行比较排序:
<dependency>
<groupId>com.belerweb</groupId>
<artifactId>pinyin4j</artifactId>
<version>2.5.1</version>
</dependency>
// List<Map<String, Object>> list
Collections.sort(list, (o1, o2) -> {
String nameOne = PinyinConvert.getHeadCharLower((String) o1.get("a"));
String nameTwo = PinyinConvert.getHeadCharLower((String) o2.get("a"));
return nameOne.compareTo(nameTwo);
});
import net.sourceforge.pinyin4j.PinyinHelper;
import net.sourceforge.pinyin4j.format.HanyuPinyinCaseType;
import net.sourceforge.pinyin4j.format.HanyuPinyinOutputFormat;
import net.sourceforge.pinyin4j.format.HanyuPinyinToneType;
import net.sourceforge.pinyin4j.format.HanyuPinyinVCharType;
import net.sourceforge.pinyin4j.format.exception.BadHanyuPinyinOutputFormatCombination;
public class PinyinConvert {
/**
* 获取全拼
*
* @param src
* @return
*/
public static String getPingYin(String src) {
char[] chars = src.toCharArray();
String[] strings;
HanyuPinyinOutputFormat format = new HanyuPinyinOutputFormat();
format.setCaseType(HanyuPinyinCaseType.LOWERCASE);
format.setToneType(HanyuPinyinToneType.WITHOUT_TONE);
format.setVCharType(HanyuPinyinVCharType.WITH_V);
String result = "";
int t0 = chars.length;
try {
for (int i = 0; i < t0; i++) {
// 判断是否为汉字字符
if (java.lang.Character.toString(chars[i]).matches("[\\u4E00-\\u9FA5]+")) {
strings = PinyinHelper.toHanyuPinyinStringArray(chars[i], format);
result += strings[0] + " ";
} else {
result += java.lang.Character.toString(chars[i]);
}
}
return result;
} catch (BadHanyuPinyinOutputFormatCombination e) {
e.printStackTrace();
}
return result;
}
/**
* 获取所有中文首字母
*
* @param str
* @return
*/
public static String getPinYinHeadChar(String str) {
String convert = "";
for (int i = 0; i < str.length(); i++) {
char word = str.charAt(i);
String[] pinyinArray = PinyinHelper.toHanyuPinyinStringArray(word);
if (pinyinArray != null) {
convert += pinyinArray[0].charAt(0);
} else {
convert += word;
}
}
return convert;
}
/**
* 获取第一个中文首字母并装换为小写
*
* @param str
* @return
*/
public static String getHeadCharLower(String str) {
String convert = "";
for (int i = 0; i < str.length(); i++) {
char word = str.charAt(i);
String[] pinyinArray = PinyinHelper.toHanyuPinyinStringArray(word);
if (pinyinArray != null) {
convert += pinyinArray[0].charAt(0);
} else {
convert += word;
}
}
char charAt = convert.charAt(0);
convert = String.valueOf(charAt).toLowerCase();
return convert;
}
/**
* 将字符串转移为ASCII码
*
* @param cnStr
* @return
*/
public static String getAscii(String cnStr) {
StringBuffer strBuf = new StringBuffer();
byte[] bGBK = cnStr.getBytes();
for (int i = 0; i < bGBK.length; i++) {
strBuf.append(Integer.toHexString(bGBK[i] & 0xff));
}
return strBuf.toString();
}
public static void main(String[] args) {
String cnStr = "长寿区";
System.out.println("获取转换后的拼音: " + getPingYin(cnStr));
System.out.println("获取各汉字首字母: " + getPinYinHeadChar(cnStr));
System.out.println("第一个字首字母 : " + getHeadCharLower(cnStr));
}
}
在此以作小记。
https://www.itzhimei.com/archives/2399.html
https://www.jianshu.com/p/ef01c7d70d14
https://blog.csdn.net/abcde123_123/article/details/107693404