对汉字依据首字母进行排序

JDK自带的Collator包含的汉字太少,对一些生僻的姓氏不能进行排序。推荐使用:

com.ibm.icu.text.Collator

<dependency>
    <groupId>com.ibm.icu</groupId>
    <artifactId>icu4j</artifactId>
    <version>57.1</version>
</dependency>
package com.chinaunicom.planning.util;

import com.alibaba.fastjson.JSON;
import com.ibm.icu.text.Collator;
import com.ibm.icu.util.ULocale;
import lombok.extern.slf4j.Slf4j;

import java.util.List;
import java.util.Map;

/**
 * @author shilei
 * @date 2022-11-09 9:33
 */
@Slf4j
public class PinyinConvert {
    static Collator collator;

    static {
        collator = Collator.getInstance(ULocale.SIMPLIFIED_CHINESE);
    }

    /**
     * 按第一个汉字首字母默认升序
     *
     * @param o1
     * @param o2
     * @param keyName
     * @return
     */
    public static int orderByPinyinHeadChar(Object o1, Object o2, String keyName) {
        return orderByPinyinHeadChar(o1, o2, keyName, false);
    }

    /**
     * 按第一个汉字首字母排序
     *
     * @param o1
     * @param o2
     * @param keyName
     * @param desc
     * @return
     */
    public static int orderByPinyinHeadChar(Object o1, Object o2, String keyName, boolean desc) {
        Map<String, Object> d1;
        Map<String, Object> d2;
        if (!(o1 instanceof Map))
            d1 = JSON.parseObject(JSON.toJSONString(o1), Map.class);
        else
            d1 = (Map<String, Object>) o1;
        if (!(o2 instanceof Map))
            d2 = JSON.parseObject(JSON.toJSONString(o2), Map.class);
        else
            d2 = (Map<String, Object>) o2;
        if (desc)
            return collator.compare(d2.get(keyName), d1.get(keyName));
        else
            return collator.compare(d1.get(keyName), d2.get(keyName));
    }

    /**
     * 按第一个汉字首字母默认升序
     *
     * @param list
     * @param keyName
     * @return
     */
    public static void orderByPinyinHeadChar(List<Map<String, Object>> list, String keyName) {
        orderByPinyinHeadChar(list, keyName, false);
    }

    /**
     * 按第一个汉字首字母排序
     *
     * @param list
     * @param keyName
     * @param desc
     * @return
     */
    public static void orderByPinyinHeadChar(List<Map<String, Object>> list, String keyName, boolean desc) {
        if (desc)
            list.sort((o1, o2) -> collator.compare(o2.get(keyName), o1.get(keyName)));
        else
            list.sort((o1, o2) -> collator.compare(o1.get(keyName), o2.get(keyName)));
    }

}

另一种方式则是可先利用 pinyin4j 将其转换为拼音全拼,再取首字母进行比较排序:

<dependency>
   <groupId>com.belerweb</groupId>
   <artifactId>pinyin4j</artifactId>
   <version>2.5.1</version>
</dependency>
// List<Map<String, Object>> list
Collections.sort(list, (o1, o2) -> {
    String nameOne = PinyinConvert.getHeadCharLower((String) o1.get("a"));
    String nameTwo = PinyinConvert.getHeadCharLower((String) o2.get("a"));
    return nameOne.compareTo(nameTwo);
});
import net.sourceforge.pinyin4j.PinyinHelper;
import net.sourceforge.pinyin4j.format.HanyuPinyinCaseType;
import net.sourceforge.pinyin4j.format.HanyuPinyinOutputFormat;
import net.sourceforge.pinyin4j.format.HanyuPinyinToneType;
import net.sourceforge.pinyin4j.format.HanyuPinyinVCharType;
import net.sourceforge.pinyin4j.format.exception.BadHanyuPinyinOutputFormatCombination;

public class PinyinConvert {
    /**
     * 获取全拼
     *
     * @param src
     * @return
     */
    public static String getPingYin(String src) {
        char[] chars = src.toCharArray();
        String[] strings;
        HanyuPinyinOutputFormat format = new HanyuPinyinOutputFormat();
        format.setCaseType(HanyuPinyinCaseType.LOWERCASE);
        format.setToneType(HanyuPinyinToneType.WITHOUT_TONE);
        format.setVCharType(HanyuPinyinVCharType.WITH_V);
        String result = "";
        int t0 = chars.length;
        try {
            for (int i = 0; i < t0; i++) {
                // 判断是否为汉字字符
                if (java.lang.Character.toString(chars[i]).matches("[\\u4E00-\\u9FA5]+")) {
                    strings = PinyinHelper.toHanyuPinyinStringArray(chars[i], format);
                    result += strings[0] + " ";
                } else {
                    result += java.lang.Character.toString(chars[i]);
                }
            }
            return result;
        } catch (BadHanyuPinyinOutputFormatCombination e) {
            e.printStackTrace();
        }
        return result;
    }

    /**
     * 获取所有中文首字母
     *
     * @param str
     * @return
     */
    public static String getPinYinHeadChar(String str) {
        String convert = "";
        for (int i = 0; i < str.length(); i++) {
            char word = str.charAt(i);
            String[] pinyinArray = PinyinHelper.toHanyuPinyinStringArray(word);
            if (pinyinArray != null) {
                convert += pinyinArray[0].charAt(0);
            } else {
                convert += word;
            }
        }
        return convert;
    }

    /**
     * 获取第一个中文首字母并装换为小写
     *
     * @param str
     * @return
     */
    public static String getHeadCharLower(String str) {
        String convert = "";
        for (int i = 0; i < str.length(); i++) {
            char word = str.charAt(i);
            String[] pinyinArray = PinyinHelper.toHanyuPinyinStringArray(word);
            if (pinyinArray != null) {
                convert += pinyinArray[0].charAt(0);
            } else {
                convert += word;
            }
        }
        char charAt = convert.charAt(0);
        convert = String.valueOf(charAt).toLowerCase();
        return convert;
    }

    /**
     * 将字符串转移为ASCII码
     *
     * @param cnStr
     * @return
     */
    public static String getAscii(String cnStr) {
        StringBuffer strBuf = new StringBuffer();
        byte[] bGBK = cnStr.getBytes();
        for (int i = 0; i < bGBK.length; i++) {
            strBuf.append(Integer.toHexString(bGBK[i] & 0xff));
        }
        return strBuf.toString();
    }

    public static void main(String[] args) {
        String cnStr = "长寿区";
        System.out.println("获取转换后的拼音: " + getPingYin(cnStr));
        System.out.println("获取各汉字首字母: " + getPinYinHeadChar(cnStr));
        System.out.println("第一个字首字母 : " + getHeadCharLower(cnStr));
    }

}

在此以作小记。

https://www.itzhimei.com/archives/2399.html

https://www.jianshu.com/p/ef01c7d70d14

https://blog.csdn.net/abcde123_123/article/details/107693404

  • 0
    点赞
  • 0
    收藏
    觉得还不错? 一键收藏
  • 0
    评论
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值