【自然语言NLP】02:HanLP词性对应中文枚举(Java)

本文给出一个Java枚举,将HanLP内置的词性标签(如 n、v、nr)映射为对应的中文说明,便于在输出分词与词性标注结果时提高可读性,并提供按标签字符串查找枚举常量的方法。

摘要生成于 C知道 ,由 DeepSeek-R1 满血版支持, 前往体验 >


/**
 * Hanlp内置词性 (目前仅用于提高输出可读性)
 */
public enum HanLPEnums {

    A("a","形容词"),
    AD("ad","副形词"),
    AG("ag","形容词性语素"),
    AL("al","形容词性惯用语"),
    AN("an","名形词"),
    B("b","区别词"),
    BEGIN("begin","仅用于始##始"),
    BG("bg","区别语素"),
    BL("bl","区别词性惯用语"),
    C("c","连词"),
    CC( "cc","并列连词"),
    D("d","副词"),
    DG("dg","辄,俱,复之类的副词"),
    DL("dl","连语"),
    E("e","叹词"),
    END("end","仅用于终##终"),
    F("f","方位词"),
    G("g","学术词汇"),
    GB("gb","生物相关词汇"),
    GBC("gbc","生物类别"),
    GC("gc","化学相关词汇"),
    GG("gg","地理地质相关词汇"),
    GI("gi","计算机相关词汇"),
    GM("gm","数学相关词汇"),
    GP("gp","物理相关词汇"),
    H("h","前缀"),
    I("i","成语"),
    J("j","简称略语"),
    K("k","后缀"),
    L("l","习用语"),
    M("m","数词"),
    MG("mg","数语素"),
    _MG( "Mg","甲乙丙丁之类的数词"),
    MQ("mq","数量词"),
    N("n","名词"),
    NB("nb","生物名"),
    NBA("nba","动物名"),
    NBC("nbc","动物纲目"),
    NBP("nbp","植物名"),
    NF("nf","食品,比如“薯片”"),
    NG("ng","名词性语素"),
    NH("nh","医药疾病等健康相关名词"),
    NHD("nhd","疾病"),
    NHM("nhm","药品"),
    NI("ni","机构相关(不是独立机构名)"),
    NIC("nic","下属机构"),
    NIS("nis","机构后缀"),
    NIT("nit","教育相关机构"),
    NL("nl","名词性惯用语"),
    NM("nm","物品名"),
    NMC("nmc","化学品名"),
    NN("nn","工作相关名词"),
    NND("nnd","职业"),
    NNT("nnt","职务职称"),
    NR("nr","人名"),
    NR1("nr1","复姓"),
    NR2("nr2","蒙古姓名"),
    NRF("nrf","音译人名"),
    NRJ("nrj","日语人名"),
    NS("ns","地名"),
    NSF("nsf","音译地名"),
    NT("nt","机构团体名"),
    NTC("ntc","公司名"),
    NTCB("ntcb","银行"),
    NTCF("ntcf","工厂"),
    NTCH("ntch","酒店宾馆"),
    NTH("nth","医院"),
    NTO("nto","政府机构"),
    NTS("nts","中小学"),
    NTU("ntu","大学"),
    NX("nx","字母专名"),
    NZ("nz","其他专名"),
    O("o","拟声词"),
    P("p","介词"),
    PBA("pba","介词“把”"),
    PBEI("pbei","介词“被”"),
    Q("q","量词"),
    QG("qg","量词语素"),
    QT("qt","时量词"),
    QV("qv","动量词"),
    R("r","代词"),
    RG("rg","代词性语素"),
    _RG("Rg","古汉语代词性语素"),
    RR("rr","人称代词"),
    RY("ry","疑问代词"),
    RYS("rys","处所疑问代词"),
    RYT("ryt","时间疑问代词"),
    RYV("ryv","谓词性疑问代词"),
    RZ("rz","指示代词"),
    RZS("rzs","处所指示代词"),
    RZT("rzt","时间指示代词"),
    RZV("rzv","谓词性指示代词"),
    S("s","处所词"),
    T("t","时间词"),
    TG("tg","时间词性语素"),
    U("u","助词"),
    UD("ud","助词"),
    UDE1("ude1","的 底"),
    UDE2("ude2","地"),
    UDE3("ude3","得"),
    UDENG("udeng","等 等等 云云"),
    UDH("udh","的话"),
    UG("ug","过"),
    UGUO("uguo","过"),
    UJ("uj","助词"),
    UL("ul","连词"),
    ULE("ule","了 喽"),
    ULIAN("ulian","连 (“连小学生都会”)"),
    ULS("uls","来讲 来说 而言 说来"),
    USUO("usuo","所"),
    UV("uv","连词"),
    UYY("uyy","一样 一般 似的 般"),
    UZ("uz","着"),
    UZHE("uzhe","着"),
    UZHI("uzhi","之"),
    V("v","动词"),
    VD("vd","副动词"),
    VF("vf","趋向动词"),
    VG("vg","动词性语素"),
    VI("vi","不及物动词(内动词)"),
    VL("vl","动词性惯用语"),
    VN("vn","名动词"),
    VSHI("vshi","动词“是”"),
    VX("vx","形式动词"),
    VYOU("vyou","动词“有”"),
    W("w","标点符号"),
    WB("wb","百分号千分号,全角:% ‰   半角:%"),
    WD("wd","逗号,全角:, 半角:,"),
    WF("wf","分号,全角:; 半角: ;"),
    WH("wh","单位符号,全角:¥ $ £  °  ℃  半角:$"),
    WJ("wj","句号,全角:。"),
    WKY("wky","右括号,全角:) 〕  ] } 》  】 〗 〉 半角: ) ] { >"),
    WKZ("wkz","左括号,全角:( 〔  [  {  《 【  〖 〈   半角:( [ { <"),
    WM("wm","冒号,全角:: 半角: :"),
    WN("wn","顿号,全角:、"),
    WP("wp","破折号,全角:——   --   ——-   半角:—  —-"),
    WS("ws","省略号,全角:……  …"),
    WT("wt","叹号,全角:!"),
    WW("ww","问号,全角:?"),
    WYY("wyy","右引号,全角:” ’ 』"),
    WYZ("wyz","左引号,全角:“ ‘ 『"),
    X("x","字符串"),
    XU("xu","网址URL"),
    XX("xx","非语素字"),
    Y("y","语气词(delete yg)"),
    YG("yg","语气语素"),
    Z("z","状态词"),
    ZG("zg","状态词")
    ;
        public String KEY;
        public String VALUE;
    private HanLPEnums(String key, String value) {
            this.KEY = key;
            this.VALUE = value;
        }
        public static HanLPEnums get(String key) {
            HanLPEnums[] values = HanLPEnums.values();
            for (HanLPEnums object : values) {
                if (key.equals(object.KEY.toString())) {
                    return object;
                }
            }
            return null;
        }


    }

评论 1
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包

打赏作者

coder阿龙

你的鼓励将是我创作的最大动力

¥1 ¥2 ¥4 ¥6 ¥10 ¥20
扫码支付:¥1
获取中
扫码支付

您的余额不足,请更换扫码支付或充值

打赏作者

实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值