字典文件读取

/**
 * 词工具
 *
 */
public class WordUtil {
    private final static Logger logger = LoggerFactory.getLogger(WordUtil.class);
    public static Map<Property,List<String>> synonymMap = Maps.newHashMap();
    public static Map<String,List<String>> propertySynonymMap = Maps.newHashMap();
    public static Map<String,List<String>> synnonymPropertyMap = Maps.newHashMap();
    public static Map<String,Integer> duplicateSyn = Maps.newHashMap();
    public static Map<String,Synonym> duplicateSynonymMap = Maps.newHashMap();
    public static Map<String,Synonym> unDuplicateSynonymMap = Maps.newHashMap();
    
    static {
        loadSynonymDic();
    }
    private static void loadSynonymDic(){
     //获取字典文件的io流进行读取
try (BufferedReader br = new BufferedReader(new InputStreamReader(WordUtil.class.getResourceAsStream("/dic/synonym.txt"), "UTF-8"))) { String line; while ((line = br.readLine()) != null) { String[] data = line.split("\\s+"); if(data!=null && data.length > 2){ Property p = new Property(); p.setKey(data[0]); p.setValue(data[1]); List<String> value = Lists.newArrayList(line.replaceAll(data[0], "").replaceAll(data[1], "").split("\\s+")); value.remove(""); synonymMap.put(p, value); propertySynonymMap.put(data[0]+":"+data[1], value); } } for (Property key : synonymMap.keySet()) { List<String> synonyms = synonymMap.get(key); for (String synonym : synonyms) { List<String> checkProperty = synnonymPropertyMap.get(synonym); if (checkProperty == null) { checkProperty = Lists.newArrayList(); } checkProperty.add(key.getKey()+":"+key.getValue()); synnonymPropertyMap.put(synonym, checkProperty); } } for (Property key : synonymMap.keySet()) { boolean exception = false; List<String> synonyms = synonymMap.get(key); // System.out.println(key.getKey()); // System.out.println(key.getValue()); for (String synonym : synonyms) { Synonym syn = new Synonym(); syn.setName(synonym); Synonym checkSyn = duplicateSynonymMap.get(synonym); if (checkSyn != null && StringUtils.isNotEmpty(checkSyn.getName()) && checkSyn.getName().equals(synonym)) { List<Property> changeProperty = checkSyn.getProperty(); changeProperty.add(key); syn.setProperty(changeProperty); syn.setNum(changeProperty.size()); } else if(checkSyn != null && StringUtils.isNotEmpty(checkSyn.getName()) && !checkSyn.getName().equals(synonym)) { logger.info("出现错误bug~~~~~~~~~~,两同义词:{},{}",checkSyn.getName(),synonym); exception = true; break; } else { syn.setNum(1); List<Property> newProperty = Lists.newArrayList(); newProperty.add(key); syn.setProperty(newProperty); } duplicateSynonymMap.put(synonym, syn); } if (exception) { logger.info("Warning~~~~~~~~~~~~"); break; } } // System.out.println(duplicateSynonymMap); logger.info("同义词总数:{}",duplicateSynonymMap.size()); List<String> outingSyn = Lists.newArrayList(); for (String syn : duplicateSynonymMap.keySet()) { Synonym message = duplicateSynonymMap.get(syn); if (message.getNum() > 1) { duplicateSyn.put(syn, message.getNum()); } else { outingSyn.add(syn); } } for (String syn : outingSyn) { unDuplicateSynonymMap.put(syn, duplicateSynonymMap.get(syn)); duplicateSynonymMap.remove(syn); } } catch (FileNotFoundException e) { e.printStackTrace(); } catch (IOException e) { e.printStackTrace(); } logger.info("Synonym map obtained.size is {}",synonymMap.size()); } /** * 获取同义词 * @param word * @return */ public static List<String> getSynonym(Property p){ if(p == null){ return Collections.emptyList(); } return synonymMap.get(p); } }

 

转载于:https://www.cnblogs.com/yzf666/p/7345053.html

  • 0
    点赞
  • 0
    收藏
    觉得还不错? 一键收藏
  • 0
    评论

“相关推荐”对你有帮助么?

  • 非常没帮助
  • 没帮助
  • 一般
  • 有帮助
  • 非常有帮助
提交
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值