匿名处理
今天对用户名称进行匿名处理,但是用户名称中可能包含emoji表情符号,先附上匿名处理的方法
//1、用户+id正常显示;2、大于2个字,前后保留一个字,例如 小***吐;3、小与等于2个字,保留第一个字,例如 小***;
public static String anonymity(String name) {
//用户名称为空,为用户+id,只有一个字不做处理直接返回
if (StringUtils.isBlank(name) || name.matches("^用户[0-9]+$") || name.length() == 1) {
return name;
} else {
//名称长度:将表情符号的长度视为1
int length = name.codePointCount(0, name.length());
if (length == 2) {
//两个字后一个字匿名
int start = name.offsetByCodePoints(0, 0);
int end = name.offsetByCodePoints(0, 1);
return name.substring(start, end) + "*";
} else {
//三个字或以上,匿名处理中间部分
int start1 = name.offsetByCodePoints(0, 0);
int end1 = name.offsetByCodePoints(0, 1);
int start2 = name.offsetByCodePoints(0, length-1);
int end2 = name.offsetByCodePoints(0, length);
return name.substring(start1, end1) + "***" + name.substring(start2, end2);
}
}
}
emoji表情符号过滤
//替换String中的表情符号为空
public String filterEmoji(String source) {
if (StringUtils.isNotBlank(source)) {
return source.replaceAll("[\\ud800\\udc00-\\udbff\\udfff\\ud800-\\udfff]", "");
} else {
return source;
}
}
将emoji表情长度视为1,获取文本的长度
//source为文本,名称长度:将表情符号的长度视为1
int length = source.codePointCount(0, source.length());
截取一个第一个位置的emoji表情符
//name为文本,将表情符号的长度视为1的文本长度
int length = name.codePointCount(0, name.length());
//两个字后一个匿名
int start = name.offsetByCodePoints(0, 0);
int end = name.offsetByCodePoints(0, 1);
return name.substring(start, end) + "*";
判断文本中是否有emoji表情符
/**
* 判断文本中是否有emoji表情符
*/
public static boolean containsEmoji(String source) {
int len = source.length();
boolean isEmoji = false;
for (int i = 0; i < len; i++) {
char hs = source.charAt(i);
if (0xd800 <= hs && hs <= 0xdbff) {
if (source.length() > 1) {
char ls = source.charAt(i + 1);
int uc = ((hs - 0xd800) * 0x400) + (ls - 0xdc00) + 0x10000;
if (0x1d000 <= uc && uc <= 0x1f77f) {
return true;
}
}
} else {
// non surrogate
if (0x2100 <= hs && hs <= 0x27ff && hs != 0x263b) {
return true;
} else if (0x2B05 <= hs && hs <= 0x2b07) {
return true;
} else if (0x2934 <= hs && hs <= 0x2935) {
return true;
} else if (0x3297 <= hs && hs <= 0x3299) {
return true;
} else if (hs == 0xa9 || hs == 0xae || hs == 0x303d
|| hs == 0x3030 || hs == 0x2b55 || hs == 0x2b1c
|| hs == 0x2b1b || hs == 0x2b50 || hs == 0x231a) {
return true;
}
if (!isEmoji && source.length() > 1 && i < source.length() - 1) {
char ls = source.charAt(i + 1);
if (ls == 0x20e3) {
return true;
}
}
}
}
return isEmoji;
}