将查询sql中的中文字段和中文表名转成拼音

背景:数据装载时,有时候需要别人的数据表中读取数据,插入到自己的表中。如果别人的数据表是中文的,需要将表名称和表字段转成拼音首字母,此时可以直接用PinyinHelper.getShortPinyin()方法直接转换。但如果语句中有case when、where表达式时,是不能直接转出拼音首字母的。如:

case 学生表.学校 when 1 then '第一中学' when 1 then '第二中学'  end as school

where 学生表.姓名 not like '%测试%'

类似这些,需要特殊处理的。

依赖

<dependency>
    <groupId>com.github.stuxuhai</groupId>
    <artifactId>jpinyin</artifactId>
    <version>1.1.8</version>
</dependency>
<dependency>
    <artifactId>jsqlparser</artifactId>
    <groupId>com.github.jsqlparser</groupId>
    <version>4.4</version>
</dependency>

代码


import com.alibaba.druid.sql.SQLUtils;
import com.github.stuxuhai.jpinyin.PinyinException;
import com.github.stuxuhai.jpinyin.PinyinHelper;
import net.sf.jsqlparser.JSQLParserException;
import net.sf.jsqlparser.expression.*;
import net.sf.jsqlparser.expression.operators.conditional.AndExpression;
import net.sf.jsqlparser.expression.operators.relational.*;
import net.sf.jsqlparser.parser.CCJSqlParserUtil;
import net.sf.jsqlparser.schema.Column;
import net.sf.jsqlparser.schema.Table;
import net.sf.jsqlparser.statement.select.*;
import org.apache.commons.collections.CollectionUtils;
import java.util.*;

/**
 * Description:将中文表名和列名转成拼音
 *
 * @Date: 2024/05/07
 */
public class Test {
    public static void main(String[] args) {

        String sql = "SELECT 字段1, 字段2 FROM 表1 WHERE 字段3 IN (SELECT 字段4 FROM 表2 WHERE 条件 = '1') "
                + "UNION ALL "
                + "SELECT 字段5, 字段6 FROM 表3 WHERE 字段7 = '特定值'";
        String transformedSql = analysisSql(sql);
        String formattedSql = SQLUtils.formatMySql(transformedSql);
        System.out.println(formattedSql);
    }

    /**
     * 解析sql
     *
     * @param sql 输入的sql语句
     * @return
     * @throws JSQLParserException
     */
    private static String analysisSql(String sql) {
        Select select = null;
        try {
            select = (Select) CCJSqlParserUtil.parse(sql);
        } catch (JSQLParserException e) {
            throw new RuntimeException(e);
        }
        SelectBody selectBody = select.getSelectBody();
        if (selectBody instanceof SetOperationList) {
            SetOperationList operationList = (SetOperationList) selectBody;
            List<SelectBody> modifiedSelectBodies = new ArrayList<>();
            for (SelectBody plainSelect : operationList.getSelects()) {
                // 递归分析并修改,同时收集修改后的SelectBody
                String modifiedSql = analysisSql(plainSelect.toString());
                try {
                    modifiedSelectBodies.add(((Select)CCJSqlParserUtil.parse(modifiedSql)).getSelectBody());
                } catch (JSQLParserException e) {
                    throw new RuntimeException(e);
                }
            }
            // 替换原始的SelectBody列表为修改后的
            operationList.setSelects(modifiedSelectBodies);
        } else if (selectBody instanceof PlainSelect) {
            analysisSelectBody((PlainSelect) selectBody);
        }
        // 将最终修改后的Select对象转换为SQL字符串
        return select.toString();
    }

    /**
     * 解析查询语句
     *
     * @param plainSelect
     * @throws JSQLParserException
     */
    private static void analysisSelectBody(PlainSelect plainSelect) {
        // 转换select里的字段
        transformSelectItems(plainSelect);
        // 转换from的中文表名(可能含有子查询)
        transformFromItem(plainSelect.getFromItem());
        // 转换join里的中文表名和on表达式里的中文字段
        transformJoinItem(plainSelect.getJoins());
        // 转换where表达式里的中文字段字段
        transformWhereField(plainSelect.getWhere());
        // 转换group by里的中文字段
        transformGroupByItem(plainSelect.getGroupBy());
        // 转换having里的中文字段
        transformHavingField(plainSelect.getHaving());
    }

    private static void transformGroupByItem(GroupByElement groupByElement) {
        if (groupByElement == null) {
            return;
        }
        ExpressionList groupByExpressionList = groupByElement.getGroupByExpressionList();
        for (Expression expression : groupByExpressionList.getExpressions()) {
            if (expression instanceof Column) {
                Column column = (Column) expression;
                String pinyinColumnName = null;
                try {
                    pinyinColumnName = PinyinHelper.getShortPinyin(column.getColumnName());
                } catch (PinyinException e) {
                    throw new RuntimeException(e);
                }
                column.setColumnName(pinyinColumnName);
            } else {
                throw new RuntimeException("不支持的表达式类型:" + expression.toString());
            }
        }
    }

    private static void transformHavingField(Expression havingExpression) {
        if (havingExpression == null) {
            return;
        }
        if (havingExpression instanceof BinaryExpression) {
            BinaryExpression andExpression = (BinaryExpression) havingExpression;
            Expression leftExpression = andExpression.getLeftExpression();
            if (leftExpression instanceof Column) {
                Column column = (Column) leftExpression;
                String pinyinColumnName = null;
                try {
                    pinyinColumnName = PinyinHelper.getShortPinyin(column.getColumnName());
                } catch (PinyinException e) {
                    throw new RuntimeException(e);
                }
                column.setColumnName(pinyinColumnName);
                andExpression.setLeftExpression(column);
            } else if (leftExpression instanceof Function) {
                Function function = (Function) leftExpression;
                function.getParameters().getExpressions().forEach(expression -> {
                    if (expression instanceof Column) {
                        Column column = (Column) expression;
                        String pinyinColumnName = null;
                        try {
                            pinyinColumnName = PinyinHelper.getShortPinyin(column.getColumnName());
                        } catch (PinyinException e) {
                            throw new RuntimeException(e);
                        }
                        column.setColumnName(pinyinColumnName);
                        function.getParameters().getExpressions().set(function.getParameters().getExpressions().indexOf(expression), column);
                    } else {
                        throw new RuntimeException("不支持的表达式类型:" + expression.toString());
                    }
                });
            } else {
                throw new RuntimeException("不支持的表达式类型:" + leftExpression.toString());
            }
        }
    }

    /**
     * 将where语句中的中文列转成拼音
     *
     * @param whereExpression where表达式
     */
    public static void transformWhereField(Expression whereExpression) {
        if (whereExpression == null) {
            return;
        }
        if (whereExpression instanceof BinaryExpression) {
            //转成二进制基本表达式,遍历左、右表达式
            BinaryExpression andExpression = (BinaryExpression) whereExpression;
            if (andExpression.getLeftExpression() instanceof Column) {
                //说明已经是最终的表达式了,例如:学校 = '中学',只需将字段名转成拼音即可
                Column column = (Column) andExpression.getLeftExpression();
                try {
                    String pinyinColumnName = PinyinHelper.getShortPinyin(column.getColumnName());
                    column.setColumnName(pinyinColumnName);
                } catch (PinyinException e) {
                    throw new RuntimeException(e);
                }
            } else if (andExpression.getLeftExpression() instanceof BinaryExpression) {
                //还不是最小的表达式,继续递归
                transformWhereField(andExpression.getLeftExpression());
            } else {
                throw new RuntimeException("暂不支持该表达式类型: " + whereExpression);
            }
            //处理右表达式
            if (andExpression.getRightExpression() instanceof Column) {
                Column column = (Column) andExpression.getLeftExpression();
                try {
                    String pinyinColumnName = PinyinHelper.getShortPinyin(column.getColumnName());
                    column.setColumnName(pinyinColumnName);
                } catch (PinyinException e) {
                    throw new RuntimeException(e);
                }
            } else if (andExpression.getRightExpression() instanceof BinaryExpression) {
                transformWhereField(andExpression.getRightExpression());
            } else if (andExpression.getRightExpression() instanceof StringValue
                    || andExpression.getRightExpression() instanceof LongValue
                    || andExpression.getRightExpression() instanceof DateValue
                    || andExpression.getRightExpression() instanceof DoubleValue) {
                //如果是字符串,如 学校 = ‘中学’ 中的右表达式,不需要处理
            } else if (andExpression.getRightExpression() instanceof Parenthesis) {
                Parenthesis parenthesis = (Parenthesis) andExpression.getRightExpression();
                transformWhereField(parenthesis.getExpression());
            } else {
                throw new RuntimeException("暂不支持该表达式类型: " + whereExpression);
            }
        } else if (whereExpression instanceof InExpression) {
            InExpression inExpression = (InExpression) whereExpression;
            if (inExpression.getLeftExpression() instanceof Column) {
                Column column = (Column) inExpression.getLeftExpression();
                String pinyinColumnName = null;
                try {
                    pinyinColumnName = PinyinHelper.getShortPinyin(column.getColumnName());
                } catch (PinyinException e) {
                    throw new RuntimeException(e);
                }
                column.setColumnName(pinyinColumnName);
                inExpression.setLeftExpression(column);
            } else {
                throw new RuntimeException("暂不支持该表达式类型: " + inExpression);
            }
            if (inExpression.getRightExpression() instanceof SubSelect) {
                SubSelect subSelect = (SubSelect) inExpression.getRightExpression();
                analysisSelectBody((PlainSelect) subSelect.getSelectBody());
            } else {
                throw new RuntimeException("暂不支持该表达式类型: " + inExpression);
            }

        } else if (whereExpression instanceof Between) {
            Between between = (Between) whereExpression;
            if (between.getLeftExpression() instanceof Column) {
                Column column = (Column) between.getLeftExpression();
                String pinyinColumnName = null;
                try {
                    pinyinColumnName = PinyinHelper.getShortPinyin(column.getColumnName());
                } catch (PinyinException e) {
                    throw new RuntimeException(e);
                }
                column.setColumnName(pinyinColumnName);
                between.setLeftExpression(column);
            }
        } else {
            throw new RuntimeException("暂不支持该where表达式类型: " + whereExpression);
        }
    }

    /**
     * 将from中join的的中文表名和on表达式的中文列表段转成拼音
     *
     * @param joinList
     * @return
     */
    private static void transformJoinItem(List<Join> joinList) {
        if (joinList != null) {
            for (int i = 0; i < joinList.size(); i++) {
                Join join = joinList.get(i);
                FromItem rightItem = join.getRightItem();
                //处理join的中文表名
                if (rightItem instanceof Table) {
                    Table table = (Table) rightItem;
                    String pinyinTableName = null;
                    try {
                        pinyinTableName = PinyinHelper.getShortPinyin(table.getName());
                    } catch (PinyinException e) {
                        throw new RuntimeException(e);
                    }
                    table.setName(pinyinTableName);
                    join.setRightItem(table);
                } else {
                    throw new RuntimeException("暂不支持该join表达式类型: " + rightItem);
                }
                //遍历on表达式,处理中文列名
                join.getOnExpressions().forEach(expression -> {
                    transformLeftExpression(expression);
                });
            }
        }
    }

    /**
     * 将from中on表达式里的中文列名转成拼音
     *
     * @param expression
     */
    private static void transformLeftExpression(Expression expression) {
        //如果等于表达式,说明是最细的了,直接转成拼音即可
        if (expression instanceof EqualsTo) {
            EqualsTo equalsTo = (EqualsTo) expression;
            //将左右列表转成拼音
            Expression leftExpression = equalsTo.getLeftExpression();
            if (leftExpression instanceof  Column) {
                Column column = (Column) leftExpression;
                String columnName = column.getColumnName();
                String pinyinColumnName = null;
                try {
                    pinyinColumnName = PinyinHelper.getShortPinyin(columnName);
                } catch (PinyinException e) {
                    throw new RuntimeException(e);
                }
                column.setColumnName(pinyinColumnName);
            }
            Expression rigthExpression = equalsTo.getRightExpression();
            if (rigthExpression instanceof  Column) {
                Column column = (Column) rigthExpression;
                String columnName = column.getColumnName();
                String pinyinColumnName = null;
                try {
                    pinyinColumnName = PinyinHelper.getShortPinyin(columnName);
                } catch (PinyinException e) {
                    throw new RuntimeException(e);
                }
                column.setColumnName(pinyinColumnName);
            }
        } else if (expression instanceof AndExpression) {
            //如果是and表达式,继续递归
            AndExpression andExpression = (AndExpression) expression;
            transformLeftExpression(andExpression.getLeftExpression());
            transformLeftExpression(andExpression.getRightExpression());
        } else if (expression instanceof IsNullExpression) {
            //如果是is null表达式,只需处理左表达式即可
            IsNullExpression isNullExpression = (IsNullExpression) expression;
            Expression leftExpression = isNullExpression.getLeftExpression();
            if (leftExpression instanceof Column) {
                Column column = (Column) leftExpression;
                String pinyinColumnName = null;
                try {
                    pinyinColumnName = PinyinHelper.getShortPinyin(column.getColumnName());
                } catch (PinyinException e) {
                    throw new RuntimeException(e);
                }
                column.setColumnName(pinyinColumnName);
            }
        }
    }

    /**
     * 将from里的中文字段转成拼音
     *
     * @param fromItem
     * @return
     * @throws JSQLParserException 解析异常
     */
    private static void transformFromItem(FromItem fromItem) {
        // 判断fromItem属于哪种类型,如果是subSelect类型就是子查询
        if (fromItem instanceof SubSelect) {
            SelectBody selectBody = ((SubSelect) fromItem).getSelectBody();
            analysisSql(selectBody.toString());
        }
        try {
            Table table = (Table) fromItem;
            String tableName = PinyinHelper.getShortPinyin(table.getName());
            table.setName(tableName);
        } catch (Exception e) {
            throw new RuntimeException(e);
        }
    }

    /**
     * 将select中的列名转成拼音
     *
     * @param plainSelect
     */
    private static void transformSelectItems(PlainSelect plainSelect) {
        List<SelectItem> selectItems = plainSelect.getSelectItems();
        if (!CollectionUtils.isEmpty(selectItems)) {
            for (SelectItem selectItem : selectItems) {
                try {
                    if (selectItem instanceof SelectExpressionItem) {
                        SelectExpressionItem selectExpressionItem = (SelectExpressionItem) selectItem;
                        Expression expression = selectExpressionItem.getExpression();
                        if (expression instanceof Column) {
                            //表达式是列名,直接转
                            Column column = ((Column) expression);
                            String pinyinColumnName = PinyinHelper.getShortPinyin(column.getColumnName());
                            column.setColumnName(pinyinColumnName);
                        } else if (expression instanceof CaseExpression) {
                            //case表达式,只处理列名
                            CaseExpression caseExpression = (CaseExpression) expression;
                            Expression switchExpression = caseExpression.getSwitchExpression();
                            if (switchExpression instanceof Column) {
                                Column column = (Column) switchExpression;
                                String pinyinColumnName = PinyinHelper.getShortPinyin(column.getColumnName());
                                column.setColumnName(pinyinColumnName);
                            }
                        } else if (expression instanceof LongValue || expression instanceof StringValue || expression instanceof DateValue || expression instanceof DoubleValue) {
                            //如果是常量,忽略
                        } else if (expression instanceof TimeKeyExpression) {
                            throw new RuntimeException("暂不支持此类型的表达式:" + expression.toString());
                        } else if (expression instanceof NullValue) {
                            //如果是null,如null as updateTime,忽略
                        } else if (expression instanceof AnalyticExpression) {
                            AnalyticExpression analyticExpression = (AnalyticExpression) expression;
                            //处理avg里面的列名
                            Expression avgExpression = analyticExpression.getExpression();
                            if (avgExpression instanceof Column) {
                                //表达式是列名,直接转
                                Column column = ((Column) avgExpression);
                                String pinyinColumnName = PinyinHelper.getShortPinyin(column.getColumnName());
                                column.setColumnName(pinyinColumnName);
                            } else {
                                throw new RuntimeException("未知类型的表达式:" + avgExpression.toString());
                            }
                            //处理over里面的列名
                            ExpressionList partitionExpressionList = analyticExpression.getPartitionExpressionList();
                            if (partitionExpressionList != null) {
                                List<Expression> expressions = partitionExpressionList.getExpressions();
                                for (Expression partitionExpression : expressions) {
                                    if (partitionExpression instanceof Column) {
                                        //表达式是列名,直接转
                                        Column column = ((Column) partitionExpression);
                                        String pinyinColumnName = PinyinHelper.getShortPinyin(column.getColumnName());
                                        column.setColumnName(pinyinColumnName);
                                    }else {
                                        throw new RuntimeException("未知类型的表达式:" + selectItem.toString());
                                    }
                                }
                            }
                        } else {
                            throw new RuntimeException("未知类型的表达式:" + expression.toString());
                        }
                    } else if (selectItem instanceof AllTableColumns) {
                        //table.*类型的表达式,不处理
                    } else if (selectItem.toString().equals("*")) {
                        //*类型的表达式,不处理
                    } else if (selectItem instanceof NullValue) {
                        //如果是null,如null as updateTime,忽略
                    } else {
                        throw new RuntimeException("未知类型的表达式:" + selectItem.toString());
                    }
                } catch (Exception e) {
                    throw new RuntimeException(e);
                }
            }
        }
    }
}

 测试用例:

String sql = "SELECT 字段1, 字段2 FROM 表1 WHERE 字段3 IN (SELECT 字段4 FROM 表2 WHERE 条件 = '1') "
        + "UNION ALL "
        + "SELECT 字段5, 字段6 FROM 表3 WHERE 字段7 = '特定值'";

String sql1 = "SELECT * \n" +
        "FROM 商品表 \n" +
        "WHERE 类别 = '电子产品' \n" +
        "AND 价格 > 2000 \n" +
        "AND (品牌 = '华为' OR 品牌 = '小米') \n" +
        "AND (上市日期 BETWEEN '2020-01-01' AND '2022-12-31')";

String sql2 = "SELECT 中文列1, 中文列2 FROM 中文表1 LEFT JOIN 中文表2 ON 中文列1 = 中文列2";

String sql3 ="SELECT 列1, 列2 FROM 表3 GROUP BY 列1 HAVING sum(列3) > 100";

String sql4 ="SELECT 中文列 FROM 中文表1 INTERSECT SELECT 中文列 FROM 中文表2";

String sql5 ="SELECT 中文列, AVG(中文列2) OVER (PARTITION BY 中文列1) FROM 中文表";

对应的结果:

SELECT zd1, zd2
FROM b1
WHERE zd3 IN (
    SELECT zd4
    FROM b2
    WHERE tj = '1'
)
UNION ALL
SELECT zd5, zd6
FROM b3
WHERE zd7 = '特定值';


SELECT *
FROM spb
WHERE lb = '电子产品'
    AND jg > 2000
    AND (pp = '华为'
        OR pp = '小米')
    AND ssrq BETWEEN '2020-01-01' AND '2022-12-31';


SELECT zwl1, zwl2
FROM zwb1
    LEFT JOIN zwb2 ON zwl1 = zwl2;


SELECT l1, l2
FROM b3
GROUP BY l1
HAVING sum(l3) > 100;


SELECT zwl
FROM zwb1
INTERSECT
SELECT zwl
FROM zwb2;


SELECT zwl, AVG(zwl2) OVER (PARTITION BY zwl1 )
FROM zwb;

 可以处理case when、like、left join on、union all、intersect、avg、group by、having等情况。

对于不能处理的情况,会抛运行时异常。

不过有的测试例子无法覆盖复杂的情况,如需使用还需要继续完善。

  • 5
    点赞
  • 4
    收藏
    觉得还不错? 一键收藏
  • 0
    评论

“相关推荐”对你有帮助么?

  • 非常没帮助
  • 没帮助
  • 一般
  • 有帮助
  • 非常有帮助
提交
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值