Datax oracle 支持增量并且支持全量更新

支持增量 ORACLE UPDATE

们使用datax 希望支持oracle 增量导入数据,同时保留原先的全量更新

修改 OracleWriter.java

删除限制

修改WriterUtil.java

添加oracle 数据增量模式插入类型转换

    // 替换原先的代码块
    public static String getWriteTemplate(List<String> columnHolders, List<String> valueHolders, String writeMode, DataBaseType dataBaseType, boolean forceUseUpdate) {
        boolean update = writeMode.trim().toLowerCase().startsWith("update");
        boolean isWriteModeLegal = writeMode.trim().toLowerCase().startsWith("insert") || writeMode.trim().toLowerCase().startsWith("replace") || update;

        if (!isWriteModeLegal) {
            throw DataXException.asDataXException(DBUtilErrorCode.ILLEGAL_VALUE,
                    String.format("您所配置的 writeMode:%s 错误. 因为DataX 目前仅支持replace,update 或 insert 方式. 请检查您的配置并作出修改.", writeMode));
        }

        // && writeMode.trim().toLowerCase().startsWith("replace")
        String writeDataSqlTemplate;
        if (forceUseUpdate || ((dataBaseType == DataBaseType.MySql || dataBaseType == DataBaseType.Tddl) && update)) {
            //update只在mysql下使用
            writeDataSqlTemplate = "INSERT INTO %s (" + StringUtils.join(columnHolders, ",") + ") VALUES(" + StringUtils.join(valueHolders, ",") + ")" + onDuplicateKeyUpdateString(columnHolders);
        } else {
            if (dataBaseType == DataBaseType.Oracle && update) {
                writeDataSqlTemplate = onMergeIntoDoString(writeMode, columnHolders, valueHolders) + "INSERT (" +
                        StringUtils.join(columnHolders, ",") +
                        ") VALUES(" + StringUtils.join(valueHolders, ",") +
                        ")";
            } else {
                //这里是保护,如果其他错误的使用了update,需要更换为replace
                if (update) {
                    writeMode = "replace";
                }
                writeDataSqlTemplate = writeMode +
                        " INTO %s (" + StringUtils.join(columnHolders, ",") +
                        ") VALUES(" + StringUtils.join(valueHolders, ",") +
                        ")";
            }
        }
        return writeDataSqlTemplate;
    }
   /**
     * 新增更新插入sql语句
     * @return String
     */
    public static String onMergeIntoDoString(String merge, List<String> columnHolders, List<String> valueHolders) {
        String[] sArray = getStrings(merge);
        StringBuilder sb = new StringBuilder();
        sb.append("MERGE INTO %s A USING ( SELECT ");

        boolean first = true;
        boolean first1 = true;
        StringBuilder str = new StringBuilder();
        StringBuilder update = new StringBuilder();
        for (String columnHolder : columnHolders) {
            if (Arrays.asList(sArray).contains(columnHolder)) {
                if (!first) {
                    sb.append(",");
                    str.append(" AND ");
                } else {
                    first = false;
                }
                str.append("TMP.").append(columnHolder);
                sb.append("?");
                str.append(" = ");
                sb.append(" AS ");
                str.append("A.").append(columnHolder);
                sb.append(columnHolder);
            }
        }

        for (String columnHolder : columnHolders) {
            if (!Arrays.asList(sArray).contains(columnHolder)) {
                if (!first1) {
                    update.append(",");
                } else {
                    first1 = false;
                }
                update.append(columnHolder);
                update.append(" = ");
                update.append("?");
            }
        }

        sb.append(" FROM DUAL ) TMP ON (");
        sb.append(str);
        sb.append(" ) WHEN MATCHED THEN UPDATE SET ");
        sb.append(update);
        sb.append(" WHEN NOT MATCHED THEN ");
        return sb.toString();
    }
    /**
     * 新增获取复合主键集合
     * @return String[]
     */
    public static String[] getStrings(String merge) {
        merge = merge.replace("update", "");
        merge = merge.replace("(", "");
        merge = merge.replace(")", "");
        merge = merge.replace(" ", "");
        return merge.split(",");
    }

修改CommonRdbmsWriter.java

        // 替换原先的代码块
        public void startWriteWithConnection(RecordReceiver recordReceiver, TaskPluginCollector taskPluginCollector, Connection connection) {
            this.taskPluginCollector = taskPluginCollector;
            List<String> columns = new LinkedList<>();
            if (this.dataBaseType == DataBaseType.Oracle && writeMode.trim().toLowerCase().startsWith("update") ) {
                String merge = this.writeMode;
                String[] sArray = WriterUtil.getStrings(merge);
                this.columns.forEach(column->{
                    if (Arrays.asList(sArray).contains(column)) {
                        columns.add(column);
                    }
                });
                this.columns.forEach(column->{
                    if (!Arrays.asList(sArray).contains(column)) {
                        columns.add(column);
                    }
                });
            }
            columns.addAll(this.columns);
            // 用于写入数据的时候的类型根据目的表字段类型转换
            this.resultSetMetaData = DBUtil.getColumnMetaData(connection, this.table, StringUtils.join(columns, ","));
            // 写数据库的SQL语句
            calcWriteRecordSql();

            List<Record> writeBuffer = new ArrayList<Record>(this.batchSize);
            int bufferBytes = 0;
            try {
                Record record;
                while ((record = recordReceiver.getFromReader()) != null) {
                    if (record.getColumnNumber() != this.columnNumber) {
                        // 源头读取字段列数与目的表字段写入列数不相等,直接报错
                        throw DataXException
                                .asDataXException(
                                        DBUtilErrorCode.CONF_ERROR,
                                        String.format(
                                                "列配置信息有错误. 因为您配置的任务中,源头读取字段数:%s 与 目的表要写入的字段数:%s 不相等. 请检查您的配置并作出修改.",
                                                record.getColumnNumber(),
                                                this.columnNumber));
                    }

                    writeBuffer.add(record);
                    bufferBytes += record.getMemorySize();

                    if (writeBuffer.size() >= batchSize || bufferBytes >= batchByteSize) {
                        doBatchInsert(connection, writeBuffer);
                        writeBuffer.clear();
                        bufferBytes = 0;
                    }
                }
                if (!writeBuffer.isEmpty()) {
                    doBatchInsert(connection, writeBuffer);
                    writeBuffer.clear();
                    bufferBytes = 0;
                }
            } catch (Exception e) {
                throw DataXException.asDataXException(
                        DBUtilErrorCode.WRITE_DATA_ERROR, e);
            } finally {
                writeBuffer.clear();
                bufferBytes = 0;
                DBUtil.closeDBResources(null, null, connection);
            }
        }
        // 替换原先代码块
        protected PreparedStatement fillPreparedStatement(PreparedStatement preparedStatement, Record record)
                throws SQLException {
            for (int i = 0; i < this.resultSetMetaData.getLeft().size(); i++) {
                int columnSqlType = this.resultSetMetaData.getMiddle().get(i);
                String typeName = this.resultSetMetaData.getRight().get(i);
                String column = this.resultSetMetaData.getLeft().get(i);
                Column columnValue = record.getColumn(this.columns.indexOf(column));
                preparedStatement = fillPreparedStatementColumnType(preparedStatement, i, columnSqlType, typeName,columnValue);
            }
            return preparedStatement;
        }

示例

{
  "job": {
    "setting": {
      "speed": {
        "channel": 5
      }
    },
    "content": [
      {
        "reader": {
          "name": "ftpreader",
          "parameter": {
            "username": "ftp",
            "password": "ftp",
            "column": [
              "*"
            ],
            "protocol": "ftp",
            "host": "*****",
            "encoding": "UTF-8",
            "fieldDelimiter": ",",
            "port": "21",
            "path": [
              "/csvTem/blade_log_api"
            ]
          }
        },
        "writer": {
          "name": "oraclewriter",
          "parameter": {
            "username": "****",
            "password": "****",
            "column": [
              "IS_SUCCESS",
              "RE_APP",
              "TENANT_ID",
              "SERVICE_ID",
              "SERVER_HOST",
              "SERVER_IP",
              "ENV",
              "TYPE",
              "TITLE",
              "METHOD",
              "ID"
            ],
            "writeMode": "update(ID)",
            "connection": [
              {
                "table": [
                  "BLADE_LOG_API"
                ],
                "jdbcUrl": "jdbc:oracle:thin:@localhost:1521/XE"
              }
            ]
          }
        }
      }
    ]
  }
}

改完后的jar包

https://www.aliyundrive.com/s/51SNJkfSLaj

  • 1
    点赞
  • 5
    收藏
    觉得还不错? 一键收藏
  • 4
    评论
DataX 中,实现 Oracle 增量替换的方式通常有两种: 1. 使用 `writer.oracle` 的 `replace` 参数 可以在 Oracle Writer 的配置文件中设置 `replace` 参数为 `true`,这样 DataX 就会使用 replace 方式进行增量替换。具体配置如下: ```json { "job": { "content": [ { "reader": { "name": "mysqlreader", "parameter": { "username": "root", "password": "123456", "column": [ "id", "name", "age", "sex" ], "splitPk": "id", "connection": [ { "jdbcUrl": "jdbc:mysql://localhost:3306/test?useSSL=false", "table": [ "user" ] } ] } }, "writer": { "name": "oraclewriter", "parameter": { "username": "test", "password": "test", "column": [ "id", "name", "age", "sex" ], "preSql": "truncate table user", "replace": true, "connection": [ { "jdbcUrl": "jdbc:oracle:thin:@localhost:1521:orcl", "table": [ "user" ] } ] } } } ], "setting": { "speed": { "channel": 3 } } } } ``` 通过设置 `replace` 参数为 `true`,Oracle Writer 将使用 `replace` 方式进行增量替换。 2. 在 SQL 语句中使用 `merge` 语句 另一种方式是在 SQL 语句中使用 `merge` 语句实现增量替换。具体实现方法如下: ```json { "job": { "content": [ { "reader": { "name": "mysqlreader", "parameter": { "username": "root", "password": "123456", "column": [ "id", "name", "age", "sex" ], "splitPk": "id", "connection": [ { "jdbcUrl": "jdbc:mysql://localhost:3306/test?useSSL=false", "table": [ "user" ] } ] } }, "writer": { "name": "oraclewriter", "parameter": { "username": "test", "password": "test", "column": [ "id", "name", "age", "sex" ], "preSql": "truncate table user", "connection": [ { "jdbcUrl": "jdbc:oracle:thin:@localhost:1521:orcl", "table": [ "user" ] } ], "writeMode": "batch", "postSql": [ "merge into user t1 using (select ? as id, ? as name, ? as age, ? as sex from dual) t2 on (t1.id = t2.id) when matched then update set t1.name = t2.name, t1.age = t2.age, t1.sex = t2.sex when not matched then insert (t1.id, t1.name, t1.age, t1.sex) values (t2.id, t2.name, t2.age, t2.sex)" ] } } } ], "setting": { "speed": { "channel": 3 } } } } ``` 在 Oracle Writer 的配置文件中设置 `writeMode` 参数为 `batch`,并在 `postSql` 中使用 `merge` 语句实现增量替换。在 `merge` 语句中,使用 `when matched then update` 来更新已有记录,使用 `when not matched then insert` 来插入新记录。
评论 4
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值