SQLServerBulkCopy大容量插入、更新操作

说明

生产(pro)环境在程序启动时需要执行约50w条 update SQL,以下是在uat环境的测试结果:
1)每批1000条分批执行批量更新,耗时约120s;
2)采用类似下面第二个测试用例的方式(先把数据插入临时表、再用临时表更新主表、最后删除临时表),总共只花了约34s,其中插入临时表花了14s,临时表更新到主表花了18s多;
3)通过继承SQLServerBulkCSVFileRecord来进行大容量复制,比使用CachedRowSetImpl的方式更快。

代码

package com.ydfind.driver.ok;

import com.microsoft.sqlserver.jdbc.SQLServerBulkCSVFileRecord;
import com.microsoft.sqlserver.jdbc.SQLServerBulkCopy;
import com.microsoft.sqlserver.jdbc.SQLServerBulkCopyOptions;
import com.microsoft.sqlserver.jdbc.SQLServerException;
import org.junit.Test;

import java.io.ByteArrayInputStream;
import java.sql.*;
import java.util.ArrayList;
import java.util.List;

/**
 * Manual timing tests for bulk insert and bulk update against SQL Server using
 * {@link SQLServerBulkCopy}.
 *
 * <p>Both tests need a reachable SQL Server instance at {@link #CONNECTION_URL}.
 */
public class MyBulkCopyTest {

    // NOTE(review): credentials are embedded in the URL exactly as in the original test;
    // consider moving them to external configuration before sharing this code.
    private static final String CONNECTION_URL =
            "jdbc:sqlserver://localhost:1433;databaseName=dev-data;user=sa;password=465628578";

    /** Number of rows generated by each test. */
    private static final int ROW_COUNT = 10000;

    /**
     * Drops and recreates {@code bulkCopyTest}, then bulk-inserts {@link #ROW_COUNT} rows into it
     * and prints the elapsed time.
     *
     * <p>Author's measurement: 10,000 rows took 7332 ms.
     *
     * @throws SQLException if any database operation fails; the transaction is rolled back first
     */
    @Test
    public void testBulkInsert() throws SQLException {
        long startMillis = System.currentTimeMillis();

        String tableName = "bulkCopyTest";
        MySQLServerBulkRecord bulkRecord = newTwoColumnRecord(buildRows(ROW_COUNT, "name_"));

        try (Connection connection = DriverManager.getConnection(CONNECTION_URL);
             Statement statement = connection.createStatement()) {
            connection.setAutoCommit(false);
            try {
                // Drop the old table (if any) and create a fresh one.
                statement.execute(dropTableIfExistsSql(tableName));
                statement.execute(createTableSql(tableName));

                SQLServerBulkCopyOptions options = new SQLServerBulkCopyOptions();
                options.setTableLock(true);
                bulkLoad(connection, tableName, options, bulkRecord);

                connection.commit();
            } catch (SQLException e) {
                rollbackAfterFailure(connection, e);
                throw e;
            }
        }
        System.out.println("cost time " + (System.currentTimeMillis() - startMillis));
    }

    /**
     * Bulk record that serves rows from an in-memory list instead of a CSV file.
     *
     * <p>The parent class is constructed over an empty stream; only the column metadata handling
     * of the parent is used, while {@link #next()} and {@link #getRowData()} iterate the list.
     */
    public class MySQLServerBulkRecord extends SQLServerBulkCSVFileRecord {
        private final List<Object[]> dataList;
        // Index of the current row; -1 until next() has been called for the first time.
        private int cur;

        /**
         * @param dataList rows to send, one {@code Object[]} per row, in column order
         * @throws SQLServerException if the parent record cannot be initialised
         */
        public MySQLServerBulkRecord(List<Object[]> dataList) throws SQLServerException {
            super(new ByteArrayInputStream(new byte[]{}), "UTF-8", ",", false);
            this.dataList = dataList;
            cur = -1;
        }

        /**
         * Advances to the next row.
         *
         * @return {@code true} if a row is available at the new position
         */
        @Override
        public boolean next() throws SQLServerException {
            return ++cur < dataList.size();
        }

        /**
         * Returns the row at the current position.
         *
         * @return the current row, or {@code null} when positioned before the first row or past
         *     the last one
         */
        @Override
        public Object[] getRowData() throws SQLServerException {
            // The lower bound matters when getRowData() is called before the first next().
            if (cur < 0 || cur >= dataList.size()) {
                return null;
            }
            return dataList.get(cur);
        }

    }

    /**
     * Updates {@code bulkCopyTest} through a staging table: bulk-inserts the new values into
     * {@code bulkCopyTestTemp}, applies them to the target with a joined UPDATE, then drops the
     * staging table. Prints the elapsed time.
     *
     * <p>Author's measurement: 10,000 rows took 4362 ms.
     *
     * @throws SQLException if any database operation fails; the transaction is rolled back first
     */
    @Test
    public void testBulkUpdate() throws SQLException {
        long startMillis = System.currentTimeMillis();

        String tableName = "bulkCopyTestTemp";
        String tableNameTarget = "bulkCopyTest";
        String dropStagingSql = dropTableIfExistsSql(tableName);
        String updateSql = "update " + tableNameTarget + " with(TABLOCK)  set c2 = t2.c2 from " + tableName + " t2 with(nolock) where " + tableNameTarget + ".c1 = t2.c1";
        MySQLServerBulkRecord bulkRecord = newTwoColumnRecord(buildRows(ROW_COUNT, "name1_"));

        try (Connection connection = DriverManager.getConnection(CONNECTION_URL);
             Statement statement = connection.createStatement()) {
            connection.setAutoCommit(false);
            try {
                // Recreate the staging table.
                statement.execute(dropStagingSql);
                statement.execute(createTableSql(tableName));

                SQLServerBulkCopyOptions options = new SQLServerBulkCopyOptions();
                options.setTableLock(true);
                options.setBatchSize(100_000);
                bulkLoad(connection, tableName, options, bulkRecord);

                // Apply the staged values to the target table, then drop the staging table.
                statement.execute(updateSql);
                statement.execute(dropStagingSql);

                connection.commit();
            } catch (SQLException e) {
                rollbackAfterFailure(connection, e);
                throw e;
            }
        }
        System.out.println("cost time " + (System.currentTimeMillis() - startMillis));
    }

    /** Builds the "drop table if it exists" statement for a user table in the dbo schema. */
    private static String dropTableIfExistsSql(String tableName) {
        return "if exists (select * from dbo.sysobjects where id = object_id(N'[dbo].["
                + tableName + "]') and OBJECTPROPERTY(id, N'IsUserTable') = 1) DROP TABLE [" + tableName + "]";
    }

    /** Builds the DDL for the two-column (c1 bigint, c2 varchar(20)) test table. */
    private static String createTableSql(String tableName) {
        return "create table " + tableName + " (c1 bigint, c2 varchar(20))";
    }

    /** Generates {@code count} rows of the form {@code {i, namePrefix + i}} for i in [0, count). */
    private static List<Object[]> buildRows(int count, String namePrefix) {
        List<Object[]> rows = new ArrayList<>(count);
        for (int i = 0; i < count; i++) {
            rows.add(new Object[] {Long.valueOf(i), namePrefix + i});
        }
        return rows;
    }

    /** Wraps the rows in a bulk record and registers the c1/c2 column metadata. */
    private MySQLServerBulkRecord newTwoColumnRecord(List<Object[]> rows) throws SQLServerException {
        MySQLServerBulkRecord record = new MySQLServerBulkRecord(rows);
        record.addColumnMetadata(1, "c1", Types.BIGINT, 19, 0);
        record.addColumnMetadata(2, "c2", Types.VARCHAR, 20, 0);
        return record;
    }

    /** Streams the record into the table, closing the bulk copy even when the write fails. */
    private static void bulkLoad(Connection connection, String tableName,
                                 SQLServerBulkCopyOptions options, MySQLServerBulkRecord record)
            throws SQLException {
        try (SQLServerBulkCopy bulkCopy = new SQLServerBulkCopy(connection)) {
            bulkCopy.setBulkCopyOptions(options);
            bulkCopy.setDestinationTableName(tableName);
            bulkCopy.writeToServer(record);
        }
    }

    /** Rolls back the open transaction, attaching any rollback error to the original failure. */
    private static void rollbackAfterFailure(Connection connection, SQLException failure) {
        try {
            connection.rollback();
        } catch (SQLException rollbackFailure) {
            failure.addSuppressed(rollbackFailure);
        }
    }
}

分析

第一个测试用例后,结果:
在这里插入图片描述
第二个测试用例结果
在这里插入图片描述

50w数据插入示例-本地电脑

package com.ydfind.driver;

import com.microsoft.sqlserver.jdbc.SQLServerBulkCopy;
import com.microsoft.sqlserver.jdbc.SQLServerBulkCopyOptions;
import com.ydfind.driver.ok.MySQLServerBulkRecord;
import org.junit.Test;

import java.sql.*;
import java.util.ArrayList;
import java.util.List;

/**
 * Compares the time needed to insert 500,000 rows into {@code test_insert} with JDBC statement
 * batching versus {@link SQLServerBulkCopy}.
 *
 * <p>Both tests need a reachable SQL Server instance at {@link #CONNECTION_URL}.
 */
public class BulkCopyInsertTest {
    // NOTE(review): credentials are embedded in the URL exactly as in the original test;
    // consider moving them to external configuration before sharing this code.
    private static final String CONNECTION_URL =
            "jdbc:sqlserver://localhost:1433;databaseName=rec-manager;user=sa;password=465628578";

    /** Total number of rows inserted by each test. */
    private static final int TOTAL_ROWS = 500_000;
    /** Number of INSERT statements sent per {@code executeBatch()} call. */
    private static final int INSERT_BATCH_SIZE = 1000;

    private static final String TEST_TABLE_NAME = "test_insert";
    private static final String DROP_TABLE_SQL = "if exists (select * from dbo.sysobjects where id = object_id(N'[dbo].[" + TEST_TABLE_NAME + "]') and OBJECTPROPERTY(id, N'IsUserTable') = 1) DROP TABLE [" + TEST_TABLE_NAME + "]";
    private static final String CREATE_TABLE_SQL = "create table " + TEST_TABLE_NAME + "(c1 bigint, c2 varchar(20), c3 bigint)";

    /**
     * Recreates the test table, inserts {@link #TOTAL_ROWS} rows (ids 1..500000) with statement
     * batching, and prints the elapsed insert time.
     *
     * @throws SQLException if any database operation fails
     */
    @Test
    public void testInsert() throws SQLException {
        try (Connection conn = DriverManager.getConnection(CONNECTION_URL);
             Statement statement = conn.createStatement()) {
            statement.execute(DROP_TABLE_SQL);
            statement.execute(CREATE_TABLE_SQL);

            // Literal-SQL batching is kept on purpose: it is the baseline this test measures.
            // NOTE(review): autocommit is left at the connection default here — confirm that is
            // the intended baseline.
            long startMillis = System.currentTimeMillis();
            int pending = 0;
            for (int id = 1; id <= TOTAL_ROWS; id++) {
                // Plain concatenation keeps the digits locale-independent.
                statement.addBatch("insert into " + TEST_TABLE_NAME + "(c1, c2, c3) values("
                        + id + ",'name1_" + id + "'," + id + ")");
                if (++pending == INSERT_BATCH_SIZE) {
                    statement.executeBatch();
                    pending = 0;
                }
            }
            if (pending > 0) {
                // Flush a trailing partial batch (none with the current constants).
                statement.executeBatch();
            }
            System.out.println("batch insert cost time = " + (System.currentTimeMillis() - startMillis));
        }
    }

    /**
     * Recreates the test table, inserts {@link #TOTAL_ROWS} rows (ids 0..499999) with
     * {@link SQLServerBulkCopy}, and prints the elapsed time including row generation.
     *
     * @throws SQLException if any database operation fails
     */
    @Test
    public void testBulkCopyInsert() throws SQLException {
        try (Connection conn = DriverManager.getConnection(CONNECTION_URL);
             Statement statement = conn.createStatement()) {
            statement.execute(DROP_TABLE_SQL);
            statement.execute(CREATE_TABLE_SQL);

            long startMillis = System.currentTimeMillis();

            List<Object[]> rows = new ArrayList<>(TOTAL_ROWS);
            for (int i = 0; i < TOTAL_ROWS; i++) {
                rows.add(new Object[] {Long.valueOf(i), "name1_" + i, Long.valueOf(i)});
            }
            MySQLServerBulkRecord bulkRecord = new MySQLServerBulkRecord(rows);
            bulkRecord.addColumnMetadata(1, "c1", Types.BIGINT, 19, 0);
            bulkRecord.addColumnMetadata(2, "c2", Types.VARCHAR, 20, 0);
            bulkRecord.addColumnMetadata(3, "c3", Types.BIGINT, 19, 0);

            SQLServerBulkCopyOptions options = new SQLServerBulkCopyOptions();
            options.setTableLock(true);
            options.setBatchSize(10000);

            // try-with-resources closes the bulk copy even when writeToServer fails.
            try (SQLServerBulkCopy bulkCopy = new SQLServerBulkCopy(conn)) {
                bulkCopy.setBulkCopyOptions(options);
                bulkCopy.setDestinationTableName(TEST_TABLE_NAME);
                bulkCopy.writeToServer(bulkRecord);
            }
            System.out.println("bulkCopy insert cost time = " + (System.currentTimeMillis() - startMillis));
        }
    }
}

在这里插入图片描述

bulkCopy insert cost time = 25052
batch insert cost time = 222397

可见bulkCopy的方式耗时约为批量插入的1/9(222397ms 对 25052ms,快了接近9倍)。把executeBatch()每次的数量从1000提高到1w,执行时间也需要175495ms,接近3分钟。

评论 2
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值