背景
对于其它数据库而言，统计一张表的行数是最基本的操作；但是对于 HBase 这种列式存储的数据库而言，使用不同方式统计表的行数，效率差别巨大。本文将提供两种通过 Java 客户端代码统计 HBase 表行数的方法。
方案一:scan + filter
引入jar包
<dependency>
<groupId>com.aliyun.hbase</groupId>
<artifactId>alihbase-client</artifactId>
<version>2.0.3</version>
</dependency>
Java 代码实现
String tableNameStr = "${table_name}";
Configuration config = HBaseConfiguration.create();
config.set(HConstants.ZOOKEEPER_QUORUM, "${zk_addr}");
Connection connection = null;
try {
connection = ConnectionFactory.createConnection(config);
Table table = connection.getTable(TableName.valueOf(tableNameStr));
try {
long start = System.currentTimeMillis();
Scan scan = new Scan();
// 只获取每行数据的第一个kv,提高count速度
scan.setFilter(new FirstKeyOnlyFilter());
ResultScanner results = table.getScanner(scan);
long count = 0;
for (Result r : results) {
count += r.size();
}
System.out.println("count=="+count);
System.out.println("scan 总共耗时:" + (System.currentTimeMillis() - start) + "ms");
} finally {
if (table != null) tabl