代码参考网上其他博文,在其基础上作部分优化。以下代码在win7 + jdk1.7 + eclipse3.7 + centos 7 + hadoop2.6条件下运行通过。
java工程需添加hadoop根目录下/share/hadoop/下所有jar包到编译路径中。
工具类HdfsUtils.java,及测试用例代码如下:
HdfsUtils.java
package com.xy6.demo.utils;
import java.io.ByteArrayInputStream;
import java.io.IOException;
import java.io.InputStream;
import java.io.OutputStream;
import java.net.URI;
import java.util.ArrayList;
import java.util.List;
import org.apache.commons.lang.StringUtils;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.FSDataInputStream;
import org.apache.hadoop.fs.FSDataOutputStream;
import org.apache.hadoop.fs.FileStatus;
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.Path;
import org.apache.zookeeper.common.IOUtils;
/**
* operate hdfs file or directory util class
*
* @author zhang
* @since 2016-09-26
*
*/
public class HdfsUtils {
public static String uri = "hdfs://192.168.1.118:9000";
/**
* make a new dir in the hdfs
*
* @param dir the dir may like '/tmp/testdir'
* @return boolean true-success, false-failed
* @exception IOException something wrong happends when operating files
*/
public static boolean mkdir(String dir) throws IOException {
if (StringUtils.isBlank(dir)) {
return false;
}
dir = uri + dir;
Configuration conf = new Configuration();
FileSystem fs = FileSystem.get(URI.create(dir), conf);
if (!fs.exists(new Path(dir))) {
fs.mkdirs(new Path(dir));
}
fs.close();
return true;
}
/**
* delete a dir in the hdfs.
* if dir not exists, it will throw FileNotFoundException
*
* @param dir the dir may like '/tmp/testdir'
* @return boolean true-success, false-failed
* @exception IOException something wrong happends when operating files
*
*/
public static boolean deleteDir(String dir) throws IOException {
if (StringUtils.isBlank(dir)) {
return false;
}
dir = uri + dir;
Configuration conf = new Configuration();
FileSystem fs = FileSystem.get(URI.create(dir), conf);
fs.delete(new Path(dir), true);
fs.close();
return true;
}
/**
* list files/directories/links names under a directory, not include embed
* objects
*
* @param dir a folder path may like '/tmp/testdir'
* @return List<String> list of file names
* @throws IOException file io exception
*/
public static List<String> listAll(String dir) throws IOException {
if (StringUtils.isBlank(dir)) {
return new ArrayList<String>();
}
dir = uri + dir;
Configuration conf = new Configuration();
FileSystem fs = FileSystem.get(URI.create(dir), conf);
FileStatus[] stats = fs.listStatus(new Path(dir));
List<String> names = new ArrayList<String>();
for (int i = 0; i < stats.length; ++i) {
if (stats[i].isFile()) {
// regular file
names.add(stats[i].getPath().toString());
} else if (stats[i].isDirectory()) {
// dir
names.add(stats[i].getPath().toString());
} else if (stats[i].isSymlink()) {
// is s symlink in linux
names.add(stats[i].getPath().toString());
}
}
fs.close();
return names;
}
/*
* upload the local file to the hds,
* notice that the path is full like /tmp/test.txt
* if local file not exists, it will throw a FileNotFoundException
*
* @param localFile local file path, may like F:/test.txt or /usr/local/test.txt
*
* @param hdfsFile hdfs file path, may like /tmp/dir
* @return boolean true-success, false-failed
*
* @throws IOException file io exception
*/
public static boolean uploadLocalFile2HDFS(String localFile, String hdfsFile) throws IOException {
if (StringUtils.isBlank(localFile) || StringUtils.isBlank(hdfsFile)) {
return false;
}
hdfsFile = uri + hdfsFile;
Configuration config = new Configuration();
FileSystem hdfs = FileSystem.get(URI.create(uri), config);
Path src = new Path(localFile);
Path dst = new Path(hdfsFile);
hdfs.copyFromLocalFile(src, dst);
hdfs.close();
return true;
}
/*
* create a new file in the hdfs.
*
* notice that the toCreateFilePath is the full path
*
* and write the content to the hdfs file.
*/
/**
* create a new file in the hdfs.
* if dir not exists, it will create one
*
* @param newFile new file path, a full path name, may like '/tmp/test.txt'
* @param content file content
* @return boolean true-success, false-failed
* @throws IOException file io exception
*/
public static boolean createNewHDFSFile(String newFile, String content) throws IOException {
if (StringUtils.isBlank(newFile) || null == content) {
return false;
}
newFile = uri + newFile;
Configuration config = new Configuration();
FileSystem hdfs = FileSystem.get(URI.create(newFile), config);
FSDataOutputStream os = hdfs.create(new Path(newFile));
os.write(content.getBytes("UTF-8"));
os.close();
hdfs.close();
return true;
}
/**
* delete the hdfs file
*
* @param hdfsFile a full path name, may like '/tmp/test.txt'
* @return boolean true-success, false-failed
* @throws IOException file io exception
*/
public static boolean deleteHDFSFile(String hdfsFile) throws IOException {
if (StringUtils.isBlank(hdfsFile)) {
return false;
}
hdfsFile = uri + hdfsFile;
Configuration config = new Configuration();
FileSystem hdfs = FileSystem.get(URI.create(hdfsFile), config);
Path path = new Path(hdfsFile);
boolean isDeleted = hdfs.delete(path, true);
hdfs.close();
return isDeleted;
}
/**
* read the hdfs file content
*
* @param hdfsFile a full path name, may like '/tmp/test.txt'
* @return byte[] file content
* @throws IOException file io exception
*/
public static byte[] readHDFSFile(String hdfsFile) throws Exception {
if (StringUtils.isBlank(hdfsFile)) {
return null;
}
hdfsFile = uri + hdfsFile;
Configuration conf = new Configuration();
FileSystem fs = FileSystem.get(URI.create(hdfsFile), conf);
// check if the file exists
Path path = new Path(hdfsFile);
if (fs.exists(path)) {
FSDataInputStream is = fs.open(path);
// get the file info to create the buffer
FileStatus stat = fs.getFileStatus(path);
// create the buffer
byte[] buffer = new byte[Integer.parseInt(String.valueOf(stat.getLen()))];
is.readFully(0, buffer);
is.close();
fs.close();
return buffer;
} else {
throw new Exception("the file is not found .");
}
}
/**
* append something to file dst
*
* @param hdfsFile a full path name, may like '/tmp/test.txt'
* @param content string
* @return boolean true-success, false-failed
* @throws Exception something wrong
*/
public static boolean append(String hdfsFile, String content) throws Exception {
if (StringUtils.isBlank(hdfsFile)) {
return false;
}
if(StringUtils.isEmpty(content)){
return true;
}
hdfsFile = uri + hdfsFile;
Configuration conf = new Configuration();
// solve the problem when appending at single datanode hadoop env
conf.set("dfs.client.block.write.replace-datanode-on-failure.policy", "NEVER");
conf.set("dfs.client.block.write.replace-datanode-on-failure.enable", "true");
FileSystem fs = FileSystem.get(URI.create(hdfsFile), conf);
// check if the file exists
Path path = new Path(hdfsFile);
if (fs.exists(path)) {
try {
InputStream in = new ByteArrayInputStream(content.getBytes());
OutputStream out = fs.append(new Path(hdfsFile));
IOUtils.copyBytes(in, out, 4096, true);
out.close();
in.close();
fs.close();
} catch (Exception ex) {
fs.close();
throw ex;
}
} else {
HdfsUtils.createNewHDFSFile(hdfsFile, content);
}
return true;
}
}
HdfsUtilsTest .java
package test.com.xy6.demo.utils;
import static org.junit.Assert.assertEquals;
import java.util.ArrayList;
import java.util.List;
import org.junit.Test;
import com.xy6.demo.utils.HdfsUtils;
public class HdfsUtilsTest {
public static String uri = "hdfs://192.168.1.118:9000";
public String dir = "/user/output1";
public String parentDir = "/user";
@Test
public void testMkdirNull1() {
try{
assertEquals(false, HdfsUtils.mkdir(null));
assertEquals(false, HdfsUtils.mkdir(" "));
assertEquals(false, HdfsUtils.mkdir(""));
} catch(Exception ex){
assertEquals(true, false);
}
}
@Test
public void testMkdirNormal1() {
try{
HdfsUtils.deleteDir(dir);
boolean result = HdfsUtils.mkdir(dir);
assertEquals(true, result);
List<String> listFile = HdfsUtils.listAll(parentDir);
boolean existFile = false;
for(String elem : listFile){
if(elem.equals(uri + dir)){
existFile = true;
break;
}
}
assertEquals(true, existFile);
} catch(Exception ex){
ex.printStackTrace();
assertEquals(true, false);
}
}
@Test
public void testDeleteDirNull1() {
try{
assertEquals(false, HdfsUtils.deleteDir(null));
assertEquals(false, HdfsUtils.deleteDir(""));
assertEquals(false, HdfsUtils.deleteDir(" "));
} catch(Exception ex){
assertEquals(true, false);
}
}
@Test
public void testDeleteDir() {
try{
assertEquals(true, HdfsUtils.mkdir(dir));
assertEquals(true, HdfsUtils.deleteDir(dir));
List<String> listFile = HdfsUtils.listAll(parentDir);
boolean existFile = false;
for(String elem : listFile){
if(uri + dir == elem){
existFile = true;
break;
}
}
assertEquals(false, existFile);
} catch(Exception ex){
ex.printStackTrace();
assertEquals(true, false);
}
}
@Test
public void testListAllNull1() {
try{
List<String> listFile = new ArrayList<String>();
assertEquals(listFile.toString(), HdfsUtils.listAll(null).toString());
assertEquals(listFile.toString(), HdfsUtils.listAll(" ").toString());
assertEquals(listFile.toString(), HdfsUtils.listAll("").toString());
} catch(Exception ex){
assertEquals(true, false);
}
}
@Test
public void testListAllEmptyFolder() {
try{
HdfsUtils.deleteDir(dir);
assertEquals(true, HdfsUtils.mkdir(dir));
List<String> listFile = HdfsUtils.listAll(dir);
assertEquals(0, listFile.size());
} catch(Exception ex){
ex.printStackTrace();
assertEquals(true, false);
}
}
@Test
public void testListAllNotExistFolder() {
try{
HdfsUtils.deleteDir(dir);
List<String> listFile = HdfsUtils.listAll(dir);
assertEquals(0, listFile.size());
} catch(Exception ex){
assertEquals(true, true);
}
}
@Test
public void testUploadLocalFile2HDFSNull1() {
try{
assertEquals(false, HdfsUtils.uploadLocalFile2HDFS(null, null));
assertEquals(false, HdfsUtils.uploadLocalFile2HDFS("", ""));
assertEquals(false, HdfsUtils.uploadLocalFile2HDFS(" ", " "));
} catch(Exception ex){
assertEquals(true, false);
}
}
@Test
public void testUploadLocalFile2HDFS() {
String localFile = "F:/Program Files/eclipse/eclipse.ini";
String remoteFile = dir + "/eclipse.ini";
try{
HdfsUtils.mkdir(dir);
HdfsUtils.deleteHDFSFile(remoteFile);
assertEquals(true, HdfsUtils.uploadLocalFile2HDFS(localFile, remoteFile));
} catch(Exception ex){
ex.printStackTrace();
assertEquals(true, false);
}
}
@Test
public void testUploadLocalFile2HDFSLocalNotExist() {
String localFile = "F:/Program Files/eclipse/eclipse2.ini";
String remoteFile = dir + "/eclipse.ini";
try{
assertEquals(true, HdfsUtils.mkdir(dir));
HdfsUtils.deleteHDFSFile(remoteFile);
HdfsUtils.uploadLocalFile2HDFS(localFile, remoteFile);
} catch(Exception ex){
assertEquals(true, true);
}
}
@Test
public void testCreateNewHDFSFileNull1() {
try{
assertEquals(false, HdfsUtils.createNewHDFSFile(null, null));
assertEquals(false, HdfsUtils.createNewHDFSFile(" ", " "));
assertEquals(false, HdfsUtils.createNewHDFSFile("", ""));
} catch(Exception ex){
assertEquals(true, false);
}
}
@Test
public void testCreateNewHDFSFileNormal1() {
try{
String newFile = dir + "/file1.txt";
String content = "hello file1";
HdfsUtils.deleteHDFSFile(newFile);
assertEquals(true, HdfsUtils.createNewHDFSFile(newFile, content));
String result = new String(HdfsUtils.readHDFSFile(newFile));
assertEquals(content, result);
} catch(Exception ex){
ex.printStackTrace();
assertEquals(true, false);
}
}
@Test
public void testCreateNewHDFSFileFoldNotexist1() {
try{
String newFile = dir + "/file1.txt";
String content = "hello file1";
assertEquals(true, HdfsUtils.deleteDir(dir));
assertEquals(true, HdfsUtils.createNewHDFSFile(newFile, content));
} catch(Exception ex){
ex.printStackTrace();
assertEquals(true, false);
}
}
@Test
public void testDeleteHDFSFileNull1() {
try{
assertEquals(false, HdfsUtils.deleteHDFSFile(null));
assertEquals(false, HdfsUtils.deleteHDFSFile(" "));
assertEquals(false, HdfsUtils.deleteHDFSFile(""));
} catch(Exception ex){
assertEquals(true, false);
}
}
@Test
public void testDeleteHDFSFile() {
this.testUploadLocalFile2HDFS();
try{
String remoteFile = dir + "/eclipse.ini";
assertEquals(true, HdfsUtils.deleteHDFSFile(remoteFile));
} catch(Exception ex){
assertEquals(true, false);
}
}
@Test
public void testDeleteHDFSFileNotexist1() {
try{
String remoteFile = dir + "/eclipse2.ini";
assertEquals(false, HdfsUtils.deleteHDFSFile(remoteFile));
} catch(Exception ex){
assertEquals(true, false);
}
}
@Test
public void testReadHDFSFileNull1() {
try{
assertEquals(null, HdfsUtils.readHDFSFile(null));
assertEquals(null, HdfsUtils.readHDFSFile(" "));
assertEquals(null, HdfsUtils.readHDFSFile(""));
} catch(Exception ex){
assertEquals(true, false);
}
}
@Test
public void testReadHDFSFile() {
this.testUploadLocalFile2HDFS();
try{
String remoteFile = dir + "/eclipse.ini";
String result = new String(HdfsUtils.readHDFSFile(remoteFile));
assertEquals(true, result.length() > 0);
} catch(Exception ex){
ex.printStackTrace();
assertEquals(true, false);
}
}
@Test
public void testAppendNull1() {
try{
assertEquals(false, HdfsUtils.append(null, null));
assertEquals(false, HdfsUtils.append(" ", " "));
assertEquals(false, HdfsUtils.append("", ""));
} catch(Exception ex){
assertEquals(true, false);
}
}
@Test
public void testAppend() {
try{
String newFile = dir + "/file1.txt";
String content1 = "hello append1\r\n";
String content2 = "hello append2\r\n";
HdfsUtils.deleteHDFSFile(newFile);
assertEquals(true, HdfsUtils.createNewHDFSFile(newFile, ""));
assertEquals(true, HdfsUtils.append(newFile, content1));
assertEquals(content1, new String(HdfsUtils.readHDFSFile(newFile)));
assertEquals(true, HdfsUtils.append(newFile, content2));
assertEquals(content1 + content2, new String(HdfsUtils.readHDFSFile(newFile)));
} catch(Exception ex){
ex.printStackTrace();
assertEquals(true, false);
}
}
}
如果文章对你有帮助,请随意打赏,这将鼓励我写出更好的文章:)