// A highlighted block
import java.io.BufferedReader;
import java.io.IOException;
import java.io.InputStreamReader;
import java.net.URI;
import java.nio.charset.StandardCharsets;
import java.util.ArrayList;
import java.util.List;
import org.apache.hadoop.conf.Configuration;
import org.apache.hadoop.fs.FSDataInputStream;
import org.apache.hadoop.fs.FileSystem;
import org.apache.hadoop.fs.Path;
/**
 * Reads a text file through the Hadoop {@link FileSystem} API and returns its lines.
 *
 * <p>Reading is best-effort: if the path cannot be resolved or an I/O error occurs, the
 * failure is reported on standard error and the lines collected so far (possibly none)
 * are returned instead of an exception being thrown.
 *
 * <p>The file content is decoded as UTF-8 so the result does not depend on the default
 * charset of the JVM that happens to run this code.
 *
 * @param hdfsTxtPath location of the text file; parsed as a URI to select the file system
 *     and also used as the path that is opened
 * @param conf Hadoop configuration passed to {@link FileSystem#get(URI, Configuration)}
 * @return a mutable list with one entry per line, in file order and without line
 *     terminators; never {@code null}
 */
public static List<String> getHdfsTxt(String hdfsTxtPath, Configuration conf) {
    List<String> lines = new ArrayList<>();
    try {
        // The FileSystem is deliberately not closed here: FileSystem.get may return a
        // cached instance shared with other callers, and closing it would break them.
        FileSystem fs = FileSystem.get(URI.create(hdfsTxtPath), conf);
        // Closing the reader also closes the wrapped HDFS input stream.
        try (BufferedReader reader = new BufferedReader(
                new InputStreamReader(fs.open(new Path(hdfsTxtPath)), StandardCharsets.UTF_8))) {
            String line;
            while ((line = reader.readLine()) != null) {
                lines.add(line);
            }
        }
    } catch (IOException | RuntimeException e) {
        // Keep the historical contract: never throw, return whatever was read. Runtime
        // exceptions (e.g. a null or malformed path) are included because the original
        // caught every Exception.
        System.err.println("Failed to read HDFS file: " + hdfsTxtPath);
        e.printStackTrace();
    }
    return lines;
}
Java逐行读取HDFS文件
最新推荐文章于 2024-05-12 00:07:25 发布