Spark 读取 HDFS 上的 Zip 文件
import java.util.zip.ZipInputStream;
import java.io.BufferedReader;
import java.io.InputStreamReader;
// Path of the zip archive to read. "xxxx.zip" looks like a placeholder value —
// replace it with a real location before running.
// NOTE(review): presumably meant to be passed to loadZip; the call site is not visible here.
val path = "xxxx.zip"
def loadZip(path:String)={
val minPartitions =10
sc.binaryFiles(path, minPartitions)
.flatMap {
原创
2021-07-29 14:45:01 ·
404 阅读 ·
0 评论