Python 操作 HDFS

from hdfs.client importClient#关于python操作hdfs的API可以查看官网:#https://hdfscli.readthedocs.io/en/latest/api.html

#读取hdfs文件内容,将每行存入数组返回

def read_hdfs_file(client, filename):
    """Read a text file from HDFS and return its lines as a list.

    Args:
        client: HDFS client object whose ``read`` method returns a context
            manager (the script in this file passes an
            ``hdfs.client.Client``).
        filename: HDFS path of the file to read.

    Returns:
        A list with one string per item yielded by the reader, each with
        leading and trailing whitespace removed by ``str.strip``.
    """
    with client.read(filename, encoding='utf-8', delimiter='\n') as reader:
        # A comprehension is used instead of the builtin ``list()`` because
        # this file rebinds the name ``list`` to a helper function.
        return [line.strip() for line in reader]


# Create a directory

def mkdirs(client, hdfs_path):
    """Create a directory on HDFS by calling ``client.makedirs``.

    Args:
        client: HDFS client object exposing ``makedirs``.
        hdfs_path: HDFS path of the directory to create.

    Returns:
        None. Whatever ``client.makedirs`` returns is discarded.
    """
    client.makedirs(hdfs_path)


# Delete an HDFS file

def delete_hdfs_file(client, hdfs_path):
    """Delete a path on HDFS by calling ``client.delete``.

    Args:
        client: HDFS client object exposing ``delete``.
        hdfs_path: HDFS path to delete.

    Returns:
        None. The result of ``client.delete`` is not propagated.
    """
    client.delete(hdfs_path)


# Upload a file to HDFS

def put_to_hdfs(client, local_path, hdfs_path):
    """Upload a local file to HDFS by calling ``client.upload``.

    Note the argument order: this helper takes the local path first, while
    ``client.upload`` is called with the HDFS destination first.

    Args:
        client: HDFS client object exposing ``upload``.
        local_path: Path of the file on the local filesystem.
        hdfs_path: Destination path on HDFS.

    Returns:
        None. The result of ``client.upload`` is not propagated.
    """
    # cleanup=True: per the HdfsCLI docs, partially uploaded files are
    # removed if the upload fails.
    client.upload(hdfs_path, local_path, cleanup=True)


# Download a file from HDFS to the local filesystem

def get_from_hdfs(client, hdfs_path, local_path):
    """Download a file from HDFS by calling ``client.download``.

    Args:
        client: HDFS client object exposing ``download``.
        hdfs_path: Source path on HDFS.
        local_path: Destination path on the local filesystem.

    Returns:
        None. The result of ``client.download`` is not propagated.
    """
    # overwrite=False is passed explicitly so an existing local target is
    # not replaced (behaviour as described in the HdfsCLI docs).
    client.download(hdfs_path, local_path, overwrite=False)


# Append data to an HDFS file

def append_to_hdfs(client, hdfs_path, data):
    """Append data to an HDFS file by calling ``client.write`` in append mode.

    Args:
        client: HDFS client object exposing ``write``.
        hdfs_path: Path of the target file on HDFS.
        data: Content to append; it is passed to ``client.write`` together
            with ``encoding='utf-8'``.

    Returns:
        None. The result of ``client.write`` is not propagated.
    """
    client.write(hdfs_path, data, overwrite=False, append=True, encoding='utf-8')


# Overwrite an HDFS file with new data

def write_to_hdfs(client, hdfs_path, data):
    """Write data to an HDFS file by calling ``client.write`` in overwrite mode.

    Args:
        client: HDFS client object exposing ``write``.
        hdfs_path: Path of the target file on HDFS.
        data: Content to write; it is passed to ``client.write`` together
            with ``encoding='utf-8'``.

    Returns:
        None. The result of ``client.write`` is not propagated.
    """
    client.write(hdfs_path, data, overwrite=True, append=False, encoding='utf-8')


# Move or rename a file

def move_or_rename(client, hdfs_src_path, hdfs_dst_path):
    """Move or rename a path on HDFS by calling ``client.rename``.

    Args:
        client: HDFS client object exposing ``rename``.
        hdfs_src_path: Existing HDFS path.
        hdfs_dst_path: New HDFS path.

    Returns:
        None. The result of ``client.rename`` is not propagated.
    """
    client.rename(hdfs_src_path, hdfs_dst_path)


# Return the entries of a directory

def list(client, hdfs_path):
    """Return the entries of an HDFS directory via ``client.list``.

    NOTE: this function shadows the builtin ``list`` for the rest of the
    module; the name is kept so existing callers continue to work.

    Args:
        client: HDFS client object exposing ``list``.
        hdfs_path: HDFS path of the directory to list.

    Returns:
        Whatever ``client.list(hdfs_path, status=False)`` returns.
    """
    return client.list(hdfs_path, status=False)


# Client construction examples:
# client = Client(url, root=None, proxy=None, timeout=None, session=None)
# client = Client("http://hadoop:50070")

# Module-level demo: build a client for the WebHDFS endpoint, then upload one
# local file with the helper defined in this file.
client = Client(
    "http://120.78.186.82:50070/",
    root="/",
    timeout=10000,
    session=False,
)
# Alternative construction:
# client = InsecureClient("http://120.78.186.82:50070", user='ann')

put_to_hdfs(client, local_path='D:\\bbb.txt', hdfs_path='/file')

# Further usage examples (uncomment to run):
# move_or_rename(client, '/input/2.csv', '/input/emp.csv')
# read_hdfs_file(client, '/input/emp.csv')
# append_to_hdfs(client, '/input/emp.csv', 'I love you' + '\n')
# write_to_hdfs(client, '/emp.csv', "sadfafdadsf")
# move_or_rename(client, '/input/emp.csv', '/input/2.csv')
# mkdirs(client, '/input/python')
# print(list(client, '/'))
# chown(client, '/input/1.csv', 'root')  # NOTE(review): no chown helper is visible in this file

  • 0
    点赞
  • 0
    收藏
    觉得还不错? 一键收藏
  • 0
    评论
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值