# Data-handling cheat sheet: matplotlib font setup plus examples of reading
# Excel, text and CSV files. Only the font setup and the CSV read are live
# code; the other examples are kept commented out for reference.
import numpy
import pandas as pd
import matplotlib.pyplot as plt

# Plot settings
plt.rcParams['font.sans-serif'] = ['SimHei']  # use the SimHei font so Chinese labels render
plt.rcParams['axes.unicode_minus'] = False  # display the minus sign correctly

# Read an Excel file
# df = pd.read_excel('data1.xlsx', engine='openpyxl')
# print(df.head())

# Read a txt file
# with open('data.txt', encoding='utf-8') as file:
#     content = file.read()
# print(content.rstrip())  # rstrip() strips trailing whitespace, including blank lines at the end

# Read the data line by line
# (file.read() returns one string, so split it; iterating the string itself
# would yield single characters rather than lines)
# for line in content.splitlines():
#     print(line)

# Write a txt file
# filename = 'data.txt'
# with open(filename, 'w') as file:
#     file.write('python\n')
#     file.write('java\n')

# Read a CSV file / select columns / de-duplicate
df = pd.read_csv('1type.csv')
# df = df[['temp', 'isweekend', 'type']]  # select several columns
# pd.unique(df.column): unique() de-duplicates a single column, e.g. unique(cpc.日期)
# df = pd.Series(pd.unique(df['temp']))
# drop_duplicates() de-duplicates across several columns
# NOTE(review): the original example for drop_duplicates() is cut off in the source text.
一些 Python 数据处理方法总结
最新推荐文章于 2024-05-15 12:59:31 发布