# -*- coding: utf-8 -*-
"""
@Time : 2022/5/5 10:11
@Author : Mr Wang
@FileName: main_usepd.py
@SoftWare: PyCharm
"""
import pandas as pd
import numpy as np
# Raise pandas' 'display.max_rows' option to 2000.
pd.set_option('display.max_rows', 2000)
import matplotlib.pyplot as plt
# Use the KaiTi font for sans-serif text in matplotlib
# (presumably so Chinese labels render correctly -- confirm the font is installed).
plt.rcParams['font.sans-serif'] = ['KaiTi']
# Data cleaning: values that do not match a known label are replaced with NaN
def data_clean(sex):
    """Normalize a raw gender value to 'female' or 'male'.

    Args:
        sex: Raw value to normalize; it is compared by equality against
            the accepted spellings (matching is case-sensitive).

    Returns:
        'female' for 'f' or 'female', 'male' for 'm' or 'male', and
        ``np.nan`` for any other value.
    """
    if sex in ('f', 'female'):
        return 'female'
    if sex in ('m', 'male'):
        return 'male'
    # np.NAN was removed in NumPy 2.0; np.nan is the supported spelling.
    return np.nan
if __name__ == '__main__':
    # Raw string: the backslashes in this Windows path would otherwise be
    # parsed as (invalid) escape sequences such as \p, \d and \s.
    path = r'E:\python\data_mining\codes1\lect01_proj\survey.csv'
    # usecols limits loading to the columns that are needed.
    df = pd.read_csv(path, usecols=['Country', 'Gender'])
    # Rename the columns to short names.
    df = df.rename(columns={'Country': 'cou', 'Gender': 'gen'})
# prin
# Source article: "pandas操作csv以及可视化操作(实例)" (pandas CSV handling and visualization, worked example)
# First published 2022-05-05 16:54:26