1. 定类数据各类别数查看及可视化
# Prerequisite library: pandas
# Inspect the label column: print how many labelled samples fall into each
# category, most frequent first. 'column' is a placeholder for the real
# column name; `DataFrame` is presumably a pandas DataFrame variable defined
# earlier -- confirm against the surrounding script.
print(DataFrame['column'].value_counts(sort=True))
# Graphical view: draw the per-category counts as a bar chart.
from matplotlib import pyplot as plt
DataFrame['target_column'].value_counts().plot(kind='bar')
plt.title("name")
plt.xlabel("name")
plt.ylabel("name")
# show must actually be called; a bare `plt.show` only references the
# function object and never renders the figure.
plt.show()
2. 将定类数据各类别替换为数值
# Nested mapping: column name -> {category label: numeric code}.
# All names below are placeholders to be replaced with the real column and
# category values.
objects_replace = {
    "column_name": {
        "object1": 1,
        "object2": 0,
        # ... add the remaining "category": number pairs here
    },
}
# Apply the mapping and store the result under a new name.
# NOTE(review): assumes DF1 is a pandas DataFrame, in which case replace()
# returns a new frame and leaves DF1 untouched -- confirm.
DF2 = DF1.replace(objects_replace)