import pandas as pd
# Minimal example: one-hot encode every categorical column of a small frame.
# (String literals use plain ASCII quotes; typographic quotes are a syntax error.)
df = pd.DataFrame([
    ["green", "A"],
    ["red", "B"],
    ["blue", "A"],
])
df.columns = ["color", "class"]
# get_dummies replaces each string column with one indicator column per
# distinct value: color_blue, color_green, color_red, class_A, class_B.
pd.get_dummies(df)
https://blog.csdn.net/maymay_/article/details/80198468
https://juejin.im/post/6885614731982766088
对分类特征进行One-Hot编码
def oneHotEncode(df, colNames):
    """One-hot encode the object-dtype columns listed in ``colNames``.

    Each listed column whose dtype is ``object`` is replaced by indicator
    columns produced by ``pandas.get_dummies`` and named ``<col>_<value>``;
    the new columns are appended on the right. Listed columns with any other
    dtype are left unchanged.

    Args:
        df: The dataset (a pandas DataFrame).
        colNames: Iterable of column names to consider for encoding.

    Returns:
        A DataFrame with the encoded columns replaced by their indicator
        columns. The frame passed in by the caller is not modified.

    Raises:
        KeyError: If a name in ``colNames`` is not a column of ``df``.
    """
    for col in colNames:
        # Only object-dtype columns are treated as categorical here.
        if not pd.api.types.is_object_dtype(df[col]):
            continue
        # pandas.get_dummies performs the one-hot encoding of the column.
        dummies = pd.get_dummies(df[col], prefix=col)
        # Append the indicators and drop the encoded source column; rebinding
        # (rather than dropping in place) keeps the caller's frame untouched.
        df = pd.concat([df, dummies], axis=1).drop(columns=[col])
    return df
df:数据集(pandas DataFrame)
colNames:需要进行 One-Hot 编码的分类特征列名列表
####大佬带手撕代码的时候,建议还是要自己一个个来转换,手动解析输出并转换