python——将类别数据转化为数值数据

LabelEncoder

# 数据预处理-将类别数据转化为数值数据
import numpy as np
import pandas as pd
from sklearn.preprocessing import LabelEncoder


# 加载数据
def loaddata():
    """Load the iris data set from ``data/iris.data``.

    The file is read as a header-less CSV whose last column holds the
    class name and whose preceding columns hold the measurements.

    Returns:
        tuple: ``(X, y)`` where ``X`` is the 2-D array of feature columns
        and ``y`` is a 1-D object array with the raw class labels.
    """
    columns = ['sepal_length', 'sepal_width', 'petal_length', 'petal_width', 'type']
    data = pd.read_csv('data/iris.data', header=None, names=columns)
    # Slice the feature columns *before* converting to NumPy: converting the
    # whole frame at once mixes numbers with the string label column and
    # forces the feature matrix to dtype=object.
    X = data.iloc[:, :-1].to_numpy()
    # Labels are returned untouched (still strings) so the caller can encode them.
    y = data.iloc[:, -1].to_numpy(dtype=object)
    return X, y


if __name__ == '__main__':
    # Read the feature matrix and the raw class labels.
    X, y = loaddata()
    # Collect the distinct class names the encoder has to learn.
    label = np.unique(y)

    # Fit the encoder on the distinct names, then replace every label
    # with the encoded value produced by the fitted encoder.
    le = LabelEncoder().fit(label)
    y = le.transform(y)
    print(y)

pd.Categorical(series).codes

# 数据预处理-将类别数据转化为数值数据
import numpy as np
import pandas as pd


# 加载数据
def loaddata():
    """Load ``data/iris.data`` and encode the class column as category codes.

    The class column is replaced by ``pd.Categorical(...).codes`` before the
    frame is converted to a single NumPy array.

    Returns:
        tuple: ``(X, y)`` where ``X`` is every column but the last and ``y``
        is the last column (the category codes) of that array.
    """
    header = ['sepal_length', 'speal_width', 'petal_length', 'petal_width', 'type']
    frame = pd.read_csv('data/iris.data', names=header, header=None)
    # Swap the class names for their categorical codes.
    class_codes = pd.Categorical(frame['type']).codes
    frame['type'] = class_codes
    matrix = frame.to_numpy()
    # Last column is the target; everything before it is a feature.
    return matrix[:, :-1], matrix[:, -1]


if __name__ == '__main__':
    # Fetch the data set, then unpack it into features and encoded labels.
    dataset = loaddata()
    X, y = dataset
    # Show the encoded labels.
    print(y)

字典映射

# 数据预处理-将类别数据转化为数值数据
import numpy as np
import pandas as pd


# 加载数据
def loaddata():
    """Load ``iris.data`` and encode the class column through a fixed dict.

    Each class name is looked up in an explicit name-to-number mapping and
    the column is cast to ``int`` before the frame is converted to a single
    NumPy array.

    Returns:
        tuple: ``(X, y)`` where ``X`` is every column but the last and ``y``
        is the last column (the mapped class numbers) of that array.
    """
    header = ['sepal_length', 'speal_width', 'petal_length', 'petal_width', 'type']
    frame = pd.read_csv('iris.data', names=header, header=None)
    # Explicit class-name -> number lookup table.
    class_ids = {'Iris-setosa': 0, 'Iris-versicolor': 1, 'Iris-virginica': 2}
    mapped = frame['type'].map(class_ids)
    frame['type'] = mapped.astype(int)
    matrix = frame.to_numpy()
    # Last column is the target; everything before it is a feature.
    return matrix[:, :-1], matrix[:, -1]


if __name__ == '__main__':
    # Fetch the data set, then unpack it into features and mapped labels.
    dataset = loaddata()
    X, y = dataset
    # Show the mapped labels.
    print(y)
[0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.
 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0. 0.
 0. 0. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.
 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1. 1.
 1. 1. 1. 1. 2. 2. 2. 2. 2. 2. 2. 2. 2. 2. 2. 2. 2. 2. 2. 2. 2. 2. 2. 2.
 2. 2. 2. 2. 2. 2. 2. 2. 2. 2. 2. 2. 2. 2. 2. 2. 2. 2. 2. 2. 2. 2. 2. 2.
 2. 2. 2. 2. 2. 2.]
评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值