import numpy as np
from sklearn import datasets
import pandas as pd
INPUT_PATH = r'E:\dataset\clusterData\ecoli.csv'
OUTPUT_PATH = r'E:\dataset\clusterData\ecoli_1.csv'


def encode_labels(values):
    """Replace each distinct label with an integer code.

    Codes are handed out in order of first appearance (the first distinct
    label seen becomes 0, the next one 1, ...), so the mapping is identical
    on every run. Iterating a ``set`` of strings, by contrast, can yield a
    different order per interpreter run because of hash randomization.

    Args:
        values: 1-D sequence of hashable labels (list, ndarray, Series...).

    Returns:
        A ``(codes, uniques)`` tuple: ``codes`` is an integer ndarray with
        one entry per input value, ``uniques`` is the list of distinct
        labels such that ``uniques[codes[i]] == values[i]``. Missing values
        (NaN/None) get pandas' sentinel code ``-1`` and are not listed in
        ``uniques``.
    """
    # dtype=object stops numpy from coercing mixed labels to one string type.
    codes, uniques = pd.factorize(np.asarray(values, dtype=object))
    return codes, list(uniques)


def main():
    """Read the CSV, encode its label column as integers, write the result."""
    data = pd.read_csv(INPUT_PATH, header=None)

    # Keep columns 1..8 (column 0 is dropped); column 8 holds the label.
    X = data.iloc[:, 1:9].copy()

    # All codes are computed from the untouched labels and assigned in one
    # step, so a numeric label can never be confused with an already
    # assigned code (which an in-place, label-by-label rewrite allows).
    codes, uniques = encode_labels(X.iloc[:, -1])

    # Show which label got which code so the output file can be decoded.
    print({label: code for code, label in enumerate(uniques)})

    X[X.columns[-1]] = codes
    X.to_csv(OUTPUT_PATH, index=None, header=None)


if __name__ == "__main__":
    main()
# Reportedly pandas offers a quicker way to do this; suggestions are welcome in the comments.