在 http://blog.csdn.net/zouxy09/article/details/17589329 上看到了聚类分析算法,但该代码基于 Python 2.7.5 版本,直接移植到 Python 3.6 会出现问题。修改代码后,为了便于对比,增加了绘制原始数据的部分;代码如下:
#################################################
# Runs on Python 3.6
# time: 20170501
# version
# liouwuzhou
# Email : liouwuzhou@139.com
#################################################
import numpy as np


def euclDistance(vector1, vector2):
    """Return the Euclidean distance between two equally shaped vectors.

    Args:
        vector1: Array-like of numbers (list, ``ndarray`` or a 1 x d
            ``numpy.matrix`` row).
        vector2: Array-like with the same shape as ``vector1``.

    Returns:
        The square root of the sum of squared element-wise differences,
        as a NumPy floating-point scalar.
    """
    difference = np.asarray(vector2) - np.asarray(vector1)
    # np.sum is spelled out on purpose: the builtin ``sum`` iterates over the
    # first axis only, so a 1 x d row would come back as a row, not a scalar.
    return np.sqrt(np.sum(np.power(difference, 2)))


def initCentroids(dataSet, k):
    """Pick ``k`` rows of ``dataSet`` at random as initial centroids.

    Rows are drawn without replacement whenever ``k`` does not exceed the
    number of samples, so the same sample is never selected twice.  When
    ``k`` is larger than the number of samples, rows are drawn with
    replacement so that the call still succeeds.

    Args:
        dataSet: 2-D ``ndarray`` or ``numpy.matrix``, one sample per row.
        k: Number of centroids to pick.

    Returns:
        A ``(k, dim)`` float ``ndarray`` whose rows are copied from
        ``dataSet``.

    Raises:
        ValueError: If ``dataSet`` has no rows while ``k`` is positive.
    """
    numSamples, dim = dataSet.shape
    if numSamples == 0 and k > 0:
        raise ValueError("cannot pick centroids from an empty data set")

    # Uses the global NumPy random state, so np.random.seed() makes the
    # selection reproducible.
    # NOTE(review): distinct starting rows presumably avoid identical
    # centroids in the clustering loop; that loop is not visible here.
    indices = np.random.choice(numSamples, size=k, replace=k > numSamples)

    # Fancy indexing on the plain-array view returns a fresh (k, dim) copy.
    return np.asarray(dataSet, dtype=float)[indices, :]


# NOTE(review): the source text is cut off partway through ``kmeans``.  The
# visible fragment is preserved verbatim on the next line and is unmodified.
# def kmeans(dataSet, k): numSamples = dataSet.shape[0] clusterAssment = mat(zeros((numSamples, </