# 机器学习之Logistic回归解析及实例应用
# (Machine learning: logistic regression analysis with a worked example)
from numpy import *
import matplotlib.pyplot as plt
from matplotlib.font_manager import FontProperties
def loadDataSet():
    """Load the sample data set from 'testSet.txt'.

    Each line of the file holds two feature values followed by an integer
    class label, whitespace-separated.  A constant 1.0 is prepended to
    every feature vector to serve as the x0 (bias/intercept) term.

    Returns:
        dataMat (list[list[float]]): rows of [1.0, x1, x2].
        labelMat (list[int]): the class label of each row.
    """
    dataMat = []
    labelMat = []
    # 'with' guarantees the handle is closed even on error
    # (the original opened the file and never closed it).
    with open('testSet.txt') as fr:
        for line in fr:
            # strip the trailing newline/whitespace and split on whitespace
            lineArr = line.strip().split()
            # prepend 1.0 as the bias feature x0, then the two real features
            dataMat.append([1.0, float(lineArr[0]), float(lineArr[1])])
            # third column is the class label
            labelMat.append(int(lineArr[2]))
    return dataMat, labelMat
def sigmoid(inX):
    """Numerically stable sigmoid function.

    Uses the identity sigmoid(x) = 0.5 * (1 + tanh(x / 2)), which is
    mathematically identical to 1 / (1 + exp(-x)) but never overflows:
    exp(-inX) overflows (RuntimeWarning, result 0.0) for inX << 0,
    whereas tanh saturates cleanly at +/-1.  Works on scalars and
    numpy arrays alike (tanh comes from the file's numpy star-import).

    Args:
        inX: scalar or numpy array input.

    Returns:
        sigmoid(inX), same shape as the input, in (0, 1).
    """
    return 0.5 * (1.0 + tanh(0.5 * inX))
def stocGradAscent1(dataMatrix, classLabels, numIter=150):
    """Improved stochastic gradient ascent for logistic regression.

    Performs numIter full passes over the data.  Within each pass every
    sample is used exactly once, in random order, with a learning rate
    that decays as updates accumulate.

    Args:
        dataMatrix: (m, n) numpy array of samples (x0 = 1.0 included).
        classLabels: length-m sequence of 0/1 class labels.
        numIter: number of passes over the data set (default 150).

    Returns:
        weights: final (n,) coefficient vector.
        weights_array: (numIter*m, n) array — the weights after every
            single update, for convergence plotting.
    """
    m, n = shape(dataMatrix)
    weights = ones(n)  # initialise every coefficient to 1
    # Collect history rows in a Python list: calling numpy append() inside
    # the loop (as the original did) copies the whole array each step,
    # i.e. O(steps^2) overall.
    history = []
    for j in range(numIter):
        dataIndex = list(range(m))  # indices of samples not yet used this pass
        for i in range(m):
            # decaying step size; the +0.01 floor keeps it from reaching 0
            alpha = 4 / (1.0 + j + i) + 0.01
            # draw a random position among the *remaining* indices …
            randIndex = int(random.uniform(0, len(dataIndex)))
            # … and map it to the actual sample number.  (Bug fix: the
            # original indexed dataMatrix with randIndex directly, which
            # biases selection toward low row numbers and defeats the
            # intended sampling-without-replacement.)
            chosen = dataIndex[randIndex]
            h = sigmoid(sum(dataMatrix[chosen] * weights))
            error = classLabels[chosen] - h
            # gradient-ascent update on the chosen sample
            weights = weights + alpha * error * dataMatrix[chosen]
            history.append(weights)
            del(dataIndex[randIndex])  # never reuse this sample this pass
    weights_array = array(history).reshape(numIter * m, n)
    return weights, weights_array
def plotWeights(weights_array):
    """Plot the convergence of the three regression coefficients.

    Draws W0, W1 and W2 in three stacked subplots against the update
    index, so the damping of the stochastic updates can be inspected.

    Args:
        weights_array: (steps, 3) array — one row of weights per update.
    """
    fig = plt.figure()
    # SimSun ships with Windows only; fall back to the default font
    # elsewhere so the plot still renders (the CJK x-label may then show
    # as boxes).  NOTE(review): FontProperties may defer the file check
    # to draw time — confirm on a non-Windows host.
    try:
        font = FontProperties(fname=r"c:\windows\fonts\simsun.ttc", size=14)
    except Exception:
        font = FontProperties(size=14)
    x = arange(0, len(weights_array), 1)
    ax1 = fig.add_subplot(3, 1, 1)
    ax1.plot(x, weights_array[:, 0])
    plt.ylabel('W0')
    ax2 = fig.add_subplot(3, 1, 2)
    ax2.plot(x, weights_array[:, 1])
    plt.ylabel('W1')
    ax3 = fig.add_subplot(3, 1, 3)
    ax3.plot(x, weights_array[:, 2])
    plt.xlabel('迭代次数', fontproperties=font)
    # bug fix: this subplot shows column 2, so label it W2 (was 'W3')
    plt.ylabel('W2')
    plt.show()
if __name__ == '__main__':
    # Load the sample set, fit the coefficients with stochastic gradient
    # ascent, then visualise how each coefficient converges.
    features, labels = loadDataSet()
    final_weights, weight_history = stocGradAscent1(array(features), labels)
    plotWeights(weight_history)