import numpy as np
import matplotlib.pyplot as plt
from sklearn import datasets
from sklearn.metrics import accuracy_score
from sklearn.model_selection import train_test_split
from sklearn.metrics.pairwise import rbf_kernel
from sklearn.svm import SVC
from time import time
class lssvm:
def __init__(self):
# self.model = 'svm' # 'svm', 'lssvm', 'twsvm'
# self.method = 'ovo' # Multi-class method. 'ovo': One vs One, 'ova': One vs All
# Kernel settings
self.kernel_type = 'rbf' # 'linear', 'poly', 'rbf', 'erbf', 'tanh', 'lspline'
self.b = 1 # constant multiplier for hyperbolic tangent
self.c = 1 # constant sum for polynomial, tangent and linear splines
self.d = 2 # polynomial power
self.sigma = 0.5 # RBF and ERBF sigma
# SVM settings
self.C = 0.01 # soft margin
#
self.alpha = None # Lagrange multiplier (SVM and LSSVM)
self.SV = None # Support vectors
self.bias = 1 # bias
# Kernel types
# linear : linear
# poly : polynomial
        # rbf    : radial basis Gaussian function (RBF)
        # erbf   : radial basis exponential
# tanh : hyperbolic tangent
# lspline: linear splines
return
def kernel(self, x1, x2):
# Input parameters
# t = kernel type
# linear: linear
# poly: polynomial
        # rbf: radial basis Gaussian function (RBF)
        # erbf: radial basis exponential
# tanh: hyperbolic tangent
# lspline: linear splines
# b: constant multiplier for hyperbolic tangent
# c: constant sum for polynomial, tangent and linear splines
# d: polynomial and linear splines power indicator
# sigma: free parameter for RBF and exponential base
        # One problem with the polynomial kernel is that it may suffer
        # from numerical instability:
        # when x1^T x2 + c < 1, k(x1, x2) = (x1^T x2 + c)^d tends to zero as d increases,
        # whereas when x1^T x2 + c > 1, k(x1, x2) tends to infinity.
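        # Illustration (hypothetical numbers, not the defaults set in __init__):
        # with c = 0 and d = 10, an inner product of 0.5 gives 0.5 ** 10 ~ 9.8e-4,
        # while 1.5 gives 1.5 ** 10 ~ 57.7, so the exponent magnifies small
        # differences in scale; normalizing the inputs mitigates this.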
#
        # Treat a 1-D input as a column of single-feature samples
        if x1.ndim == 1:
            x1 = x1[:, None]
        if x2.ndim == 1:
            x2 = x2[:, None]
m1 = x1.shape[0]
m2 = x2.shape[0]
k = np.zeros((m1, m2))
t = self.kernel_type
b = self.b
c = self.c
d = self.d
sigma = self.sigma
for i in range(m1):
for j in range(m2):
# Linear kernel
if t == 'linear':
k[i, j] = x1[i] @ x2[j]
# Polynomial kernel
elif t == 'poly':
k[i, j] = (x1[i] @ x2[j] + c) ** d
# Radial base gaussian function (RBF)
elif t == 'rbf':
k[i, j] = np.exp(-(x1[i] - x2[j]) @ (x1[i] - x2[j]) / (2 * sigma ** 2))
                # Radial basis exponential function (uses the Euclidean norm so the
                # result is a scalar even for multi-feature inputs)
                elif t == 'erbf':
                    k[i, j] = np.exp(-np.linalg.norm(x1[i] - x2[j]) / (2 * sigma ** 2))
# Hyperbolic tangent
elif t == 'tanh':
k[i, j] = np.tanh(b * (x1[i] @ x2[j]) + c)
                # Linear splines (elementwise; features combined by a product, which
                # reduces to the original scalar formula for single-feature inputs)
                elif t == 'lspline':
                    mn = np.minimum(x1[i], x2[j])
                    k[i, j] = np.prod(c + x1[i] * x2[j] + x1[i] * x2[j] * mn
                                      + 1 / 2 * (x1[i] + x2[j]) * mn ** d)
return k
def lssvm_predict(self, X_test, X_train, y_train):
"""
Predict LS-SVM values.
Input
X_test: test set. Numeric normalized values or categorical values
encoded as numeric.
X_train: train set. Numeric normalized values or categorical values
encoded as numeric.
y_train: train set, y={-1, 1} or y={0, 1}. Vector if binary,
                 one-hot encoded if multiclass.
Output
y_hat: predicted values
"""
        y_train = np.where(y_train == 0, -1, y_train)
        # y_hat = np.sign(np.sum(self.alpha * y_train * self.kernel(X_train, X_test), axis=0,
        #                        keepdims=True) + self.bias).T
        # sklearn's rbf_kernel computes exp(-gamma * ||x1 - x2||^2), so gamma = 1 / (2 * sigma^2)
        # matches the sigma convention used by the custom RBF kernel above
        y_hat = np.sign(np.sum(self.alpha * y_train
                               * rbf_kernel(X_train, X_test, gamma=1 / (2 * self.sigma ** 2)),
                               axis=0, keepdims=True) + self.bias).T
        y_hat = np.where(y_hat == -1, 0, y_hat)
        return y_hat
def lssvm_fit(self, X_train, y_train):
"""
Train LS-SVM model. Parameters defined in the svm object. Trained values
stored in the svm object.
Input
X_train: train set. Numeric normalized values or categorical
values encoded as numeric.
y_train: train set, y={-1, 1} or y={0, 1}. Vector if binary,
                 one-hot encoded if multiclass.
SVM parameter
C: SVM soft margin
Kernel parameters
t: kernel type: 'linear', 'poly', 'rbf', 'erbf','tanh',
'lspline'
b: constant multiplier for hyperbolic tangent
c: constant sum for polynomial, hyperbolic tangent and
linear splines
d: polynomial and linear splines power indicator
sigma: free parameter for RBF and exponential base
Output
Trained model stored in svm object.
"""
y_train = np.where(y_train == 0, -1, y_train)
N = X_train.shape[0]
# y_train = y_train[:,None]
# nc = y_train.shape[1]
        # K = self.kernel(X_train, X_train)
        # As in lssvm_predict, sklearn's rbf_kernel expects gamma = 1 / (2 * sigma^2)
        K = rbf_kernel(X_train, X_train, gamma=1 / (2 * self.sigma ** 2))
        # 3. Compute omega. It must be a float array: an integer dtype (np.zeros((N, N), int))
        # would truncate the kernel values to 0/1 and wreck the solution.
        omega = np.zeros((N, N))
        for k in range(K.shape[0]):
            for l in range(K.shape[1]):
                omega[k, l] = y_train[k] * y_train[l] * K[k, l]
# 4. Build Matrix A and vector b
I = np.eye(omega.shape[0])
ZZCI = omega + self.C ** -1 * I
# 4.1 Build matrix A
A11 = np.zeros((1, 1)) # Element A(1,1)
A1 = np.hstack((A11, -y_train.T)) # Row 1
A2 = np.hstack((y_train, ZZCI)) # Row 2
# Build matrix A
A = np.vstack((A1, A2))
# 4.2 Output vector b
b = np.vstack((np.zeros((1, 1)), np.ones((N, 1))))
# 5. Solve the linear equation Ax = b
x = np.linalg.solve(A, b)
        self.bias = x[0]
        self.alpha = x[1:]
return
if __name__ == '__main__':
    X, y = datasets.make_blobs(n_samples=5000, n_features=2,
                               centers=2, cluster_std=[2.0, 2.0], random_state=12)
    plt.scatter(X[:, 0], X[:, 1], c=y)
    plt.show()
    # X, y = datasets.load_breast_cancer(return_X_y=True)
    print("nDim =", X.shape[1])
    X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=100)
    y_train = y_train[:, None]
    s_time = time()
    model = lssvm()
    model.lssvm_fit(X_train=X_train, y_train=y_train)
    y_hat = model.lssvm_predict(X_test=X_test, X_train=X_train, y_train=y_train)
    Acc = accuracy_score(y_test, y_hat)
    e_time = time()
    print("Accuracy =", Acc)
    print("Elapsed time =", e_time - s_time)
    s_time = time()
    model = SVC(kernel='rbf')
    model.fit(X_train, y_train.ravel())  # SVC expects a 1-D label vector, not a column
    y_hat = model.predict(X_test)
    Acc = accuracy_score(y_test, y_hat)
    e_time = time()
    print("Accuracy =", Acc)
    print("Elapsed time =", e_time - s_time)
For some reason the LS-SVM never manages to outperform the SVM; on some datasets, no matter how the parameters are tuned, its classification accuracy stays far below the SVM's.
Also, compared with the SVM, the LS-SVM does not seem to be particularly sensitive to the tolerance coefficient C.
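One way to check that observation directly is to sweep C over a small grid and train both models on the same split. The sketch below assumes it runs in the same script as above (so lssvm, X_train, X_test, y_train and y_test already exist); the grid of C values is only illustrative, not tuned.

# Minimal sketch for probing sensitivity to C (assumption: reuses the variables
# defined in the script above; the C grid is illustrative).
for C_value in [0.01, 0.1, 1.0, 10.0, 100.0]:
    ls_model = lssvm()
    ls_model.C = C_value
    ls_model.lssvm_fit(X_train=X_train, y_train=y_train)
    ls_pred = ls_model.lssvm_predict(X_test=X_test, X_train=X_train, y_train=y_train)
    svc_model = SVC(kernel='rbf', C=C_value)
    svc_model.fit(X_train, y_train.ravel())
    svc_pred = svc_model.predict(X_test)
    print("C =", C_value,
          "| LS-SVM accuracy =", accuracy_score(y_test, ls_pred),
          "| SVC accuracy =", accuracy_score(y_test, svc_pred))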