TSNE-降维可视化，函数封装

最新推荐文章于 2025-04-04 13:19:37 发布

helloppc90

最新推荐文章于 2025-04-04 13:19:37 发布

阅读量434

点赞数

文章标签： python、可视化、机器学习

本文链接：https://blog.csdn.net/ZZcppc/article/details/110482157

版权

TSNE-降维可视化

from sklearn.manifold import TSNE
import pandas as pd
import numpy as np
from time import time
import matplotlib.pyplot as plt
import seaborn as sns

# Load the spreadsheet; the path is relative to the current working directory.
data_path = './dataset.xlsx'
train_data = pd.read_excel(data_path)
print(type(train_data))

# Work on a plain ndarray: the first six columns become `data` (used below as
# the t-SNE input) and every remaining column becomes `label`.
origin_data = np.array(train_data)
data = origin_data[:, :6]
label = origin_data[:, 6:]
print(label.shape)


def perform_tsne(X_data, y_data, perplexities, n_iter=1000, img_name_prefix='t-sne',
                 learning_rate=0.0001):
    """Run t-SNE once per perplexity and plot each 2-D embedding coloured by label.

    For every value in ``perplexities`` the data is embedded with
    ``sklearn.manifold.TSNE``, drawn as a seaborn scatter plot, saved to
    ``<img_name_prefix>_perp_<perplexity>_iter_<n_iter>.png`` in the current
    working directory, and then shown.

    Args:
        X_data: Feature matrix passed to ``TSNE.fit_transform``.
        y_data: Labels, one per row of ``X_data``; flattened to 1-D internally,
            so a column vector of shape (n, 1) is accepted.
        perplexities: Iterable of perplexity values to try.
        n_iter: Maximum number of optimisation iterations handed to TSNE.
        img_name_prefix: Prefix of the saved image file names.
        learning_rate: TSNE learning rate. The default keeps the value this
            script has always used; tune it for your data.

    Returns:
        None. The results are the saved image files and the displayed plots.
    """
    # Flatten the labels once, e.g. (700, 1) -> (700,), so they fit one DataFrame column.
    labels = np.asarray(y_data).reshape(-1)

    # lmplot needs exactly one marker per hue level, so build the list from the
    # number of distinct labels instead of assuming three classes. The first
    # three entries match the markers this function has always used.
    base_markers = ['^', 'v', 's', 'o', 'D', 'P', 'X', '*', '<', '>']
    n_classes = pd.Series(labels).nunique()
    markers = [base_markers[i % len(base_markers)] for i in range(n_classes)]

    for perplexity in perplexities:
        # perform t-sne
        print('\nperforming tsne with perplexity {} and with {} iterations at max'.format(perplexity, n_iter))

        # scikit-learn renamed TSNE's `n_iter` to `max_iter`; pick whichever
        # keyword the installed version exposes so n_iter is actually honoured.
        iter_kwarg = 'max_iter' if 'max_iter' in TSNE().get_params() else 'n_iter'
        tsne = TSNE(verbose=2, init='pca', random_state=0,
                    learning_rate=learning_rate, perplexity=perplexity,
                    **{iter_kwarg: n_iter})
        X_reduced = tsne.fit_transform(X_data)
        print(X_reduced)
        print('Done..')

        # prepare the data for seaborn
        print('Creating plot for this t-sne visualization..')
        df = pd.DataFrame({'x': X_reduced[:, 0], 'y': X_reduced[:, 1], 'label': labels})

        # `height` replaces the removed `size` keyword of lmplot.
        sns.lmplot(data=df, x='x', y='y', hue='label', fit_reg=False, height=8,
                   palette="Set1", markers=markers)
        plt.title("perplexity : {} and max_iter : {}".format(perplexity, n_iter))
        img_name = img_name_prefix + '_perp_{}_iter_{}.png'.format(perplexity, n_iter)
        print('saving this plot as image in present working directory...')
        # Keep a handle on the figure so it can be released after it is shown;
        # otherwise one figure per perplexity stays alive.
        fig = plt.gcf()
        fig.savefig(img_name)
        plt.show()
        plt.close(fig)
        print('Done')

# Features and labels prepared above are the inputs to the visualisation.
X_pre_tsne, y_pre_tsne = data, label

# Produce one plot per perplexity value.
perform_tsne(
    X_data=X_pre_tsne,
    y_data=y_pre_tsne,
    perplexities=[5, 10, 50, 100],
    n_iter=1000,
)