"""
A minimalistic Echo State Network demo with Mackey-Glass (delay 17) data
in "plain" scientific Python.
by Mantas Lukosevicius 2012
http://minds.jacobs-university.de/mantas
---
Modified by Xavier Hinaut: 19 November 2015.
http://www.xavierhinaut.com
Modified by Remy Portelas: 30 May 2016
https://github.com/rPortelas/ip_in_esn
Modified by Xiao Wei: 20 Oct 2020
https://goodgoodstudy.blog.csdn.net/article/details/109226320
"""
import numpy as np
import matplotlib.pyplot as plt
import scipy.linalg
import random
def set_seed(seed=None):
    """Set the seed for random values; draw one from the clock if None."""
    if seed is None:
        import time
        seed = int((time.time() * 10**6) % 2**32) #np.random.seed needs < 2**32
    try:
        random.seed(seed)
        np.random.seed(seed) #the reservoir weights below use np.random
        print("Seed used for random values:", seed)
    except Exception:
        print("!!! WARNING !!!: Seed was not set correctly.")
    return seed
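#usage: set_seed(42) makes a run reproducible; set_seed(None) draws a fresh
#seed from the clock and prints it so the run can be replayed later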
#reservoir neurons' activation function (reads the global
#'activation_function_mode' set below)
def sigmoid(x):
    if activation_function_mode == 'tanh':
        return np.tanh(x)
    elif activation_function_mode == 'fermi':
        return 1 / (1 + np.exp(-x)) #the logistic (Fermi) function
    else:
        raise Exception("ERROR: 'activation_function_mode' was not " + \
                        "set correctly.")
#plot the activation of all neurons in the reservoir during 1 epoch
def plot_activity(x, epoch):
    plt.figure(epoch+42).clear()
    if activation_function_mode == 'tanh':
        plt.hist(x.ravel(), bins=200)
        plt.xlim(-1, +1)
    else: #fermi
        plt.hist(x.ravel(), bins=100)
        plt.xlim(0, +1)
    plt.xlabel('neuron outputs')
    plt.ylabel('number of neurons')
    #compute some characteristics of the distribution
    mean = str(round(x.mean(), 2))
    med = str(round(np.median(x), 2))
    mn = str(round(x.min(), 2)) #avoid shadowing the built-ins min/max
    mx = str(round(x.max(), 2))
    std_dev = str(round(x.std(), 2))
    plt.title('Spatio-temporal distribution of the reservoir at epoch ' + \
              str(epoch) + '\n mean = ' + mean + ' median = ' + med + \
              ' min = ' + mn + ' max = ' + mx + ' std_dev = ' + std_dev)
def plot_neuron_activity(x, epoch):
    plt.figure(epoch+84).clear()
    if activation_function_mode == 'tanh':
        plt.hist(x.ravel(), bins=200)
        plt.xlim(-1, +1)
    else: #fermi
        plt.hist(x.ravel(), bins=100)
        plt.xlim(0, +1)
    plt.xlabel('neuron outputs')
    plt.ylabel('number of timesteps')
    plt.title('The output distribution of a single randomly chosen neuron ' + \
              'at epoch ' + str(epoch))
# load the data
trainLen = 4000 # includes prepareLen (the initial washout period)
prepareLen = 2000
testLen = 2000
data = np.loadtxt('../datasets/MackeyGlass_t17.txt')
print(data.shape)
# plot some of it
# plt.figure(10).clear()
# plt.plot(data[0:1000])
# plt.title('A sample of data')
# plt.show()
# mode = 'prediction' #given x(t), predict x(t+1) from the true signal
mode = 'generative' #feed each prediction back as the next input
activation_function_mode = 'tanh'
# activation_function_mode = 'fermi'
wout_mode = 'entries bias and resOut'
# wout_mode = 'resOut and bias only'
# ip_mode = 'intrinsic plasticity on'
ip_mode = 'intrinsic plasticity off'
#IP parameter: 'leaky neurons ignored' updates IP from the raw activation
#res_out, 'leaky neurons treated' updates it from the leaky state x
# ip_update_mode = 'leaky neurons treated'
ip_update_mode = 'leaky neurons ignored'
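#background for the IP updates in the training loop below: intrinsic
#plasticity adapts a per-neuron gain and bias in y = f(gain*z + bias) by
#gradient descent on the KL divergence between the neuron's output
#distribution and a target distribution -- exponential with mean m for
#fermi neurons (Triesch 2005), Gaussian with mean m and variance var for
#tanh neurons (Schrauwen et al. 2008); both share the coupled gain update
#delta_gain = lr/gain + delta_bias * z implemented below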
#set the number of training epochs
if ip_mode == 'intrinsic plasticity on':
if activation_function_mode == 'tanh':
nb_epoch = 3 #IP with tanh neurons needs less time to converge
else:
nb_epoch = 41
else: #if no IP, then we don't need multiple epochs of training
nb_epoch = 1
# generate the ESN reservoir
inSize = outSize = 1 #input/output dimension
resSize = 100 #reservoir size
a = 0.3 # leaking rate
if ip_mode == 'intrinsic plasticity on':
spectral_radius = 1.
reg = 0.02 #regularization coefficient
    #init Intrinsic Plasticity (IP)
lr = 0.001 #learning rate
if activation_function_mode == 'tanh':
m = 0. #mean
sigma = 0.2 #standard deviation 0.2 gives best results
var = np.square(sigma) #variance
else : #fermi
m = 0.2
    #allocate arrays to record the evolution of IP's gain and bias
ip_gain = np.ones((resSize, 1))
record_ip_gain = np.zeros(((nb_epoch-1) * trainLen , 1))
record_ip_bias = np.zeros(((nb_epoch-1) * trainLen , 1))
ip_bias = np.zeros((resSize, 1))
else : #IP off
    spectral_radius = 1.25
    reg = 1e-8 # regularization coefficient
#Win is scaled in both IP modes, so set input_scaling unconditionally
input_scaling = 1.
#change the seed; reservoir performance should be averaged across at least
#20 random instances (with the same set of parameters)
our_seed = None #Choose a seed or None
set_seed(our_seed)
#generation of random weights
Win = (np.random.rand(resSize,1+inSize)-0.5) * input_scaling
W = np.random.rand(resSize,resSize)-0.5
# Option 1 - direct scaling (quick&dirty, reservoir-specific):
#W *= 0.135
# Option 2 - normalizing and setting spectral radius (correct, slow):
print('Computing spectral radius...', end=' ')
rhoW = max(abs(np.linalg.eig(W)[0])) #maximal eigenvalue
print('done.')
W *= spectral_radius / rhoW
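# a faster variant of Option 2 for large reservoirs (a commented sketch;
# assumes scipy is available -- eigs estimates only the largest-magnitude
# eigenvalue instead of the full spectrum):
#from scipy.sparse.linalg import eigs
#rhoW = abs(eigs(W, k=1, which='LM', return_eigenvectors=False)[0])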
# allocate memory for the design (collected states) matrix
if wout_mode == 'entries bias and resOut':
X = np.zeros((1+inSize+resSize,trainLen))
elif wout_mode == 'resOut and bias only':
X = np.zeros((1+resSize,trainLen))
else :
raise Exception("ERROR: 'wout_mode' was not set correctly.")
#to display the spatio-temporal activity of an entire epoch
recorded_res_out = np.zeros((trainLen, resSize))
#choose a random neuron in the res to create a histogram of its activations
chosen_neuron = np.random.randint(resSize) #random_integers was removed from NumPy
neuron_out_records = np.zeros(trainLen)
# set the corresponding target matrix directly
Yt = data[None,1:trainLen+1]
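#so Yt[0,t] = data[t+1]: the one-step-ahead teacher signal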
# run the reservoir with the data and collect X
x = np.zeros((resSize,1))
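#the loop below implements the standard leaky-integrator ESN update
#x <- (1-a)*x + a*f(Win.[1;u] + W.x), with f reshaped by IP's gain and bias
#when intrinsic plasticity is on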
for epoch in range(nb_epoch):
for t in range(trainLen):
u = data[t]
res_in = np.dot( Win, np.vstack((1,u))) + np.dot( W, x )
#compute reservoir activations with or without IP
if ip_mode == 'intrinsic plasticity on':
res_out = sigmoid( ip_gain * res_in + ip_bias )
x = (1-a) * x + a * res_out
#compute delta_bias considering the activation function
#we don't want to train our network during the first epoch
if epoch != 0:
if activation_function_mode == 'tanh':
if ip_update_mode == 'leaky neurons ignored':
d_ip_bias = (-lr) * ((-(m / var)) + (res_out / var) * \
((2 * var) + 1 - np.square(res_out) + m * res_out))
elif ip_update_mode == 'leaky neurons treated':
d_ip_bias = (-lr) * ((-(m / var)) + (x / var ) * \
((2 * var) + 1 - np.square(x) + m * x))
else:
raise Exception("ERROR: 'ip_update_mode' was not " \
"set correctly.")
else: #fermi
if ip_update_mode == 'leaky neurons ignored':
d_ip_bias = lr * (1 - (2 + (1/m)) * res_out + \
(np.square(res_out) / m))
elif ip_update_mode == 'leaky neurons treated':
d_ip_bias = lr * (1 - (2 + (1/m)) * x + \
(np.square(x) / m))
else:
raise Exception("ERROR: 'ip_update_mode' was not " \
"set correctly.")
                #update IP's gain and bias (delta_gain couples to delta_bias)
ip_bias += d_ip_bias
ip_gain += (lr / ip_gain) + (d_ip_bias * res_in)
#store the results to plot them
record_ip_bias[t + (trainLen * (epoch-1)),0] = ip_bias.mean()
record_ip_gain[t + (trainLen * (epoch-1)),0] = ip_gain.mean()
elif ip_mode == 'intrinsic plasticity off':
res_out = sigmoid(res_in)
x = (1-a) * x + a * res_out
else:
raise Exception("ERROR: 'ip_mode' was not set correctly.")
        #accumulate the activations of a randomly chosen reservoir neuron
        neuron_out_records[t] = np.round(res_out[chosen_neuron, 0], 2)
#we perform linear regression after the last epoch of training
#so we only store the activations of the last epoch
if epoch == nb_epoch - 1 :
if wout_mode == 'entries bias and resOut':
X[:,t] = np.vstack((1,u,x))[:,0]
elif wout_mode == 'resOut and bias only':
X[:,t] = np.vstack((1,x))[:,0]
else:
raise Exception("ERROR: 'wout_mode' was not set correctly.")
#store spatio-temporal activity of the reservoir
recorded_res_out[t] = res_out[:,0]
#plot some signals to see if IP works
if activation_function_mode == 'tanh':
plot_activity(recorded_res_out, epoch)
plot_neuron_activity(neuron_out_records, epoch)
if activation_function_mode == 'fermi':
        if epoch % 20 == 0:
plot_activity(recorded_res_out, epoch)
plot_neuron_activity(neuron_out_records, epoch)
# plot the evolution of gain and bias during training
if ip_mode == 'intrinsic plasticity on':
plt.figure(10).clear()
plt.plot( record_ip_gain, label='gain' )
plt.plot( record_ip_bias, label='bias' )
plt.legend()
plt.ylabel('mean value')
plt.xlabel('number of timesteps')
plt.title('Evolution of the mean of gain and bias ' \
'relative to intrinsic plasticity')
# train the output, using the states after prepareLen
print(X.shape,Yt.shape)
X = X[:, prepareLen:]
Yt = Yt[:, prepareLen:]
X_T = X.T
# use ridge regression (linear regression with regularization)
if wout_mode == 'entries bias and resOut':
Wout = np.dot( np.dot(Yt,X_T), np.linalg.inv( np.dot(X,X_T) + \
reg*np.eye(1+inSize+resSize)))
elif wout_mode == 'resOut and bias only':
Wout = np.dot( np.dot(Yt,X_T), np.linalg.inv( np.dot(X,X_T) + \
reg*np.eye(1+resSize)))
else :
raise Exception("ERROR: 'wout_mode' was not set correctly.")
# use pseudo inverse
#Wout = np.dot( Yt, scipy.linalg.pinv(X) )
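# or solve the regularized normal equations directly (a sketch; avoids the
# explicit inverse and is numerically friendlier):
#A = np.dot(X, X_T) + reg*np.eye(X.shape[0])
#Wout = np.linalg.solve(A, np.dot(X, Yt.T)).T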
# run the trained ESN with the test set
Y = np.zeros((outSize,testLen))
u = data[trainLen]
for t in range(testLen):
res_in = np.dot( Win, np.vstack((1,u)) ) + np.dot( W, x )
if ip_mode == 'intrinsic plasticity on':
res_out = sigmoid(ip_gain * res_in + ip_bias )
elif ip_mode == 'intrinsic plasticity off':
res_out = sigmoid(res_in)
else:
raise Exception("ERROR: 'ip_mode' was not set correctly.")
x = (1-a) * x + a * res_out
if wout_mode == 'entries bias and resOut':
y = np.dot( Wout, np.vstack((1,u,x)) )
elif wout_mode == 'resOut and bias only':
y = np.dot( Wout, np.vstack((1,x)))
else :
raise Exception("ERROR: 'wout_mode' was not set correctly.")
Y[:,t] = y
if mode == 'generative':
# generative mode:
u = y
elif mode == 'prediction':
# predictive mode:
u = data[trainLen+t+1]
else:
raise Exception("ERROR: 'mode' was not set correctly.")
# compute MSE for the first errorLen time steps
errorLen = 1000
mse_for_each_t = np.square( data[trainLen+1:trainLen+errorLen+1] - \
Y[0,0:errorLen] )
mse = np.sum( mse_for_each_t ) / errorLen
print('MSE = ' + str( mse ))
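#an optional extra metric (a sketch): NRMSE, normalizing by the target's
#variance so runs on different signals are comparable
#nrmse = np.sqrt(mse / np.var(data[trainLen+1:trainLen+errorLen+1]))
#print('NRMSE = ' + str(nrmse))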
print('compared to the reference (Mantas) error 2.91524629066e-07 '\
      '(for prediction / 100 neurons)')
print('ratio to the reference (Mantas) error: ' + str(mse/2.91524629066e-07) + \
      ' (for prediction / 100 neurons)')
print("")
print('compared to the reference (Mantas) error 4.06986845044e-06 '\
      '(for generation / 1000 neurons)')
print('compared to the reference (Mantas) error 2.02529702465e-08 '\
      '(for prediction / 1000 neurons)')
plt.figure()
plt.plot(data[trainLen+1:trainLen+errorLen+1], label='target')
plt.plot(Y[0,0:errorLen], label='prediction')
plt.legend()
import seaborn as sns #imported lazily; only needed for this heatmap
plt.figure(figsize=(20,10))
ax = sns.heatmap(X[:,:1000]) #first 1000 collected state vectors
plt.figure()
plt.plot(Yt.T, color='k', label='y')
for i in range(9, 10): #plot a single collected state (row 9 of X)
    plt.plot(X[i], label=str(i))
plt.legend()
plt.show()