深度学习入门ch3a jupyter note

最新推荐文章于 2024-08-18 09:25:36 发布

renzao_ai

最新推荐文章于 2024-08-18 09:25:36 发布

阅读量268

点赞数

分类专栏： Python 深度学习 | 文章标签： sigmoid identity step_function softmax astype

本文链接：https://blog.csdn.net/zt5169/article/details/91129221

版权

Python 同时被 2 个专栏收录

58 篇文章 5 订阅

订阅专栏

深度学习

18 篇文章 1 订阅

订阅专栏

深度学习入门ch3a jupyter note

In [8]:

import numpy as np
# Threshold an array at zero and convert the boolean mask to integers.
x = np.array([-1.0, 1.0, 2.0])
print(x)
y = x > 0  # element-wise comparison yields a boolean array
print(y)
# np.int was only an alias of the builtin int; it was deprecated in
# NumPy 1.20 and removed in 1.24, so pass the builtin int instead.
y = y.astype(int)
print(y)
print(y.ndim)      # number of dimensions via the array attribute
print(np.ndim(y))  # same value via the module-level function

Output:

[-1.  1.  2.]
[False  True  True]
[0 1 1]
1
1

In [5]:

import matplotlib.pyplot as plt
%pylab inline

def sigmoid(x):
    """Return the logistic function 1 / (1 + exp(-x)) of ``x``.

    ``x`` may be a scalar or a NumPy array; the operation is applied
    element-wise and the result has the same shape as the input.
    """
    decay = np.exp(-x)
    return 1 / (1 + decay)


def step_function(x):
    """Return 1 where ``x > 0`` and 0 elsewhere, as an integer array.

    The comparison is evaluated element-wise and the boolean result is
    converted to integers. The builtin ``int`` is used as the dtype because
    the ``np.int`` alias was deprecated in NumPy 1.20 and removed in 1.24.
    """
    return np.array(x > 0, dtype=int)

# Sample the interval [-5.0, 5.0) in steps of 0.1 and evaluate both activations.
x = np.arange(-5.0, 5.0, 0.1)
y1 = sigmoid(x)
y2 = step_function(x)

# Draw both curves on the same axes; 'k--' is the format string for a black dashed line.
plt.plot(x, y1)
plt.plot(x, y2, 'k--')
plt.ylim(-0.1, 1.1) # set the y-axis range shown in the plot
plt.show()

Output:

Populating the interactive namespace from numpy and matplotlib

In [7]:

def relu(x):
    """Return the element-wise maximum of 0 and ``x`` (rectified linear unit)."""
    floor = 0
    return np.maximum(floor, x)

# Sample the interval [-5.0, 5.0) in steps of 0.1 and plot relu over it.
x = np.arange(-5.0, 5.0, 0.1)
y = relu(x)
plt.plot(x, y)
plt.ylim(-1.0, 5.5)  # set the y-axis range shown in the plot
plt.show()

Output:

In [16]:

def identity_function(x):
    """Return ``x`` unchanged (the same object, not a copy)."""
    return x

def softmax(x):
    """Return the softmax of ``x``.

    For a 2-D array the softmax is taken independently over each row.
    For any other number of dimensions it is taken over all elements
    together. The maximum is subtracted before exponentiating so that
    large inputs do not overflow in ``np.exp``.
    """
    if x.ndim != 2:
        shifted = x - np.max(x)  # overflow countermeasure
        exps = np.exp(shifted)
        return exps / np.sum(exps)

    # Work on the transpose so that each original row becomes a column and
    # the per-row max/sum broadcast along axis 0.
    cols = x.T
    cols = cols - np.max(cols, axis=0)
    exps = np.exp(cols)
    return (exps / np.sum(exps, axis=0)).T

#一般地，回归问题可以使用恒等函数，
#二元分类问题可以使用sigmoid 函数，
#多元分类问题可以使用softmax 函数。而输出层的softmax通常省略。

Output:

In [11]:

# Matrix product of a 2x3 matrix with a 3x2 matrix.
ma = np.array([[1, 2, 3],
               [4, 5, 6]])
mb = np.array([[1, 2],
               [3, 4],
               [5, 6]])
print(ma.shape, mb.shape, sep="\n")
print(ma.dot(mb))
# Shape rule: the inner dimensions must match; the result takes the outer ones.
#   A     dot    B
#  3x2          2x4   ->  3x4
#  3x5          5x4   ->  3x4

Output:

(2, 3)
(3, 2)
[[22 28]
 [49 64]]

In [19]:

# Forward pass through a network with three weight layers (W1, W2, W3), step by step
X = np.array([1.0, 0.5])
W1 = np.array([[0.1, 0.3, 0.5], [0.2, 0.4, 0.6]])
B1 = np.array([0.1, 0.2, 0.3])
print(W1.shape) # (2, 3)
print(X.shape) # (2,)
print(B1.shape) # (3,)
# Layer 1: weighted sum plus bias, followed by the sigmoid activation
A1 = np.dot(X, W1) + B1
Z1 = sigmoid(A1)
print(A1) # [0.3, 0.7, 1.1]
print(Z1) # [0.57444252, 0.66818777, 0.75026011]
W2 = np.array([[0.1, 0.4], [0.2, 0.5], [0.3, 0.6]])
B2 = np.array([0.1, 0.2])
print(Z1.shape) # (3,)
print(W2.shape) # (3, 2)
print(B2.shape) # (2,)
# Layer 2: same pattern, fed with the activations of layer 1
A2 = np.dot(Z1, W2) + B2
Z2 = sigmoid(A2)
print(Z2)
W3 = np.array([[0.1, 0.3], [0.2, 0.4]])
B3 = np.array([0.1, 0.2])
# Output layer: weighted sum plus bias, passed through the identity function
A3 = np.dot(Z2, W3) + B3
Y = identity_function(A3) # or simply Y = A3
print("output:")
print(Y)

Output:

(2, 3)
(2,)
(3,)
[0.3 0.7 1.1]
[0.57444252 0.66818777 0.75026011]
(3,)
(3, 2)
(2,)
[0.62624937 0.7710107 ]
output:
[0.31682708 0.69627909]

In [20]:

#whole view of nn code
def init_network():
    """Build and return the fixed parameters of the example network.

    Returns a dict mapping 'W1'/'W2'/'W3' to weight matrices of shape
    (2, 3), (3, 2) and (2, 2), and 'b1'/'b2'/'b3' to the matching bias
    vectors of length 3, 2 and 2.
    """
    return {
        'W1': np.array([[0.1, 0.3, 0.5], [0.2, 0.4, 0.6]]),
        'b1': np.array([0.1, 0.2, 0.3]),
        'W2': np.array([[0.1, 0.4], [0.2, 0.5], [0.3, 0.6]]),
        'b2': np.array([0.1, 0.2]),
        'W3': np.array([[0.1, 0.3], [0.2, 0.4]]),
        'b3': np.array([0.1, 0.2]),
    }

def forward(network, x):
    """Run ``x`` through the network and return the output-layer values.

    ``network`` is a dict holding weights under 'W1', 'W2', 'W3' and biases
    under 'b1', 'b2', 'b3'. The first two layers apply ``sigmoid`` to the
    weighted sum plus bias; the last layer applies ``identity_function``.
    """
    signal = x
    # Hidden layers: affine transform followed by sigmoid.
    for w_key, b_key in (('W1', 'b1'), ('W2', 'b2')):
        signal = sigmoid(np.dot(signal, network[w_key]) + network[b_key])
    # Output layer: affine transform passed through the identity function.
    return identity_function(np.dot(signal, network['W3']) + network['b3'])

# Script entry: build the network and run one forward pass on a sample input
network = init_network()
x = np.array([1.0, 0.5])
y = forward(network, x)
print(y) # [ 0.31682708 0.69627909]

Output: