PyTorch Lecture12：RNN1 - Basics-CSDN博客

本文链接：https://blog.csdn.net/zhuoyuezai/article/details/80711801

代码1

import torch
import torch.nn as nn
from torch.autograd import Variable

# Shape walkthrough for nn.RNN using the characters of 'hello'.
#
# Four scenarios are run in order, each printing the input and output sizes:
#   1. one time step at a time          (batch=1, seq_len=1)
#   2. the whole sequence in one call   (batch=1, seq_len=5)
#   3. a batch of three sequences       (batch=3, seq_len=5, batch_first=True)
#   4. the same batch, sequence-major   (seq_len=5, batch=3, batch_first=False)
#
# Tensors are fed to the RNN directly. The torch.autograd.Variable wrapper is
# deprecated (PyTorch >= 0.4) and merely returns the tensor it is given, so it
# is not used here.

# One-hot encoding for each distinct char in 'hello'
h = [1, 0, 0, 0]
e = [0, 1, 0, 0]
l = [0, 0, 1, 0]
o = [0, 0, 0, 1]

# ---------------------------------------------------------------------------
# 1. One step at a time
# ---------------------------------------------------------------------------
# One cell RNN: input_dim (4) -> output_dim (2)
cell = nn.RNN(input_size=4, hidden_size=2, batch_first=True)

# Initial hidden state: (num_layers * num_directions, batch, hidden_size).
# This layout is the same whether batch_first is True or False.
hidden = torch.randn(1, 1, 2)

# 'hello' as a (seq_len=5, input_size=4) float tensor
inputs = torch.tensor([h, e, l, l, o], dtype=torch.float32)
for one in inputs:
    # Reshape a single char to (batch=1, seq_len=1, input_size=4), the layout
    # expected when batch_first=True.
    one = one.view(1, 1, -1)
    # The returned hidden state is fed back in on the next iteration.
    out, hidden = cell(one, hidden)
    print("one input size", one.size(), "out.size", out.size())

# ---------------------------------------------------------------------------
# 2. The whole sequence at once
# ---------------------------------------------------------------------------
# Input: (batch, seq_len, input_size) when batch_first=True
inputs = inputs.view(1, 5, -1)
# `hidden` is the state left behind by the step-by-step loop above.
out, hidden = cell(inputs, hidden)
print("sequence input  size", inputs.size(), "out size", out.size())

# ---------------------------------------------------------------------------
# 3. A batch of three sequences (batch_first=True)
# ---------------------------------------------------------------------------
# Fresh hidden state sized for batch=3:
# (num_layers * num_directions, batch, hidden_size)
hidden = torch.randn(1, 3, 2)

# 3 sequences: 'hello', 'eolll', 'lleel' -> shape (3, 5, 4)
inputs = torch.tensor(
    [
        [h, e, l, l, o],
        [e, o, l, l, l],
        [l, l, e, e, l],
    ],
    dtype=torch.float32,
)

# Input: (batch, seq_len, input_size) when batch_first=True, i.e. B x S x I
out, hidden = cell(inputs, hidden)
print("batch input size", inputs.size(), "out size", out.size())

# ---------------------------------------------------------------------------
# 4. The same batch in sequence-major layout (batch_first=False, the default)
# ---------------------------------------------------------------------------
# A new one cell RNN: input_dim (4) -> output_dim (2)
cell = nn.RNN(input_size=4, hidden_size=2)

# Swap dim0 and dim1: (batch, seq_len, input_size) -> (seq_len, batch, input_size)
inputs = inputs.transpose(0, 1)

# Input: (seq_len, batch, input_size) when batch_first=False, i.e. S x B x I.
# `hidden` is the (1, 3, 2) state returned by the previous call; it is reused
# here as the initial state of the new cell.
out, hidden = cell(inputs, hidden)
print("batch input size", inputs.size(), "out size", out.size())