'''Sequence to sequence example in Keras (character-level).
This script demonstrates how to implement a basic character-level
sequence-to-sequence model. We apply it to translating
short English sentences into short French sentences,
character-by-character. Note that it is fairly unusual to
do character-level machine translation, as word-level
models are more common in this domain.

# Summary of the algorithm

- We start with input sequences from a domain (e.g. English sentences)
    and corresponding target sequences from another domain
    (e.g. French sentences).
- An encoder LSTM turns input sequences to 2 state vectors
    (we keep the last LSTM state and discard the outputs).
- A decoder LSTM is trained to turn the target sequences into
    the same sequence but offset by one timestep in the future,
    a training process called "teacher forcing" in this context.
    It uses as initial state the state vectors from the encoder.
    Effectively, the decoder learns to generate `targets[t+1...]`
    given `targets[...t]`, conditioned on the input sequence.
- 解码器LSTM被训练成将目标序列转换成相同的序列,但是在将来被一个时间步长偏移,
在此上下文中称为“teacher forcing”的训练过程。作为编码器的初始状态,有效地,译码器
学会在输入序列条件下生成“目标[t+1…] ]给定的‘目标[…t]’。
- In inference mode, when we want to decode unknown input sequences, we:
- 在推理模式中,当我们想要解码未知输入序列时,我们:
    - Encode the input sequence into state vectors
    - 将输入序列编码为状态向量
    - Start with a target sequence of size 1
        (just the start-of-sequence character)
    - 从大小为1的目标序列开始(只是序列字符的开始)
    - Feed the state vectors and 1-char target sequence
        to the decoder to produce predictions for the next character
    - 将状态向量和1-Char目标序列送到解码器以生成下一个字符的预测。
    - Sample the next character using these predictions
        (we simply use argmax).
    - 使用这些预测来采样下一个字符(我们只使用argmax)。
    - Append the sampled character to the target sequence
    - 采样的字符追加到目标序列
    - Repeat until we generate the end-of-sequence character or we
        hit the character limit.
    - 重复,直到产生序列结束字符或到达字符限制。

# Data download
English to French sentence pairs.
http://www.manythings.org/anki/fra-eng.zip

Lots of neat sentence pairs datasets can be found at:
http://www.manythings.org/anki/

# References
- Sequence to Sequence Learning with Neural Networks
    https://arxiv.org/abs/1409.3215
- Learning Phrase Representations using
    RNN Encoder-Decoder for Statistical Machine Translation
    https://arxiv.org/abs/1406.1078
'''
from __future__ import print_function

from keras.models import Model
from keras.layers import Input, LSTM, Dense
import numpy as np

batch_size = 64  # Batch size for training (number of samples per batch).
epochs = 100  # Number of epochs to train for.
latent_dim = 256  # Latent dimensionality of the encoding space.
num_samples = 10000  # Number of samples to train on.
# Path to the data txt file on disk.
# Download the dataset first and store it so that this relative path resolves.
data_path = 'fra-eng/fra.txt'

# Vectorize the data: collect the sentence pairs and both character
# vocabularies from the tab-separated data file.
input_texts = []
target_texts = []
input_characters = set()
target_characters = set()
with open(data_path, 'r', encoding='utf-8') as f:
    lines = f.read().split('\n')
# `len(lines) - 1` leaves out the last split element (presumably the empty
# string that follows the file's trailing newline).
for line in lines[: min(num_samples, len(lines) - 1)]:
    # Keep only the first two tab-separated fields (source, target) so that
    # any extra trailing columns are ignored.
    input_text, target_text = line.split('\t')[:2]
    # We use "tab" as the "start sequence" character for the targets,
    # and "\n" as the "end sequence" character.
    target_text = '\t' + target_text + '\n'
    input_texts.append(input_text)
    target_texts.append(target_text)
    # Sets ignore duplicates, so every character can be added directly.
    input_characters.update(input_text)
    target_characters.update(target_text)

# Sorting gives every character a stable position in its vocabulary.
input_characters = sorted(input_characters)
target_characters = sorted(target_characters)
num_encoder_tokens = len(input_characters)
num_decoder_tokens = len(target_characters)
max_encoder_seq_length = max(len(txt) for txt in input_texts)
max_decoder_seq_length = max(len(txt) for txt in target_texts)

# Print one line per dataset statistic, as "<label> <value>".
for label, value in (
        ('Number of samples:', len(input_texts)),
        ('Number of unique input tokens:', num_encoder_tokens),
        ('Number of unique output tokens:', num_decoder_tokens),
        ('Max sequence length for inputs:', max_encoder_seq_length),
        ('Max sequence length for outputs:', max_decoder_seq_length),
):
    print(label, value)

# Map every character to its integer index in the corresponding vocabulary.
input_token_index = {char: i for i, char in enumerate(input_characters)}
target_token_index = {char: i for i, char in enumerate(target_characters)}

# One-hot tensors shaped (samples, timesteps, vocabulary size). Timesteps
# past the end of a sentence are left all-zero.
encoder_input_data = np.zeros(
    (len(input_texts), max_encoder_seq_length, num_encoder_tokens),
    dtype='float32')
decoder_input_data = np.zeros(
    (len(input_texts), max_decoder_seq_length, num_decoder_tokens),
    dtype='float32')
decoder_target_data = np.zeros(
    (len(input_texts), max_decoder_seq_length, num_decoder_tokens),
    dtype='float32')

for i, (input_text, target_text) in enumerate(zip(input_texts, target_texts)):
    for t, char in enumerate(input_text):
        encoder_input_data[i, t, input_token_index[char]] = 1.
    for t, char in enumerate(target_text):
        # decoder_target_data is ahead of decoder_input_data by one timestep
        decoder_input_data[i, t, target_token_index[char]] = 1.
        if t > 0:
            # decoder_target_data will be ahead by one timestep
            # and will not include the start character.
            decoder_target_data[i, t - 1, target_token_index[char]] = 1.

# Define an input sequence and process it.
encoder_inputs = Input(shape=(None, num_encoder_tokens))
encoder = LSTM(latent_dim, return_state=True)
encoder_outputs, state_h, state_c = encoder(encoder_inputs)
# We discard `encoder_outputs` and only keep the states.
encoder_states = [state_h, state_c]

# Set up the decoder, using `encoder_states` as initial state.
decoder_inputs = Input(shape=(None, num_decoder_tokens))
# We set up our decoder to return full output sequences,
# and to return internal states as well. We don't use the
# return states in the training model, but we will use them in inference.
decoder_lstm = LSTM(latent_dim, return_sequences=True, return_state=True)
decoder_outputs, _, _ = decoder_lstm(decoder_inputs,
                                     initial_state=encoder_states)
# Softmax over the target vocabulary at every decoder timestep.
decoder_dense = Dense(num_decoder_tokens, activation='softmax')
decoder_outputs = decoder_dense(decoder_outputs)

# Define the model that will turn
# `encoder_input_data` & `decoder_input_data` into `decoder_target_data`
model = Model([encoder_inputs, decoder_inputs], decoder_outputs)

# Run training, holding out 20% of the samples for validation.
model.compile(optimizer='rmsprop', loss='categorical_crossentropy')
model.fit([encoder_input_data, decoder_input_data], decoder_target_data,
          batch_size=batch_size,
          epochs=epochs,
          validation_split=0.2)
# Save model
model.save('s2s.h5')

# Next: inference mode (sampling).
# Here's the drill:
# 1) Encode the input and retrieve the initial decoder state.
# 2) Run one step of the decoder with this initial state
#    and a "start of sequence" token as target.
#    The output will be the next target token.
# 3) Repeat with the current target token and current states.

# Define sampling models
# The encoder model maps an input sequence to the encoder's [h, c] states.
encoder_model = Model(encoder_inputs, encoder_states)

# The decoder model receives the LSTM states as explicit inputs and returns
# the updated states next to its predictions, so they can be fed back in on
# the following step.
decoder_state_input_h = Input(shape=(latent_dim,))
decoder_state_input_c = Input(shape=(latent_dim,))
decoder_states_inputs = [decoder_state_input_h, decoder_state_input_c]
# The `decoder_lstm` and `decoder_dense` layers defined earlier are called
# again here on the new state inputs.
decoder_outputs, state_h, state_c = decoder_lstm(
    decoder_inputs, initial_state=decoder_states_inputs)
decoder_states = [state_h, state_c]
decoder_outputs = decoder_dense(decoder_outputs)
decoder_model = Model(
    [decoder_inputs] + decoder_states_inputs,
    [decoder_outputs] + decoder_states)

# Invert the token dictionaries (index -> character) so that predicted
# indices can be turned back into readable text.
reverse_input_char_index = {
    index: char for char, index in input_token_index.items()}
reverse_target_char_index = {
    index: char for char, index in target_token_index.items()}

def decode_sequence(input_seq):
    """Greedily decode one input sequence into a target string.

    The input is passed through `encoder_model` once to obtain the initial
    decoder states. `decoder_model` is then run one character at a time,
    starting from the tab start character; at each step the most probable
    character (argmax) is appended to the result and fed back as the next
    decoder input together with the updated states.

    Args:
        input_seq: Encoder input handed to `encoder_model.predict`.
            The decoding loop assumes a batch of size 1.

    Returns:
        The decoded string. It ends with "\\n" when the end character was
        sampled; otherwise decoding stops once the string is longer than
        `max_decoder_seq_length`.
    """

    def _one_hot_step(token_index):
        # Single-timestep, single-sample one-hot decoder input.
        step = np.zeros((1, 1, num_decoder_tokens))
        step[0, 0, token_index] = 1.
        return step

    # Encode the input as state vectors.
    states_value = encoder_model.predict(input_seq)

    # Length-1 target sequence holding only the start character.
    target_seq = _one_hot_step(target_token_index['\t'])

    decoded_sentence = ''
    while True:
        output_tokens, h, c = decoder_model.predict(
            [target_seq] + states_value)

        # Pick the most probable token at the last timestep.
        sampled_token_index = np.argmax(output_tokens[0, -1, :])
        sampled_char = reverse_target_char_index[sampled_token_index]
        decoded_sentence += sampled_char

        # Exit condition: either find the stop character
        # or hit the max length.
        if sampled_char == '\n':
            break
        if len(decoded_sentence) > max_decoder_seq_length:
            break

        # Feed the sampled token and the new states into the next step.
        target_seq = _one_hot_step(sampled_token_index)
        states_value = [h, c]

    return decoded_sentence

# Try out decoding on the first sequences of the training set. The bound
# keeps the loop inside the data when fewer than 100 samples were loaded.
for seq_index in range(min(100, len(input_texts))):
    # Slice (rather than index) so the batch dimension of size 1 is kept.
    input_seq = encoder_input_data[seq_index: seq_index + 1]
    decoded_sentence = decode_sequence(input_seq)
    print('Input sentence:', input_texts[seq_index])
    print('Decoded sentence:', decoded_sentence)


C:\ProgramData\Anaconda3\python.exe E:/keras-master/examples/lstm_seq2seq.py
Using TensorFlow backend.
Number of samples: 10000
Number of unique input tokens: 71
Number of unique output tokens: 94
Max sequence length for inputs: 16
Max sequence length for outputs: 59
Train on 8000 samples, validate on 2000 samples
Epoch 1/100

8000/8000 [==============================] - 25s 3ms/step - loss: 0.9274 - val_loss: 1.0000
Epoch 2/100

Epoch 100/100

8000/8000 [==============================] - 19s 2ms/step - loss: 0.0588 - val_loss: 0.7629
E:\keras-master\keras\engine\topology.py:2365: UserWarning: Layer lstm_2 was passed non-serializable keyword arguments: {'initial_state': [<tf.Tensor 'lstm_1/while/Exit_2:0' shape=(?, 256) dtype=float32>, <tf.Tensor 'lstm_1/while/Exit_3:0' shape=(?, 256) dtype=float32>]}. They will not be included in the serialized model (and thus will be missing at deserialization time).
  str(node.arguments) + '. They will not be included '
Input sentence: Go.
Decoded sentence: Va !

Input sentence: Run!
Decoded sentence: Cours !

Input sentence: Run!
Decoded sentence: Cours !

Input sentence: Fire!
Decoded sentence: Au feu !

Input sentence: Help!
Decoded sentence: À l'aide !

Input sentence: Jump.
Decoded sentence: Saute.

Input sentence: Stop!
Decoded sentence: Arrête-toi !

Input sentence: Stop!
Decoded sentence: Arrête-toi !

Input sentence: Stop!
Decoded sentence: Arrête-toi !

Input sentence: Wait!
Decoded sentence: Attends !

Input sentence: Wait!
Decoded sentence: Attends !

Input sentence: Go on.
Decoded sentence: Continuez.

Input sentence: Go on.
Decoded sentence: Continuez.

Input sentence: Go on.
Decoded sentence: Continuez.

Input sentence: I see.
Decoded sentence: Je vois une lumière.

Input sentence: I try.
Decoded sentence: J'essaye.

Input sentence: I won!
Decoded sentence: J'ai demandé à dore.

Input sentence: I won!
Decoded sentence: J'ai demandé à dore.

Input sentence: Oh no!
Decoded sentence: Oh non !

Input sentence: Attack!
Decoded sentence: Attaquez !

Input sentence: Attack!
Decoded sentence: Attaquez !

Input sentence: Cheers!
Decoded sentence: À votre santé !

Input sentence: Cheers!
Decoded sentence: À votre santé !

Input sentence: Cheers!
Decoded sentence: À votre santé !

Input sentence: Cheers!
Decoded sentence: À votre santé !

Input sentence: Get up.
Decoded sentence: Lève-toi.

Input sentence: Go now.
Decoded sentence: Va doucement !

Input sentence: Go now.
Decoded sentence: Va doucement !

Input sentence: Go now.
Decoded sentence: Va doucement !

Input sentence: Got it!
Decoded sentence: Compris !

Input sentence: Got it!
Decoded sentence: Compris !

Input sentence: Got it?
Decoded sentence: Compris ?

Input sentence: Got it?
Decoded sentence: Compris ?

Input sentence: Got it?
Decoded sentence: Compris ?

Input sentence: Hop in.
Decoded sentence: Montez.

Input sentence: Hop in.
Decoded sentence: Montez.

Input sentence: Hug me.
Decoded sentence: Serre-moi dans tes bras !

Input sentence: Hug me.
Decoded sentence: Serre-moi dans tes bras !

Input sentence: I fell.
Decoded sentence: Je suis tombée.

Input sentence: I fell.
Decoded sentence: Je suis tombée.

Input sentence: I know.
Decoded sentence: Je sais.

Input sentence: I left.
Decoded sentence: Je suis parti.

Input sentence: I left.
Decoded sentence: Je suis parti.

Input sentence: I lost.
Decoded sentence: J'ai perdu.

Input sentence: I'm 19.
Decoded sentence: J'ai les chocontes.

Input sentence: I'm OK.
Decoded sentence: Je vais bien.

Input sentence: I'm OK.
Decoded sentence: Je vais bien.

Input sentence: Listen.
Decoded sentence: Écoutez !

Input sentence: No way!
Decoded sentence: C'est exclu !

Input sentence: No way!
Decoded sentence: C'est exclu !

Input sentence: No way!
Decoded sentence: C'est exclu !

Input sentence: No way!
Decoded sentence: C'est exclu !

Input sentence: No way!
Decoded sentence: C'est exclu !

Input sentence: No way!
Decoded sentence: C'est exclu !

Input sentence: No way!
Decoded sentence: C'est exclu !

Input sentence: No way!
Decoded sentence: C'est exclu !

Input sentence: No way!
Decoded sentence: C'est exclu !

Input sentence: Really?
Decoded sentence: Vrai ?

Input sentence: Really?
Decoded sentence: Vrai ?

Input sentence: Really?
Decoded sentence: Vrai ?

Input sentence: Thanks.
Decoded sentence: Merci !

Input sentence: We try.
Decoded sentence: On essaye.

Input sentence: We won.
Decoded sentence: Nous avons réveillé.

Input sentence: We won.
Decoded sentence: Nous avons réveillé.

Input sentence: We won.
Decoded sentence: Nous avons réveillé.

Input sentence: We won.
Decoded sentence: Nous avons réveillé.

Input sentence: Ask Tom.
Decoded sentence: Demande-leur.

Input sentence: Awesome!
Decoded sentence: Faisalez-moi !

Input sentence: Be calm.
Decoded sentence: Sois calme !

Input sentence: Be calm.
Decoded sentence: Sois calme !

Input sentence: Be calm.
Decoded sentence: Sois calme !

Input sentence: Be cool.
Decoded sentence: Sois détendu !

Input sentence: Be fair.
Decoded sentence: Soyez équitables !

Input sentence: Be fair.
Decoded sentence: Soyez équitables !

Input sentence: Be fair.
Decoded sentence: Soyez équitables !

Input sentence: Be fair.
Decoded sentence: Soyez équitables !

Input sentence: Be fair.
Decoded sentence: Soyez équitables !

Input sentence: Be fair.
Decoded sentence: Soyez équitables !

Input sentence: Be kind.
Decoded sentence: Sois gentil.

Input sentence: Be nice.
Decoded sentence: Sois gentille !

Input sentence: Be nice.
Decoded sentence: Sois gentille !

Input sentence: Be nice.
Decoded sentence: Sois gentille !

Input sentence: Be nice.
Decoded sentence: Sois gentille !

Input sentence: Be nice.
Decoded sentence: Sois gentille !

Input sentence: Be nice.
Decoded sentence: Sois gentille !

Input sentence: Beat it.
Decoded sentence: Dégage !

Input sentence: Call me.
Decoded sentence: Appellez-moi !

Input sentence: Call me.
Decoded sentence: Appellez-moi !

Input sentence: Call us.
Decoded sentence: Appelle-nous !

Input sentence: Call us.
Decoded sentence: Appelle-nous !

Input sentence: Come in.
Decoded sentence: Entrez !

Input sentence: Come in.
Decoded sentence: Entrez !

Input sentence: Come in.
Decoded sentence: Entrez !

Input sentence: Come in.
Decoded sentence: Entrez !

Input sentence: Come on!
Decoded sentence: Allez !

Input sentence: Come on.
Decoded sentence: Viens !

Input sentence: Come on.
Decoded sentence: Viens !

Input sentence: Come on.
Decoded sentence: Viens !

Input sentence: Drop it!
Decoded sentence: Laissez-le tomber !

Input sentence: Drop it!
Decoded sentence: Laissez-le tomber !

# Question (translated): the code below raised
# "__init__() missing 1 required positional argument: 'cell'" in TensorFlow.
# Cause: `ConvRNN2D` was instantiated with `filters`/`kernel_size` but without
# the `cell` argument its constructor requires (per the error message).
# `tf.keras.layers.ConvLSTM2D` accepts those arguments directly and is used
# in its place below.
class Model():
    """Builds a generator, a discriminator, and a combined model chaining them.

    The generator takes a (10, 128, 128, 3) image sequence; the discriminator
    takes such a sequence together with a (128, 128, 3) image. Expects `tf`
    and `dataset` to be defined by the surrounding module.
    """

    def __init__(self):
        self.img_seq_shape = (10, 128, 128, 3)
        self.img_shape = (128, 128, 3)
        self.train_img = dataset
        # self.test_img=dataset_T
        patch = int(128 / 2 ** 4)
        self.disc_patch = (patch, patch, 1)
        self.optimizer = tf.keras.optimizers.Adam(learning_rate=0.001)

        # NOTE: these assignments replace the builder methods on this
        # instance with the models they return.
        self.build_generator = self.build_generator()
        self.build_discriminator = self.build_discriminator()
        self.build_discriminator.compile(loss='binary_crossentropy',
                                         optimizer=self.optimizer,
                                         metrics=['accuracy'])
        self.build_generator.compile(loss='binary_crossentropy',
                                     optimizer=self.optimizer)

        # `tf.keras.layers.Input` is used (instead of a bare `Input`) so all
        # layers of the class come from the same Keras implementation.
        img_seq_A = tf.keras.layers.Input(shape=self.img_seq_shape)  # input image sequence
        img_B = tf.keras.layers.Input(shape=self.img_shape)  # target image
        fake_B = self.build_generator(img_seq_A)  # generated (fake) target image

        # The discriminator is frozen before it is wired into the combined
        # model.
        self.build_discriminator.trainable = False
        valid = self.build_discriminator([img_seq_A, fake_B])

        self.combined = tf.keras.models.Model([img_seq_A, img_B],
                                              [valid, fake_B])
        self.combined.compile(loss=['binary_crossentropy', 'mse'],
                              loss_weights=[1, 100],
                              optimizer=self.optimizer,
                              metrics=['accuracy'])

    def build_generator(self):
        """Return the generator model: image sequence in, 3-filter Conv2D output."""

        def conv2d(inputs, filters, kernel_size, strides):
            # Conv2D -> BatchNormalization -> LeakyReLU.
            x = tf.keras.layers.Conv2D(filters, kernel_size, strides,
                                       'same')(inputs)
            x = tf.keras.layers.BatchNormalization()(x)
            x = tf.keras.layers.LeakyReLU(alpha=0.2)(x)
            return x

        def res_net(inputs, filters):
            # Two conv2d stages plus a skip connection. Currently not used by
            # the generator graph below.
            x = inputs
            net = conv2d(x, filters // 2, (1, 1), 1)
            net = conv2d(net, filters, (3, 3), 1)
            net = net + x
            # net=tf.keras.layers.LeakyReLU(0.2)(net)
            return net

        d0 = tf.keras.layers.Input(shape=(10, 128, 128, 3))
        # ConvLSTM2D replaces the bare ConvRNN2D, which cannot be built
        # without a `cell`.
        out = tf.keras.layers.ConvLSTM2D(filters=32, kernel_size=3,
                                         padding='same')(d0)
        out = tf.keras.layers.Conv2D(3, 1, 1, 'same')(out)
        return tf.keras.Model(inputs=d0, outputs=out)

    def build_discriminator(self):
        """Return the discriminator model over an (image sequence, image) pair."""

        def d_layer(layer_input, filters, f_size=4, bn=True):
            # Stride-2 Conv2D, optional BatchNormalization, then LeakyReLU.
            d = tf.keras.layers.Conv2D(filters, kernel_size=f_size, strides=2,
                                       padding='same')(layer_input)
            if bn:
                d = tf.keras.layers.BatchNormalization(momentum=0.8)(d)
            d = tf.keras.layers.LeakyReLU(alpha=0.2)(d)
            return d

        img_A = tf.keras.layers.Input(shape=(10, 128, 128, 3))
        img_B = tf.keras.layers.Input(shape=(128, 128, 3))
        df = 32

        # ConvLSTM2D replaces the bare ConvRNN2D, which cannot be built
        # without a `cell`.
        lstm_out = tf.keras.layers.ConvLSTM2D(filters=df, kernel_size=4,
                                              padding="same")(img_A)
        lstm_out = tf.keras.layers.LeakyReLU(alpha=0.2)(lstm_out)
        combined_imgs = tf.keras.layers.Concatenate(axis=-1)([lstm_out, img_B])

        d1 = d_layer(combined_imgs, df)  # 64
        d2 = d_layer(d1, df * 2)  # 32
        d3 = d_layer(d2, df * 4)  # 16
        d4 = d_layer(d3, df * 8)  # 8

        validity = tf.keras.layers.Conv2D(1, kernel_size=4, strides=1,
                                          padding='same')(d4)
        return tf.keras.Model([img_A, img_B], validity)
