为什么网络学习效果不好（Tensorflow LSTM用于文本生成）？

"""Train a two-layer character-level LSTM with TFLearn and sample text from it.

Each pass of the main loop first writes two 500-character samples
(temperature 1.0 and 0.5) to ``pathfile/epoch_<i>_output.txt``, then trains
for one epoch and saves a checkpoint.  Sampling happens *before* ``fit`` in
every pass, so the file written on pass 0 is produced before any training
has run in this script.
"""
from __future__ import absolute_import, division, print_function

import os

import numpy as np
import tflearn
from tflearn.data_utils import *
from tflearn.layers.estimator import regression

# The window length is used by the data helper, the input layer, the
# generator and the seed sampler; keeping it in one place keeps them in sync.
CORPUS_PATH = "shakespeare_input.txt"
SEQ_MAXLEN = 20

# helper - vectorises text
inputs, targets, char_dict = textfile_to_semi_redundant_sequences(
    CORPUS_PATH, seq_maxlen=SEQ_MAXLEN)

# Network: input -> LSTM(512, returns full sequence) -> LSTM(512)
#          -> softmax over the character dictionary.
LSTM = tflearn.input_data([None, SEQ_MAXLEN, len(char_dict)])
LSTM = tflearn.lstm(LSTM, 512, return_seq=True, restore=True, dropout=0.5)
LSTM = tflearn.lstm(LSTM, 512, restore=True, dropout=0.5)
LSTM = tflearn.fully_connected(LSTM, len(char_dict), activation='softmax')
LSTM = tflearn.regression(LSTM, optimizer='adam',
                          loss='categorical_crossentropy',
                          learning_rate=0.001)

LSTMmodel = tflearn.SequenceGenerator(LSTM, dictionary=char_dict,
                                      seq_maxlen=SEQ_MAXLEN,
                                      clip_gradients=5.0,
                                      tensorboard_verbose=0,
                                      tensorboard_dir='pathfile/logs')

# Uncomment to resume from a previously saved checkpoint:
# LSTMmodel.load('/pathfile/LSTMmodel.tfl')

for i in range(10):
    print("-- TESTING...")
    starting = random_sequence_from_textfile(CORPUS_PATH, SEQ_MAXLEN)
    output_path = 'pathfile/epoch_' + str(i) + '_output.txt'
    generated_output = LSTMmodel.generate(500, temperature=1.0,
                                          seq_seed=starting)

    # Save the outputs to a text file - allows us to view progress of model.
    # The context manager guarantees the file is flushed and closed even if
    # the second generate() call raises.
    with open(output_path, "w") as text_file:
        # two different temperatures - higher temp = more novel
        text_file.write("With temperature 1.0: \n \n \n")
        text_file.write(generated_output)
        # lower temp = more accurate to original text
        generated_output = LSTMmodel.generate(500, temperature=0.5,
                                              seq_seed=starting)
        text_file.write("\n \n \n With temperature 0.5: \n \n \n")
        text_file.write(generated_output)

    print("-- TRAINING...")
    LSTMmodel.fit(inputs, targets, batch_size=200, n_epoch=1,
                  run_id='Shakespeare_Generator', shuffle=True)

    print("-- SAVING MODEL...")
    # Alternate between two checkpoint files so the save from the previous
    # pass is still on disk while the current one is being written.
    if i % 2 == 0:
        LSTMmodel.save("pathfile/LSTMmodel.tfl")
    else:
        LSTMmodel.save("pathfile//LSTMmodel2.tfl")
    print("-- EPOCH " + str(i+1) + " COMPLETE...")

1条回答

网友
1楼 · 发布于 2024-05-14 17:04:51

针对这个模型，我没有确切的答案。不过，你有没有试过从一个现成的、用 LSTM 生成莎士比亚风格文本的示例入手？比如这个：
https://github.com/sherjilozair/char-rnn-tensorflow
这样训练应该会快一些；而且如果从一个可以实际运行的示例开始，出错时定位和调试问题可能也会更容易。

相关问题更多 >

编程相关推荐

热门问题

热门文章