基於RNN(二)唐詩生成
- 本篇博文就是手寫數字識別的一個升級版本,天天手寫數字都厭煩了,索性在網上找了個有趣的例程唐詩生成.
- 本博文是學完RNN的一個小練習,讀懂全部程式你會對LSTM有更深的理解.
參考:
......
先看結果:
'''
求得能名及八鸚,把盤猶舒熱龍鱗。
贊娟從荀繞苔寢,唯有泉聲細洞房。
求耕遐老數三秦,豈汝百驄濾自能。
關朝酒別詞堪愁,愁向長雲寄白頭。
注農滿映雲滿嫌,此翩逼時朝方清。
'''
網路流程:
- 收集唐詩資料-->>點選下載
- 分析資料-->>生成詞向量
- 生成get_batch函式
- 批量對詩進行訓練
- 確保精度 / 儲存模型
- 生成唐詩(隱含詩)
特殊說明:
生成詞向量會略去很少的生僻字
資料缺失進行填充
批量訓練對長短不齊的詩進行補全,以長的為標準
生成詩的過程使用了隨機性(random),如果不使用隨機性,那麼每次生成的詩都一樣。源程式對概率大的詩進行了保留大概率,下圖簡單說明一下:
對於生成五言和七言詩有缺陷,得一直達到要求才可以返回
if len(sentence) == 2 + 2 * type:
    sentence += u'\n'
    poem += sentence
    flag = False
程式碼:
#這裡就不放程式碼了,那麼多程式碼,我不信你在微信上面看完!!!還是點選後面的閱讀全文進行觀察吧~~
#!/usr/bin/python3
# -*- coding: UTF-8 -*-
import collections
import numpy as np
import tensorflow as tf
import os
#os.environ["CUDA_VISIBLE_DEVICES"] = "0"#設定GPU為gtx1060
'''
author: log16
Data: 2017/5/4
'''
# -------------------------------資料預處理---------------------------#
# Corpus file: one poem per line, formatted as "title:content".
poetry_file = os.getcwd()+'/poetry.txt'

# Cleaned poems, each wrapped in '[' ... ']' start/end markers.
poetrys = []
# Decode explicitly as UTF-8 so reading does not depend on the platform's
# default locale encoding.
with open(poetry_file, "r", encoding="utf-8") as f:
    for line in f:
        line = line.strip(u'\n')
        try:
            title, content = line.strip(u' ').split(u':')
        except ValueError:
            # The line does not split into exactly "title:content"; skip it.
            continue
        content = content.replace(u' ', u'')
        # Skip poems that contain annotation/markup characters.
        # NOTE(review): the original condition tested u'(' twice; one of them
        # was probably meant to be another bracket character. The filter is
        # left unchanged so the vocabulary stays compatible with checkpoints.
        if any(mark in content for mark in (u'_', u'(', u'《', u'[')):
            continue
        # Keep only poems of 5 to 79 characters.
        if len(content) < 5 or len(content) > 79:
            continue
        poetrys.append(u'[' + content + u']')

# Sort poems by length (stable, shortest first).
poetrys.sort(key=len)
print('唐詩總數: ', len(poetrys))
if not poetrys:
    # Fail with a clear message instead of an obscure unpacking error below.
    raise ValueError('no usable poems found in ' + poetry_file)

# Count how often every character occurs.
all_words = []
for poetry in poetrys:
    all_words.extend(poetry)
counter = collections.Counter(all_words)
count_pairs = sorted(counter.items(), key=lambda x: -x[1])
words, _ = zip(*count_pairs)
# Vocabulary: every character by descending frequency, plus a trailing ' '
# that is used as the padding symbol.
words = words + (' ',)
# Map each character to its integer ID (its index in ``words``).
word_num_map = dict(zip(words, range(len(words))))


def to_num(word):
    """Return the integer ID of ``word`` (``len(words)`` if it is unknown)."""
    return word_num_map.get(word, len(words))


# Poems as lists of character IDs,
# e.g. [[314, 3199, 367, ..., 98, 1], [339, 3, 133, ..., 809, 1], ...]
poetrys_vector = [list(map(to_num, poetry)) for poetry in poetrys]

# Train on 64 poems per batch.
batch_size = 64
n_chunk = len(poetrys_vector) // batch_size
#利用序列對原始資料進行隨機化的抽取batch和enpoch
class DataSet(object):
    """Serve padded (input, target) batches from ``poetrys_vector``.

    Batches are taken through an index array that is reshuffled every time
    an epoch is completed.
    """

    def __init__(self, data_size):
        self._data_size = data_size
        self._epochs_completed = 0  # number of finished passes over the data
        self._index_in_epoch = 0  # read position inside the current pass
        self._data_index = np.arange(data_size)  # indirection into the data

    def next_batch(self, batch_size):
        """Return the next ``(xdata, ydata)`` pair of ``batch_size`` rows."""
        begin = self._index_in_epoch
        stop = begin + batch_size
        if stop > self._data_size:
            # Not enough rows left: reshuffle and restart from the front.
            np.random.shuffle(self._data_index)
            self._epochs_completed += 1
            self._index_in_epoch = batch_size
            return self.data_batch(0, batch_size)

        self._index_in_epoch = stop
        features, labels = self.data_batch(begin, stop)
        if stop == self._data_size:
            # The batch ended exactly on the last row: start a new epoch.
            self._index_in_epoch = 0
            self._epochs_completed += 1
            np.random.shuffle(self._data_index)
        return features, labels

    def data_batch(self, start, end):
        """Build padded arrays for index positions ``start`` .. ``end - 1``."""
        picked = [poetrys_vector[self._data_index[k]] for k in range(start, end)]
        width = max(len(seq) for seq in picked)  # longest sequence in the batch
        # Shorter rows are right-padded with the ID of ' '.
        xdata = np.full((end - start, width), word_num_map[' '], np.int32)
        for r, seq in enumerate(picked):
            xdata[r, :len(seq)] = seq
        # Targets are the inputs shifted one step to the left; the last
        # column keeps the input's own value.
        ydata = np.copy(xdata)
        ydata[:, :-1] = xdata[:, 1:]
        return xdata, ydata
# ---------------------------------------RNN--------------------------------------#
# Graph inputs: int32 placeholders declared with shape [batch_size, None]
# (the second dimension is left unspecified).
input_data = tf.placeholder(tf.int32, [batch_size, None])
# Training targets, declared with the same dtype and shape as input_data.
output_targets = tf.placeholder(tf.int32, [batch_size, None])
# 定義RNN
def neural_network(model='lstm', rnn_size=128, num_layers=2):
    """Build the character-level RNN language-model graph.

    Args:
        model: Cell type, one of ``'rnn'``, ``'gru'`` or ``'lstm'``.
        rnn_size: Units per cell; also used as the embedding width.
        num_layers: Number of stacked recurrent layers.

    Returns:
        Tuple ``(logits, last_state, probs, cell, initial_state)``. ``logits``
        and ``probs`` have one row per (sequence, time step) pair and one
        column per vocabulary entry.

    Raises:
        ValueError: If ``model`` is not a supported cell type.
    """
    # Validate first so a typo fails with a clear message instead of an
    # UnboundLocalError on the cell constructor.
    if model not in ('rnn', 'gru', 'lstm'):
        raise ValueError("model must be 'rnn', 'gru' or 'lstm', got %r" % (model,))

    if model == 'lstm':
        cell = tf.nn.rnn_cell.BasicLSTMCell(rnn_size, state_is_tuple=True)
    elif model == 'gru':
        # GRUCell/BasicRNNCell do not take state_is_tuple; passing it (as the
        # previous code did) raises TypeError.
        cell = tf.nn.rnn_cell.GRUCell(rnn_size)
    else:
        cell = tf.nn.rnn_cell.BasicRNNCell(rnn_size)
    # NOTE(review): the same cell object is repeated for every layer. Depending
    # on the TensorFlow 1.x release this may share weights or be rejected;
    # switching to one cell per layer changes variable names, so it is left
    # as-is to stay compatible with existing checkpoints — confirm.
    cell = tf.nn.rnn_cell.MultiRNNCell([cell] * num_layers, state_is_tuple=True)
    initial_state = cell.zero_state(batch_size, tf.float32)

    with tf.variable_scope('rnnlm'):
        softmax_w = tf.get_variable("softmax_w", [rnn_size, len(words)])
        softmax_b = tf.get_variable("softmax_b", [len(words)])
        with tf.device("/gpu:0"):
            # One rnn_size-wide embedding row per vocabulary entry.
            embedding = tf.get_variable("embedding", [len(words), rnn_size])
            inputs = tf.nn.embedding_lookup(embedding, input_data)

    outputs, last_state = tf.nn.dynamic_rnn(cell, inputs, initial_state=initial_state, scope='rnnlm')
    # Flatten (sequence, time) into rows before the output projection.
    output = tf.reshape(outputs, [-1, rnn_size])
    logits = tf.matmul(output, softmax_w) + softmax_b
    probs = tf.nn.softmax(logits)
    return logits, last_state, probs, cell, initial_state
def load_model(sess, saver, ckpt_path):
    """Restore the newest checkpoint in ``ckpt_path`` or initialise variables.

    Returns:
        The integer after the last '-' of the checkpoint name when a
        checkpoint was restored, otherwise -1.
    """
    newest = tf.train.latest_checkpoint(ckpt_path)
    if not newest:
        print('building model from scratch')
        sess.run(tf.global_variables_initializer())
        return -1

    print('resume from', newest)
    saver.restore(sess, newest)
    # The checkpoint name ends in "-<number>"; that number is returned.
    dash = newest.rindex('-')
    return int(newest[dash + 1:])
# 訓練
def train_neural_network():
    """Train the language model, writing one checkpoint per epoch.

    Training resumes after the newest checkpoint under ``model/`` when one
    exists and runs through epoch 99. The Adam learning rate is
    ``0.002 * 0.97 ** epoch``.
    """
    logits, last_state, _, _, _ = neural_network()
    targets = tf.reshape(output_targets, [-1])
    loss = tf.contrib.legacy_seq2seq.sequence_loss_by_example(
        [logits], [targets], [tf.ones_like(targets, dtype=tf.float32)], len(words))
    cost = tf.reduce_mean(loss)

    learning_rate = tf.Variable(0.0, trainable=False)
    # Build the assignment op once; creating tf.assign inside the epoch loop
    # would add a new op to the graph on every epoch.
    lr_value = tf.placeholder(tf.float32, shape=[])
    set_learning_rate = tf.assign(learning_rate, lr_value)

    tvars = tf.trainable_variables()
    # Clip the global gradient norm to 5 to guard against exploding gradients.
    grads, _ = tf.clip_by_global_norm(tf.gradients(cost, tvars), 5)
    optimizer = tf.train.AdamOptimizer(learning_rate)
    # Gradients are computed and clipped by hand, so apply them explicitly.
    train_op = optimizer.apply_gradients(zip(grads, tvars))

    trainds = DataSet(len(poetrys_vector))

    # GPU memory grows on demand, capped at 90% of the device. The cap is set
    # on the config itself; previously a GPUOptions object was created but
    # never attached, so the limit had no effect.
    config = tf.ConfigProto(allow_soft_placement=True)
    config.gpu_options.per_process_gpu_memory_fraction = 0.9
    config.gpu_options.allow_growth = True

    # Saver.save needs the target directory to exist.
    os.makedirs('model', exist_ok=True)

    with tf.Session(config=config) as sess:
        with tf.device('/gpu:0'):
            sess.run(tf.global_variables_initializer())
            saver = tf.train.Saver(tf.global_variables())
            last_epoch = load_model(sess, saver, 'model/')
            for epoch in range(last_epoch + 1, 100):
                current_lr = 0.002 * (0.97 ** epoch)
                sess.run(set_learning_rate, feed_dict={lr_value: current_lr})
                all_loss = 0.0
                for batche in range(n_chunk):
                    x, y = trainds.next_batch(batch_size)
                    train_loss, _, _ = sess.run([cost, last_state, train_op],
                                                feed_dict={input_data: x, output_targets: y})
                    all_loss = all_loss + train_loss
                    if batche % 50 == 1:
                        print(epoch, batche, current_lr, train_loss)
                saver.save(sess, 'model/poetry.module', global_step=epoch)
                print(epoch, ' Loss: ', all_loss * 1.0 / n_chunk)
# Script entry point: build the graph and run training.
train_neural_network()
#!/usr/bin/python3
# -*- coding: UTF-8 -*-
import collections
import numpy as np
import tensorflow as tf
'''
This one will produce a poetry
author: log16
Date: 2017/5/4
'''
# -------------------------------資料預處理---------------------------#
# Corpus file: one poem per line, formatted as "title:content".
poetry_file = 'poetry.txt'

# Cleaned poems, each wrapped in '[' ... ']' start/end markers.
poetrys = []
# Decode explicitly as UTF-8 so reading does not depend on the platform's
# default locale encoding.
with open(poetry_file, "r", encoding="utf-8") as f:
    for line in f:
        line = line.strip(u'\n')
        try:
            title, content = line.strip(u' ').split(u':')
        except ValueError:
            # The line does not split into exactly "title:content"; skip it.
            continue
        content = content.replace(u' ', u'')
        # Skip poems that contain annotation/markup characters.
        # NOTE(review): the original condition tested u'(' twice; one of them
        # was probably meant to be another bracket character. The filter is
        # left unchanged so the vocabulary matches the trained checkpoint.
        if any(mark in content for mark in (u'_', u'(', u'《', u'[')):
            continue
        # Keep only poems of 5 to 79 characters.
        if len(content) < 5 or len(content) > 79:
            continue
        poetrys.append(u'[' + content + u']')

# Sort poems by length (stable, shortest first).
poetrys.sort(key=len)
print('唐詩總數: ', len(poetrys))
if not poetrys:
    # Fail with a clear message instead of an obscure unpacking error below.
    raise ValueError('no usable poems found in ' + poetry_file)

# Count how often every character occurs.
all_words = []
for poetry in poetrys:
    all_words.extend(poetry)
counter = collections.Counter(all_words)
count_pairs = sorted(counter.items(), key=lambda x: -x[1])
words, _ = zip(*count_pairs)
# Vocabulary: every character by descending frequency, plus a trailing ' '
# that is used as the padding symbol.
words = words + (' ',)
# Map each character to its integer ID (its index in ``words``).
word_num_map = dict(zip(words, range(len(words))))


def to_num(word):
    """Return the integer ID of ``word`` (``len(words)`` if it is unknown)."""
    return word_num_map.get(word, len(words))


# Poems as lists of character IDs,
# e.g. [[314, 3199, 367, ..., 98, 1], [339, 3, 133, ..., 809, 1], ...]
poetrys_vector = [list(map(to_num, poetry)) for poetry in poetrys]

# This script uses a batch size of 1 (one sequence per run).
batch_size = 1
n_chunk = len(poetrys_vector) // batch_size
class DataSet(object):
    """Serve padded (input, target) batches from ``poetrys_vector``.

    Batches are taken through an index array that is reshuffled every time
    an epoch is completed.
    """

    def __init__(self, data_size):
        self._data_size = data_size
        self._epochs_completed = 0  # number of finished passes over the data
        self._index_in_epoch = 0  # read position inside the current pass
        self._data_index = np.arange(data_size)  # indirection into the data

    def next_batch(self, batch_size):
        """Return the next ``(xdata, ydata)`` pair of ``batch_size`` rows."""
        begin = self._index_in_epoch
        stop = begin + batch_size
        if stop > self._data_size:
            # Not enough rows left: reshuffle and restart from the front.
            np.random.shuffle(self._data_index)
            self._epochs_completed += 1
            self._index_in_epoch = batch_size
            return self.data_batch(0, batch_size)

        self._index_in_epoch = stop
        features, labels = self.data_batch(begin, stop)
        if stop == self._data_size:
            # The batch ended exactly on the last row: start a new epoch.
            self._index_in_epoch = 0
            self._epochs_completed += 1
            np.random.shuffle(self._data_index)
        return features, labels

    def data_batch(self, start, end):
        """Build padded arrays for index positions ``start`` .. ``end - 1``."""
        picked = [poetrys_vector[self._data_index[k]] for k in range(start, end)]
        width = max(len(seq) for seq in picked)  # longest sequence in the batch
        # Shorter rows are right-padded with the ID of ' '.
        xdata = np.full((end - start, width), word_num_map[' '], np.int32)
        for r, seq in enumerate(picked):
            xdata[r, :len(seq)] = seq
        # Targets are the inputs shifted one step to the left; the last
        # column keeps the input's own value.
        ydata = np.copy(xdata)
        ydata[:, :-1] = xdata[:, 1:]
        return xdata, ydata
# ---------------------------------------RNN--------------------------------------#
# Graph inputs: int32 placeholders declared with shape [batch_size, None]
# (the second dimension is left unspecified).
input_data = tf.placeholder(tf.int32, [batch_size, None])
# Declared with the same dtype and shape as input_data.
output_targets = tf.placeholder(tf.int32, [batch_size, None])
# 定義RNN
def neural_network(model='lstm', rnn_size=128, num_layers=2):
    """Build the character-level RNN language-model graph.

    Args:
        model: Cell type, one of ``'rnn'``, ``'gru'`` or ``'lstm'``.
        rnn_size: Units per cell; also used as the embedding width.
        num_layers: Number of stacked recurrent layers.

    Returns:
        Tuple ``(logits, last_state, probs, cell, initial_state)``. ``logits``
        and ``probs`` have one row per (sequence, time step) pair and one
        column per vocabulary entry.

    Raises:
        ValueError: If ``model`` is not a supported cell type.
    """
    # Validate first so a typo fails with a clear message instead of an
    # UnboundLocalError on the cell constructor.
    if model not in ('rnn', 'gru', 'lstm'):
        raise ValueError("model must be 'rnn', 'gru' or 'lstm', got %r" % (model,))

    if model == 'lstm':
        cell = tf.nn.rnn_cell.BasicLSTMCell(rnn_size, state_is_tuple=True)
    elif model == 'gru':
        # GRUCell/BasicRNNCell do not take state_is_tuple; passing it (as the
        # previous code did) raises TypeError.
        cell = tf.nn.rnn_cell.GRUCell(rnn_size)
    else:
        cell = tf.nn.rnn_cell.BasicRNNCell(rnn_size)
    # NOTE(review): the same cell object is repeated for every layer. Depending
    # on the TensorFlow 1.x release this may share weights or be rejected;
    # switching to one cell per layer changes variable names, so it is left
    # as-is to stay compatible with existing checkpoints — confirm.
    cell = tf.nn.rnn_cell.MultiRNNCell([cell] * num_layers, state_is_tuple=True)
    initial_state = cell.zero_state(batch_size, tf.float32)

    with tf.variable_scope('rnnlm'):
        softmax_w = tf.get_variable("softmax_w", [rnn_size, len(words)])
        softmax_b = tf.get_variable("softmax_b", [len(words)])
        with tf.device("/cpu:0"):
            # One rnn_size-wide embedding row per vocabulary entry.
            embedding = tf.get_variable("embedding", [len(words), rnn_size])
            inputs = tf.nn.embedding_lookup(embedding, input_data)

    outputs, last_state = tf.nn.dynamic_rnn(cell, inputs, initial_state=initial_state, scope='rnnlm')
    # Flatten (sequence, time) into rows before the output projection.
    output = tf.reshape(outputs, [-1, rnn_size])
    logits = tf.matmul(output, softmax_w) + softmax_b
    probs = tf.nn.softmax(logits)
    return logits, last_state, probs, cell, initial_state
# -------------------------------生成古詩---------------------------------#
# 使用訓練完成的模型
def gen_poetry():
    """Generate one poem with the model restored from ``model/poetry.module-99``.

    The first character is the most probable successor of the '[' start
    marker; every following character is sampled from the predicted
    distribution until the ']' end marker is produced.

    Returns:
        The generated poem as a string, without the '[' / ']' markers.
    """
    def to_word(weights):
        """Sample one vocabulary entry with probability proportional to ``weights``."""
        cumulative = np.cumsum(weights)
        # Scale the draw by the last cumulative value (not a separately
        # computed sum) so rounding differences cannot push the index past the
        # end; the clamp below is a final safety net.
        sample = int(np.searchsorted(cumulative, np.random.rand() * cumulative[-1]))
        return words[min(sample, len(words) - 1)]

    _, last_state, probs, cell, initial_state = neural_network()
    Session_config = tf.ConfigProto(allow_soft_placement=True)
    Session_config.gpu_options.allow_growth = True
    with tf.Session(config=Session_config) as sess:
        with tf.device('/gpu:0'):
            sess.run(tf.global_variables_initializer())
            saver = tf.train.Saver(tf.global_variables())
            saver.restore(sess, 'model/poetry.module-99')

            # Prime the network with the start marker from a zero state.
            state_ = sess.run(cell.zero_state(1, tf.float32))
            x = np.array([[word_num_map['[']]], dtype=np.int32)
            [probs_, state_] = sess.run([probs, last_state], feed_dict={input_data: x, initial_state: state_})
            word = words[np.argmax(probs_)]

            pieces = []
            while word != ']':
                pieces.append(word)
                # Feed the previous character back in as int32 IDs, matching
                # the placeholder's dtype.
                x = np.array([[word_num_map[word]]], dtype=np.int32)
                [probs_, state_] = sess.run([probs, last_state], feed_dict={input_data: x, initial_state: state_})
                word = to_word(probs_)
    return ''.join(pieces)
# Script entry point: generate one poem and print it.
print(gen_poetry())
#!/usr/bin/python3
# -*- coding: UTF-8 -*-
import collections
import numpy as np
import tensorflow as tf
'''
This one will produce a poetry with heads.
author: log16
Data: 2017/5/4
'''
# -------------------------------資料預處理---------------------------#
# Corpus file: one poem per line, formatted as "title:content".
poetry_file = 'poetry.txt'

# Cleaned poems, each wrapped in '[' ... ']' start/end markers.
poetrys = []
# Decode explicitly as UTF-8 so reading does not depend on the platform's
# default locale encoding.
with open(poetry_file, "r", encoding="utf-8") as f:
    for line in f:
        line = line.strip(u'\n')
        try:
            title, content = line.strip(u' ').split(u':')
        except ValueError:
            # The line does not split into exactly "title:content"; skip it.
            continue
        content = content.replace(u' ', u'')
        # Skip poems that contain annotation/markup characters.
        # NOTE(review): the original condition tested u'(' twice; one of them
        # was probably meant to be another bracket character. The filter is
        # left unchanged so the vocabulary matches the trained checkpoint.
        if any(mark in content for mark in (u'_', u'(', u'《', u'[')):
            continue
        # Keep only poems of 5 to 79 characters.
        if len(content) < 5 or len(content) > 79:
            continue
        poetrys.append(u'[' + content + u']')

# Sort poems by length (stable, shortest first).
poetrys.sort(key=len)
print('唐詩總數: ', len(poetrys))
if not poetrys:
    # Fail with a clear message instead of an obscure unpacking error below.
    raise ValueError('no usable poems found in ' + poetry_file)

# Count how often every character occurs.
all_words = []
for poetry in poetrys:
    all_words.extend(poetry)
counter = collections.Counter(all_words)
count_pairs = sorted(counter.items(), key=lambda x: -x[1])
words, _ = zip(*count_pairs)
# Vocabulary: every character by descending frequency, plus a trailing ' '
# that is used as the padding symbol.
words = words + (' ',)
# Map each character to its integer ID (its index in ``words``).
word_num_map = dict(zip(words, range(len(words))))


def to_num(word):
    """Return the integer ID of ``word`` (``len(words)`` if it is unknown)."""
    return word_num_map.get(word, len(words))


# Poems as lists of character IDs,
# e.g. [[314, 3199, 367, ..., 98, 1], [339, 3, 133, ..., 809, 1], ...]
poetrys_vector = [list(map(to_num, poetry)) for poetry in poetrys]

# This script uses a batch size of 1 (one sequence per run).
batch_size = 1
n_chunk = len(poetrys_vector) // batch_size
class DataSet(object):
    """Serve padded (input, target) batches from ``poetrys_vector``.

    Batches are taken through an index array that is reshuffled every time
    an epoch is completed.
    """

    def __init__(self, data_size):
        self._data_size = data_size
        self._epochs_completed = 0  # number of finished passes over the data
        self._index_in_epoch = 0  # read position inside the current pass
        self._data_index = np.arange(data_size)  # indirection into the data

    def next_batch(self, batch_size):
        """Return the next ``(xdata, ydata)`` pair of ``batch_size`` rows."""
        begin = self._index_in_epoch
        stop = begin + batch_size
        if stop > self._data_size:
            # Not enough rows left: reshuffle and restart from the front.
            np.random.shuffle(self._data_index)
            self._epochs_completed += 1
            self._index_in_epoch = batch_size
            return self.data_batch(0, batch_size)

        self._index_in_epoch = stop
        features, labels = self.data_batch(begin, stop)
        if stop == self._data_size:
            # The batch ended exactly on the last row: start a new epoch.
            self._index_in_epoch = 0
            self._epochs_completed += 1
            np.random.shuffle(self._data_index)
        return features, labels

    def data_batch(self, start, end):
        """Build padded arrays for index positions ``start`` .. ``end - 1``."""
        picked = [poetrys_vector[self._data_index[k]] for k in range(start, end)]
        width = max(len(seq) for seq in picked)  # longest sequence in the batch
        # Shorter rows are right-padded with the ID of ' '.
        xdata = np.full((end - start, width), word_num_map[' '], np.int32)
        for r, seq in enumerate(picked):
            xdata[r, :len(seq)] = seq
        # Targets are the inputs shifted one step to the left; the last
        # column keeps the input's own value.
        ydata = np.copy(xdata)
        ydata[:, :-1] = xdata[:, 1:]
        return xdata, ydata
# ---------------------------------------RNN--------------------------------------#
# Graph inputs: int32 placeholders declared with shape [batch_size, None]
# (the second dimension is left unspecified).
input_data = tf.placeholder(tf.int32, [batch_size, None])
# Declared with the same dtype and shape as input_data.
output_targets = tf.placeholder(tf.int32, [batch_size, None])
# 定義RNN
def neural_network(model='lstm', rnn_size=128, num_layers=2):
    """Build the character-level RNN language-model graph.

    Args:
        model: Cell type, one of ``'rnn'``, ``'gru'`` or ``'lstm'``.
        rnn_size: Units per cell; also used as the embedding width.
        num_layers: Number of stacked recurrent layers.

    Returns:
        Tuple ``(logits, last_state, probs, cell, initial_state)``. ``logits``
        and ``probs`` have one row per (sequence, time step) pair and one
        column per vocabulary entry.

    Raises:
        ValueError: If ``model`` is not a supported cell type.
    """
    # Validate first so a typo fails with a clear message instead of an
    # UnboundLocalError on the cell constructor.
    if model not in ('rnn', 'gru', 'lstm'):
        raise ValueError("model must be 'rnn', 'gru' or 'lstm', got %r" % (model,))

    if model == 'lstm':
        cell = tf.nn.rnn_cell.BasicLSTMCell(rnn_size, state_is_tuple=True)
    elif model == 'gru':
        # GRUCell/BasicRNNCell do not take state_is_tuple; passing it (as the
        # previous code did) raises TypeError.
        cell = tf.nn.rnn_cell.GRUCell(rnn_size)
    else:
        cell = tf.nn.rnn_cell.BasicRNNCell(rnn_size)
    # NOTE(review): the same cell object is repeated for every layer. Depending
    # on the TensorFlow 1.x release this may share weights or be rejected;
    # switching to one cell per layer changes variable names, so it is left
    # as-is to stay compatible with existing checkpoints — confirm.
    cell = tf.nn.rnn_cell.MultiRNNCell([cell] * num_layers, state_is_tuple=True)
    initial_state = cell.zero_state(batch_size, tf.float32)

    with tf.variable_scope('rnnlm'):
        softmax_w = tf.get_variable("softmax_w", [rnn_size, len(words)])
        softmax_b = tf.get_variable("softmax_b", [len(words)])
        with tf.device("/cpu:0"):
            # One rnn_size-wide embedding row per vocabulary entry.
            embedding = tf.get_variable("embedding", [len(words), rnn_size])
            inputs = tf.nn.embedding_lookup(embedding, input_data)

    outputs, last_state = tf.nn.dynamic_rnn(cell, inputs, initial_state=initial_state, scope='rnnlm')
    # Flatten (sequence, time) into rows before the output projection.
    output = tf.reshape(outputs, [-1, rnn_size])
    logits = tf.matmul(output, softmax_w) + softmax_b
    probs = tf.nn.softmax(logits)
    return logits, last_state, probs, cell, initial_state
# -------------------------------生成古詩---------------------------------#
# 使用訓練完成的模型
def gen_head_poetry(heads, type):
    """Generate an acrostic poem: one line per character of ``heads``.

    For each head character, lines are sampled from the model restored from
    ``model/poetry.module-99`` until one ends with '。' and is exactly
    ``2 + 2 * type`` characters long.

    Args:
        heads: String whose characters become the first character of each line.
        type: Line style, 5 or 7.

    Returns:
        The poem, one newline-terminated line per head character, or ``None``
        (after printing a message) when ``type`` is neither 5 nor 7.

    Raises:
        KeyError: If a head character is not in the vocabulary.
    """
    if type != 5 and type != 7:
        # The message was previously a bare Python-2 style ``print`` followed
        # by a string on its own line, which prints nothing in Python 3.
        print('The second para has to be 5 or 7!')
        return

    # Length of an accepted line; presumably two clauses of ``type``
    # characters, each followed by one punctuation mark.
    line_len = 2 + 2 * type

    def to_word(weights):
        """Sample one vocabulary entry with probability proportional to ``weights``."""
        cumulative = np.cumsum(weights)
        # Scale the draw by the last cumulative value so rounding differences
        # cannot push the index past the end; the clamp is a safety net.
        sample = int(np.searchsorted(cumulative, np.random.rand() * cumulative[-1]))
        return words[min(sample, len(words) - 1)]

    _, last_state, probs, cell, initial_state = neural_network()
    Session_config = tf.ConfigProto(allow_soft_placement=True)
    Session_config.gpu_options.allow_growth = True
    with tf.Session(config=Session_config) as sess:
        with tf.device('/gpu:0'):
            sess.run(tf.global_variables_initializer())
            saver = tf.train.Saver(tf.global_variables())
            saver.restore(sess, 'model/poetry.module-99')

            # Evaluate the zero state once and reuse it for every attempt
            # instead of adding new zero_state ops to the graph per retry.
            zero_state_ = sess.run(cell.zero_state(1, tf.float32))
            start_x = np.array([[word_num_map[u'[']]], dtype=np.int32)

            lines = []
            for head in heads:
                while True:
                    # Restart from the '[' marker, then force the head character.
                    [probs_, state_] = sess.run([probs, last_state],
                                                feed_dict={input_data: start_x, initial_state: zero_state_})
                    sentence = head
                    x = np.array([[word_num_map[head]]], dtype=np.int32)
                    [probs_, state_] = sess.run([probs, last_state],
                                                feed_dict={input_data: x, initial_state: state_})
                    word = to_word(probs_)
                    sentence += word
                    # Stop once the line is full: a longer line can never be
                    # accepted, and this bounds the loop if '。' is never drawn.
                    while word != u'。' and len(sentence) < line_len:
                        x = np.array([[word_num_map[word]]], dtype=np.int32)
                        [probs_, state_] = sess.run([probs, last_state],
                                                    feed_dict={input_data: x, initial_state: state_})
                        word = to_word(probs_)
                        sentence += word
                    if word == u'。' and len(sentence) == line_len:
                        lines.append(sentence + u'\n')
                        break
    return ''.join(lines)
# Script entry point: generate a 7-character-style acrostic poem and print it.
print(gen_head_poetry(u'求贊求關注', 7))
相關文章
- 簡單明朗的 RNN 寫詩教程RNN
- 怎麼這麼唐詩的 DS 都做不出來啊
- 華為推出AI詩人“樂府”:唐詩宋詞都不在話下,竟一時分不出真假AI
- 機器也可以寫詩——中文詩歌生成網路初探
- 深度學習--RNN基礎深度學習RNN
- 基於canvas生成海報Canvas
- 基於canvas生成圖片Canvas
- 無監督詩詞風格生成
- 基於Gin框架的web後端開發(二): JSON資料生成框架Web後端JSON
- RNN二進位制加法例項RNN
- 用文字挖掘分析了5萬首《全唐詩》,竟然發現這些祕密
- 基於 koa 和 node-qrcode 實現一個二維碼生成工具
- 關於詩歌的故事
- 技術解讀 | 基於fastText和RNN的語義消歧實戰ASTRNN
- 基於 NodeGit 的週報生成工具Git
- 唐山開票-唐山開票
- RNNRNN
- 基於 GD 庫生成圓形頭像
- 如何基於 SAP CDS view 生成 object pageViewObject
- 基於函式計算快速實現《為你寫詩》(阿里雲ECS)函式阿里
- [詩]春天的第二首哀歌
- (二)非線性迴圈神經網路(RNN)神經網路RNN
- 基於Vue的極簡生成器 — VuepressVue
- RNN、LSTMRNN
- 再用RNN神經網路架構設計生成式語言模型RNN神經網路架構模型
- 【精讀】自然語言處理基礎之RNN自然語言處理RNN
- 基於 solox 二次開發
- 全站HTTPS升級系列(二)基於 acme.sh從Letsencrypt生成免費的泛域名證書HTTPACM
- 基於釦子AI智慧體生成雙語播客AI智慧體
- 教你基於MindSpore用DCGAN生成漫畫頭像
- 基於 AST 的程式碼自動生成方案AST
- 基於ZXingAndroid實現生成二維碼圖片和相機掃描二維碼圖片即時解碼的功能Android
- 二維碼生成
- 基於Unity3D引擎的大地形生成研究Unity3D
- 基於雪花演算法的 PHP ID 生成器演算法PHP
- 基於vs外掛的abp程式碼生成器
- 基於SSM風格的Java原始碼生成器SSMJava原始碼
- 基於gd庫和phpqrcode的海報生成外掛PHP