راهنمایی در مورد کد LSTM

سلام دوستان، خط rnn_cell = rnn.MultiRNNCell([rnn.BasicLSTMCell(n_hidden),rnn.BasicLSTMCell(n_hidden)]) در قطعه کد زیر چه کاری انجام می‌دهد؟

کد را از اینجا گرفتم:

from __future__ import print_function

import numpy as np

import tensorflow as tf

from tensorflow.contrib import rnn

import random

import collections

import time

# Wall-clock reference taken at start-up; the training block later prints
# elapsed(time.time() - start_time) once optimization has finished.

start_time = time.time()

def elapsed(sec):
    """Format a duration given in seconds as a short human-readable string.

    Values below one minute are reported in seconds, values below one hour
    in minutes, and everything else in hours.  The number is rendered with
    plain ``str()``, so no rounding is applied.

    Args:
        sec: Duration in seconds.

    Returns:
        The scaled duration followed by " sec", " min" or " hr".
    """
    if sec < 60:
        return str(sec) + " sec"
    if sec < 60 * 60:
        return str(sec / 60) + " min"
    return str(sec / (60 * 60)) + " hr"

# Target log path

logs_path = '/output'

# Summary writer bound to logs_path; the training block adds the session
# graph to it via writer.add_graph(...).

writer = tf.summary.FileWriter(logs_path)

# Text file containing words for training

training_file = 'belling_the_cat.txt'

def read_data(fname):
    """Read a text file and return its words as a 1-D NumPy array.

    The file content is split on any run of whitespace (spaces, tabs,
    newlines), so leading/trailing blanks and empty lines produce no
    entries.  Words are returned in the order they appear in the file.

    Args:
        fname: Path of the text file to read.

    Returns:
        ``numpy.ndarray`` of word strings (empty if the file has no words).
    """
    with open(fname) as f:
        # A single whitespace split yields the same tokens as stripping and
        # splitting every line separately.
        words = f.read().split()
    return np.array(words)

# Flat array of every word of the training text, in file order.

training_data = read_data(training_file)

print("Loaded training data...")

def build_dataset(words):
    """Build word <-> integer-id lookup tables from a sequence of words.

    Ids are assigned in the order returned by ``Counter.most_common()``,
    i.e. the most frequent word gets id 0, the next one id 1, and so on.

    Args:
        words: Iterable of hashable word tokens.

    Returns:
        A ``(dictionary, reverse_dictionary)`` tuple where ``dictionary``
        maps word -> id and ``reverse_dictionary`` maps id -> word.
    """
    ranked = collections.Counter(words).most_common()
    dictionary = {word: index for index, (word, _) in enumerate(ranked)}
    reverse_dictionary = {index: word for word, index in dictionary.items()}
    return dictionary, reverse_dictionary

# Word <-> id lookup tables for the training text.

dictionary, reverse_dictionary = build_dataset(training_data)

# Number of distinct words; sets the width of the label and output layer.

vocab_size = len(dictionary)

# Parameters

learning_rate = 0.001

# Number of training steps executed by the training loop.

training_iters = 50000

# Averages and a sample prediction are printed every display_step steps.

display_step = 1000

# Number of consecutive words fed to the network for each prediction.

n_input = 3

# number of units in RNN cell

n_hidden = 512

# tf Graph input

# x is fed the word ids of an n_input-word window, shaped [batch, n_input, 1].

x = tf.placeholder("float", [None, n_input, 1])

# y is fed the one-hot encoding of the word that follows the window.

y = tf.placeholder("float", [None, vocab_size])

# RNN output node weights and biases

# (project the n_hidden-wide last RNN output onto vocab_size scores)

weights = {

'out': tf.Variable(tf.random_normal([n_hidden, vocab_size]))

}

biases = {

'out': tf.Variable(tf.random_normal([vocab_size]))

}

def RNN(x, weights, biases):
    """Build the stacked-LSTM graph and return per-word scores (logits).

    Args:
        x: Input tensor holding word ids; it is reshaped to
            ``[-1, n_input]`` before being split into time steps.
        weights: Dict whose ``'out'`` entry is the output projection matrix.
        biases: Dict whose ``'out'`` entry is the output bias vector.

    Returns:
        Tensor ``outputs[-1] @ weights['out'] + biases['out']``, i.e. the
        projection of the RNN output at the last time step.
    """
    # Flatten to [batch, n_input] (one row per example, one column per word).
    x = tf.reshape(x, [-1, n_input])

    # Split along axis 1 into a list of n_input tensors, one per time step
    # (eg. [had] [a] [general] -> [20] [6] [33])
    x = tf.split(x, n_input, 1)

    # 2-layer LSTM, each layer has n_hidden units.
    # MultiRNNCell wraps the listed cells into a single cell that applies
    # them in sequence: at every time step the output of the first
    # BasicLSTMCell is the input of the second one.
    # Average Accuracy= 95.20% at 50k iter
    rnn_cell = rnn.MultiRNNCell([rnn.BasicLSTMCell(n_hidden), rnn.BasicLSTMCell(n_hidden)])
    print(type(rnn_cell))
    print(rnn_cell)

    # 1-layer LSTM with n_hidden units but with lower accuracy.
    # Average Accuracy= 90.60% 50k iter
    # Uncomment line below to test but comment out the 2-layer rnn.MultiRNNCell above
    # rnn_cell = rnn.BasicLSTMCell(n_hidden)

    # generate prediction
    outputs, states = rnn.static_rnn(rnn_cell, x, dtype=tf.float32)

    # there are n_input outputs but
    # we only want the last output
    return tf.matmul(outputs[-1], weights['out']) + biases['out']

# Unnormalized scores over the vocabulary for the word following the input window.

pred = RNN(x, weights, biases)

# Loss and optimizer

# (mean softmax cross-entropy between the scores and the one-hot label, minimized with RMSProp)

cost = tf.reduce_mean(tf.nn.softmax_cross_entropy_with_logits(logits=pred, labels=y))

optimizer = tf.train.RMSPropOptimizer(learning_rate=learning_rate).minimize(cost)

# Model evaluation

# (a prediction counts as correct when the highest-scoring word id equals the label's id)

correct_pred = tf.equal(tf.argmax(pred,1), tf.argmax(y,1))

accuracy = tf.reduce_mean(tf.cast(correct_pred, tf.float32))

# Initializing the variables

init = tf.global_variables_initializer()

# Launch the graph

# Train the model: each step feeds one window of n_input consecutive words
# and the word that follows it, then advances the window by n_input + 1.
with tf.Session() as session:
    session.run(init)
    step = 0
    offset = random.randint(0, n_input + 1)
    end_offset = n_input + 1
    acc_total = 0
    loss_total = 0

    writer.add_graph(session.graph)

    while step < training_iters:
        # Generate a minibatch. Add some randomness on selection process.
        # Restart near the beginning once the window plus its target word
        # would run past the end of the text.
        if offset > (len(training_data) - end_offset):
            offset = random.randint(0, n_input + 1)

        # Input: ids of the n_input words starting at offset, shaped [1, n_input, 1].
        symbols_in_keys = [[dictionary[str(training_data[i])]] for i in range(offset, offset + n_input)]
        symbols_in_keys = np.reshape(np.array(symbols_in_keys), [-1, n_input, 1])

        # Label: one-hot vector of the word right after the window, shaped [1, vocab_size].
        symbols_out_onehot = np.zeros([vocab_size], dtype=float)
        symbols_out_onehot[dictionary[str(training_data[offset + n_input])]] = 1.0
        symbols_out_onehot = np.reshape(symbols_out_onehot, [1, -1])

        _, acc, loss, onehot_pred = session.run(
            [optimizer, accuracy, cost, pred],
            feed_dict={x: symbols_in_keys, y: symbols_out_onehot})
        loss_total += loss
        acc_total += acc

        if (step + 1) % display_step == 0:
            print("Iter= " + str(step + 1) + ", Average Loss= " +
                  "{:.6f}".format(loss_total / display_step) + ", Average Accuracy= " +
                  "{:.2f}%".format(100 * acc_total / display_step))
            acc_total = 0
            loss_total = 0
            symbols_in = [training_data[i] for i in range(offset, offset + n_input)]
            symbols_out = training_data[offset + n_input]
            # onehot_pred is already a NumPy array fetched by session.run, so
            # take the argmax with NumPy; building tf.argmax(...) here would
            # add a new op to the graph at every report.
            symbols_out_pred = reverse_dictionary[int(np.argmax(onehot_pred, 1)[0])]
            print("%s - [%s] vs [%s]" % (symbols_in, symbols_out, symbols_out_pred))

        step += 1
        offset += (n_input + 1)

    print("Optimization Finished!")
    print("Elapsed time: ", elapsed(time.time() - start_time))
    print("Run on command line.")

وبـــلاگ هــفت خــط کــد

راهنمایی در مورد کد LSTM

لطفا وارد شوید یا ثبت نام کنید برای اضافه کردن دیدگاه .

پاسخ شما

سوالات مرتبط

وبـــلاگ هــفت خــط کــد

راهنمایی در مورد کد LSTM

لطفا وارد شوید یا ثبت نام کنید برای اضافه کردن دیدگاه .

پاسخ شما