-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathlearn.py
54 lines (44 loc) · 1.78 KB
/
learn.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
from __future__ import absolute_import, division, print_function
import os
import pickle
import tflearn
from tflearn.data_utils import *
path = 'data/data.txt'
char_idx_file = 'char_idx.pickle'
maxlen = 10
char_idx = None
if os.path.isfile(char_idx_file):
print('Loading previous char_idx')
char_idx = pickle.load(open(char_idx_file, 'rb'))
X, Y, char_idx = \
textfile_to_semi_redundant_sequences(path, seq_maxlen=maxlen, redun_step=3,
pre_defined_char_idx=char_idx)
pickle.dump(char_idx, open(char_idx_file, 'wb'))
g = tflearn.input_data([None, maxlen, len(char_idx)])
g = tflearn.lstm(g, 512, return_seq=True)
g = tflearn.dropout(g, 0.5)
g = tflearn.lstm(g, 512, return_seq=True)
g = tflearn.dropout(g, 0.5)
g = tflearn.lstm(g, 512)
g = tflearn.dropout(g, 0.5)
g = tflearn.fully_connected(g, len(char_idx), activation='softmax')
g = tflearn.regression(g, optimizer='adam', loss='categorical_crossentropy',
learning_rate=0.001)
m = tflearn.SequenceGenerator(g, dictionary=char_idx,
seq_maxlen=maxlen,
clip_gradients=5.0,
checkpoint_path='model_ass')
with open('data/results.txt', 'w+') as outfile:
for i in range(50):
seed = random_sequence_from_textfile(path, maxlen)
m.fit(X, Y, validation_set=0.1, batch_size=128,
n_epoch=1, run_id='ass')
print("-- TESTING...")
print("-- Test with temperature of 1.0 --")
res1 = m.generate(600, temperature=1.0, seq_seed=seed)
print(res1)
outfile.write(res1 + '\n')
print("-- Test with temperature of 0.5 --")
res2 = m.generate(600, temperature=0.5, seq_seed=seed)
print(res2)
outfile.write(res2 + '\n')