-
Notifications
You must be signed in to change notification settings - Fork 12
/
Copy pathtrain.py
85 lines (71 loc) · 3.3 KB
/
train.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
from model import CVAE
from utils import *
import numpy as np
import os
import tensorflow as tf
import time
import argparse
parser = argparse.ArgumentParser()
parser.add_argument('--batch_size', help='batch_size', type=int, default=128)
parser.add_argument('--unit_size', help='unit_size of rnn cell', type=int, default=512)
parser.add_argument('--n_rnn_layer', help='number of rnn layer', type=int, default=3)
parser.add_argument('--seq_length', help='max_seq_length', type=int, default=120)
parser.add_argument('--num_epochs', help='epochs', type=int, default=100)
parser.add_argument('--lr', help='learning rate', type=float, default=0.0001)
parser.add_argument('--save_dir', help='save dir', type=str, default='save/')
parser.add_argument('--smiles_data', help='smiles data', type=str)
parser.add_argument('--vocab_from', help='the file where vocab is extracted from', type=str)
parser.add_argument('--pretrained', help='pretrained model', type=str)
args = parser.parse_args()
print (args)
#extact vocab and char
char, vocab = extract_vocab(args.vocab_from, args.seq_length)
#convert smiles to numpy array
molecules_input, molecules_output, length = load_data(args.smiles_data, args.seq_length, char, vocab)
print ('Number of data : ', len(molecules_input))
vocab_size = len(char)
#make save_dir
if not os.path.isdir(args.save_dir):
os.mkdir(args.save_dir)
#divide data into training and test set
num_train_data = int(len(molecules_input)*0.75)
train_molecules_input = molecules_input[0:num_train_data]
test_molecules_input = molecules_input[num_train_data:-1]
train_molecules_output = molecules_output[0:num_train_data]
test_molecules_output = molecules_output[num_train_data:-1]
train_length = length[0:num_train_data]
test_length = length[num_train_data:-1]
model = CVAE(vocab_size,
args
)
if args.pretrained is not None : model.restore(args.pretrained)
print ('Number of parameters : ', np.sum([np.prod(v.shape) for v in tf.trainable_variables()]))
for epoch in range(args.num_epochs):
st = time.time()
# Learning rate scheduling
#model.assign_lr(learning_rate * (decay_rate ** epoch))
train_loss = []
test_loss = []
st = time.time()
for iteration in range(len(train_molecules_input)//args.batch_size):
n = np.random.randint(len(train_molecules_input), size = args.batch_size)
x = np.array([train_molecules_input[i] for i in n])
y = np.array([train_molecules_output[i] for i in n])
l = np.array([train_length[i] for i in n])
cost = model.train(x, y, l)
train_loss.append(cost)
for iteration in range(len(test_molecules_input)//args.batch_size):
n = np.random.randint(len(test_molecules_input), size = args.batch_size)
x = np.array([test_molecules_input[i] for i in n])
y = np.array([test_molecules_output[i] for i in n])
l = np.array([test_length[i] for i in n])
cost = model.test(x, y, l)
test_loss.append(cost)
train_loss = np.mean(np.array(train_loss))
test_loss = np.mean(np.array(test_loss))
end = time.time()
if epoch==0:
print ('epoch\ttrain_loss\ttest_loss\ttime (s)')
print ("%s\t%.3f\t%.3f\t%.3f" %(epoch, train_loss, test_loss, end-st))
ckpt_path = args.save_dir+'/model_'+str(epoch)+'.ckpt'
model.save(ckpt_path, epoch)