-
Notifications
You must be signed in to change notification settings - Fork 16
/
Copy pathmodel.py
126 lines (104 loc) · 4.67 KB
/
model.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
import tensorflow as tf
from conf import conf
from keras.layers import (
Conv2D, BatchNormalization, Input, Activation, Dense, Reshape,
Add,
)
from keras.optimizers import SGD
from keras import backend as K
from keras.models import Model, load_model
from keras.callbacks import TensorBoard
from keras.regularizers import l2
import os
# Hyper-parameters read once from the project configuration.
# SIZE is the spatial edge length of the network input (SIZE x SIZE x 17).
SIZE = conf['SIZE']
# Factor handed to keras.regularizers.l2 for every regularized layer.
L2_EPSILON = conf['L2_EPSILON']
# Learning rate and momentum of the SGD optimizer used to compile the model.
LEARNING_RATE = conf['LEARNING_RATE']
MOMENTUM = conf['MOMENTUM']

# Keyword arguments splatted into each Conv2D / Dense layer so that both
# kernels and biases receive the same L2 penalty.
REGULARIZERS = dict(
    kernel_regularizer=l2(L2_EPSILON),
    bias_regularizer=l2(L2_EPSILON),
)
def residual_block(input_, node_name):
    """Build one residual block on top of ``input_``.

    The block is conv -> batch-norm -> relu -> conv -> batch-norm, after
    which the block input is added back (skip connection) and a final relu is
    applied. Both convolutions use 256 filters, a 3x3 kernel, stride 1,
    'same' padding and the module-level ``REGULARIZERS``.

    Args:
        input_: Tensor fed into the block; it is also the skip-connection
            operand, so it must be addable to the second batch-norm output.
        node_name: TensorFlow name scope under which the ops are created.

    Returns:
        The output tensor of the final relu activation.
    """
    # Shared settings for both convolutions of the block.
    conv_kwargs = dict(
        REGULARIZERS,
        filters=256,
        kernel_size=(3, 3),
        strides=1,
        padding='same',
    )

    with tf.name_scope(node_name):
        hidden = Conv2D(**conv_kwargs)(input_)
        hidden = BatchNormalization()(hidden)
        hidden = Activation('relu')(hidden)

        hidden = Conv2D(**conv_kwargs)(hidden)
        hidden = BatchNormalization()(hidden)

        # Skip connection: add the untouched block input back in.
        merged = Add()([hidden, input_])
        return Activation('relu')(merged)
def loss(y_true, y_pred):
    """Return mean squared error plus categorical cross-entropy.

    The squared error is averaged over the last axis and then summed with the
    Keras backend categorical cross-entropy of the same tensors.

    Args:
        y_true: Target tensor.
        y_pred: Predicted tensor with the same shape as ``y_true``.

    Returns:
        Tensor holding the summed loss terms.
    """
    squared_error = K.square(y_pred - y_true)
    mean_squared_error = K.mean(squared_error, axis=-1)
    cross_entropy = K.categorical_crossentropy(y_true, y_pred)
    return mean_squared_error + cross_entropy
def _flatten_feature_map(tensor):
    """Reshape a (batch, height, width, channels) tensor to (batch, h*w*c)."""
    # K.int_shape is the public way to read the static shape; the leading
    # entry is the batch dimension and is not part of the Reshape target.
    _, height, width, channels = K.int_shape(tensor)
    return Reshape(target_shape=(height * width * channels,))(tensor)


def build_model(name):
    """Build and compile the two-headed (policy + value) residual network.

    The network takes a ``(SIZE, SIZE, 17)`` channels-last input, applies an
    initial 3x3 convolution with batch-norm and relu, then
    ``conf['N_RESIDUAL_BLOCKS']`` residual blocks, and finally splits into:

    * a policy head ending in a softmax ``Dense`` layer with
      ``SIZE * SIZE + 1`` units named ``policy_out``;
    * a value head ending in a tanh ``Dense`` layer with one unit named
      ``value_out``.

    Args:
        name: Name given to the resulting Keras ``Model``.

    Returns:
        The model, compiled with SGD (``LEARNING_RATE``, ``MOMENTUM``) and
        the module-level ``loss`` function.
    """
    with tf.name_scope('input'):
        _input = Input(shape=(SIZE, SIZE, 17))
        # NOTE(review): no ``padding`` argument is passed here, unlike the
        # convolutions in residual_block which use padding='same' -- confirm
        # that relying on the Keras default is intended.
        conv1 = Conv2D(filters=256, kernel_size=(3, 3), strides=1,
                       data_format='channels_last', **REGULARIZERS)(_input)
        batch1 = BatchNormalization()(conv1)
        relu = Activation('relu')(batch1)

    with tf.name_scope('tower'):
        # Start from the stem output so the heads still have a valid input
        # when N_RESIDUAL_BLOCKS is 0 (previously a NameError).
        tower_output = relu
        for i in range(conf['N_RESIDUAL_BLOCKS']):
            tower_output = residual_block(tower_output, node_name="residual_%s" % i)

    with tf.name_scope('policy'):
        policy_conv = Conv2D(filters=2, kernel_size=(1, 1), strides=1, **REGULARIZERS)(tower_output)
        policy_batch = BatchNormalization()(policy_conv)
        policy_relu = Activation('relu')(policy_batch)
        policy_reshape = _flatten_feature_map(policy_relu)
        policy_out = Dense(SIZE*SIZE + 1, activation='softmax', name="policy_out", **REGULARIZERS)(policy_reshape)

    with tf.name_scope('value'):
        value_conv = Conv2D(filters=2, kernel_size=(1, 1), strides=1, **REGULARIZERS)(tower_output)
        value_batch = BatchNormalization()(value_conv)
        value_relu = Activation('relu')(value_batch)
        value_reshape = _flatten_feature_map(value_relu)
        value_hidden = Dense(256, activation='relu', **REGULARIZERS)(value_reshape)
        value_out = Dense(1, activation='tanh', name="value_out", **REGULARIZERS)(value_hidden)

    model = Model(inputs=[_input], outputs=[policy_out, value_out], name=name)

    sgd = SGD(lr=LEARNING_RATE, momentum=MOMENTUM)
    # A single loss callable is passed, so it is used for both outputs.
    model.compile(sgd, loss=loss)
    return model
def create_initial_model(name):
    """Return the model called ``name``, creating and saving it if needed.

    If ``<MODEL_DIR>/<name>.h5`` already exists it is loaded and returned.
    Otherwise a new model is built, its graph is written to TensorBoard under
    ``<LOG_DIR>/<name>``, ``self_play`` is run with it, and it is saved both
    as ``<MODEL_DIR>/<name>.h5`` and as ``<MODEL_DIR>/best_model.h5``.

    Args:
        name: Model name; also the file stem of the saved model.

    Returns:
        The loaded or newly created Keras model.
    """
    model_dir = conf['MODEL_DIR']
    model_path = os.path.join(model_dir, name) + ".h5"

    if os.path.isfile(model_path):
        return load_model(model_path, custom_objects={'loss': loss})

    fresh_model = build_model(name)

    # Save graph in tensorboard. This graph has the name scopes making it look
    # good in tensorboard, the loaded models will not have the scopes.
    board = TensorBoard(
        log_dir=os.path.join(conf['LOG_DIR'], name),
        histogram_freq=0,
        batch_size=1,
        write_graph=True,
        write_grads=False,
    )
    board.set_model(fresh_model)
    board.on_epoch_end(0)
    board.on_train_end(0)

    # Imported here rather than at module level -- presumably to avoid a
    # circular import with self_play; confirm before moving it.
    from self_play import self_play
    self_play(
        fresh_model,
        n_games=conf['N_GAMES'],
        mcts_simulations=conf['MCTS_SIMULATIONS'],
    )

    # Persist under its own name first, then as the current best model.
    fresh_model.save(model_path)
    fresh_model.save(os.path.join(model_dir, 'best_model.h5'))
    return fresh_model
def load_latest_model():
    """Load the model file in ``conf['MODEL_DIR']`` with the highest index.

    A file's index is the integer found after the last underscore of its
    name, where the name is everything before the first dot (for example
    ``foo_12.h5`` has index 12). Files whose suffix is not an integer, such
    as ``best_model.h5``, are ignored. Only non-negative indices are
    considered.

    Returns:
        The Keras model loaded with the custom ``loss`` function registered.

    Raises:
        OSError: If the directory contains no file with a usable numeric
            suffix.
    """
    model_dir = conf['MODEL_DIR']
    index = -1
    model_filename = None
    for filename in os.listdir(model_dir):
        name = filename.split('.')[0]  # remove .h5
        try:
            i = int(name.split('_')[-1])
        except ValueError:
            # Suffix is not a number, so this is not a numbered model file.
            continue
        if i > index:
            model_filename = filename
            index = i

    if model_filename is None:
        # Fail with a clear message instead of passing None to os.path.join.
        raise OSError("No numbered model file found in %s" % model_dir)

    model = load_model(os.path.join(model_dir, model_filename), custom_objects={'loss': loss})
    print("Loaded latest model", model_filename)
    return model
def load_best_model():
    """Load the model stored at ``ROOT_DIR/MODEL_DIR/BEST_MODEL``.

    All three path components are read from ``conf``.

    Returns:
        The Keras model loaded with the custom ``loss`` function registered.
    """
    best_path = os.path.join(
        conf['ROOT_DIR'],
        conf['MODEL_DIR'],
        conf['BEST_MODEL'],
    )
    return load_model(best_path, custom_objects={'loss': loss})