# neural_nets.py

'''
neural_nets.py contains various network structures, including a linear model, a dense model, a conv model and a
residual net model
'''
from keras.layers import Input, Reshape, Dense, Conv2D, BatchNormalization, Activation, Flatten, Dropout, Lambda, Multiply, Add
from keras.models import Model
from keras.optimizers import Adam
from keras.regularizers import l2
import keras.backend as K

'''
# Possible alternate loss function
def combined_loss(args):
    is_put, pi_put, pi_cap, v = args
    not_is_put = Lambda(lambda x: (x - 1) * -1)
    put_loss = categorical_crossentropy(
    cap_loss = 
    v_loss = 
    return is_put * put_loss + not_is_put * cap_loss + v_loss

# This part would go in each model
custom_loss = Lambda(combined_loss, output_shape=(1,), name='combined_loss')([inputs, self.pi_put, self.pi_capture, self.v])
'''

class LinearModel(object):
    '''
    Linear model: the flattened state passes through one Dense layer with a linear activation and then feeds
    a softmax policy output (pi) and a tanh value output (v)
    '''
    def __init__(self, game, config):
        '''
        Build and compile the Keras model. The compiled network is stored in self.model, and its two output
        tensors in self.pi and self.v.

        Read from game:
        game.board.state.shape -> unpacked as (state_depth, board_x, board_y)

        game.get_placement_action_size() and game.get_capture_action_size() -> their sum is used as the
            number of units of the pi output

        Read from config:
        config.hidden_size -> units of the hidden layer
        config.lr -> passed to the Adam optimizer

        :param game: A game object
        :param config: A config object
        '''
        state_shape = game.board.state.shape
        self.state_depth, self.board_x, self.board_y = state_shape
        self.put_action_size = game.get_placement_action_size()
        self.capture_action_size = game.get_capture_action_size()
        self.config = config

        # Placement and capture actions share one softmax output
        policy_units = self.put_action_size + self.capture_action_size
        input_shape = (self.state_depth, self.board_x, self.board_y)

        board_in = Input(shape=input_shape, name="inputs")
        flat = Flatten()(board_in)
        features = Dense(self.config.hidden_size, activation='linear')(flat)

        self.pi = Dense(policy_units, activation='softmax', name='pi')(features)
        self.v = Dense(1, activation='tanh', name='v')(features)

        self.model = Model(inputs=[board_in], outputs=[self.pi, self.v])
        # Losses are listed in the same order as the outputs: pi first, then v
        losses = ['categorical_crossentropy', 'mean_squared_error']
        self.model.compile(loss=losses, optimizer=Adam(self.config.lr))


class DenseModel(object):
    '''
    Fully connected network: config.num_layers ReLU Dense layers on the flattened state, followed by a
    softmax policy output (pi) and a tanh value output (v)
    '''
    def __init__(self, game, config):
        '''
        Build and compile the Keras model. The compiled network is stored in self.model, and its two output
        tensors in self.pi and self.v.

        Read from game:
        game.board.state.shape -> unpacked as (state_depth, board_x, board_y)

        game.get_placement_action_size() and game.get_capture_action_size() -> their sum is used as the
            number of units of the pi output

        Read from config:
        config.num_layers -> how many hidden Dense layers are stacked
        config.hidden_size -> units of each hidden layer
        config.lr -> passed to the Adam optimizer

        :param game: A game object
        :param config: A config object
        '''
        state_shape = game.board.state.shape
        self.state_depth, self.board_x, self.board_y = state_shape
        self.put_action_size = game.get_placement_action_size()
        self.capture_action_size = game.get_capture_action_size()
        self.config = config

        input_shape = (self.state_depth, self.board_x, self.board_y)
        board_in = Input(shape=input_shape, name="inputs")

        features = Flatten()(board_in)
        for _ in range(self.config.num_layers):
            features = Dense(self.config.hidden_size, activation='relu')(features)

        # Placement and capture actions share one softmax output
        policy_units = self.put_action_size + self.capture_action_size
        self.pi = Dense(policy_units, activation='softmax', name='pi')(features)
        self.v = Dense(1, activation='tanh', name='v')(features)

        self.model = Model(inputs=[board_in], outputs=[self.pi, self.v])
        # Losses are listed in the same order as the outputs: pi first, then v
        losses = ['categorical_crossentropy', 'mean_squared_error']
        self.model.compile(loss=losses, optimizer=Adam(self.config.lr))


class ConvModel(object):
    '''
    Convolutional network: config.num_layers Conv2D + BatchNormalization + ReLU stages, then two Dense stages
    (1024 and 512 units) with dropout, followed by a softmax policy output (pi) and a tanh value output (v)
    '''
    def __init__(self, game, config):
        '''
        Build and compile the Keras model. The compiled network is stored in self.model, and its two output
        tensors in self.pi and self.v.

        Read from game:
        game.board.state.shape -> unpacked as (state_depth, board_x, board_y)

        game.get_placement_action_size() and game.get_capture_action_size() -> their sum is used as the
            number of units of the pi output

        Read from config:
        config.num_layers -> how many convolution stages are stacked
        config.num_filters, config.kernel_size -> filters and kernel size of every Conv2D
        config.regularizer -> l2 factor applied to the Conv2D kernels
        config.dropout -> rate of both Dropout layers
        config.lr -> passed to the Adam optimizer

        :param game: A game object
        :param config: A config object
        '''
        state_shape = game.board.state.shape
        self.state_depth, self.board_x, self.board_y = state_shape
        self.put_action_size = game.get_placement_action_size()
        self.capture_action_size = game.get_capture_action_size()
        self.config = config

        input_shape = (self.state_depth, self.board_x, self.board_y)
        board_in = Input(shape=input_shape, name="inputs")

        features = board_in
        for _ in range(self.config.num_layers):
            relu = Activation('relu')
            # axis=1 because the convolutions are channels first
            batch_norm = BatchNormalization(axis=1)
            conv = Conv2D(filters=self.config.num_filters,
                          kernel_size=self.config.kernel_size,
                          padding='same',
                          data_format='channels_first',
                          kernel_regularizer=l2(self.config.regularizer))
            features = relu(batch_norm(conv(features)))

        features = Flatten()(features)
        for units in (1024, 512):
            dropout = Dropout(self.config.dropout)
            relu = Activation('relu')
            batch_norm = BatchNormalization(axis=1)
            features = dropout(relu(batch_norm(Dense(units)(features))))

        # Placement and capture actions share one softmax output
        policy_units = self.put_action_size + self.capture_action_size
        self.pi = Dense(policy_units, activation='softmax', name='pi')(features)
        self.v = Dense(1, activation='tanh', name='v')(features)

        self.model = Model(inputs=[board_in], outputs=[self.pi, self.v])
        # Losses are listed in the same order as the outputs: pi first, then v
        losses = ['categorical_crossentropy', 'mean_squared_error']
        self.model.compile(loss=losses, optimizer=Adam(self.config.lr))


class ResNet(object):
    '''
    ResNet!!
    '''
    def __init__(self, game, config):
        '''
        Keep references to the game and the config. No Keras layers are created here.

        :param game: A game object, stored as self.game
        :param config: A config object, stored as self.config
        '''
        self.config, self.game = config, game

    def bn_relu(self, input):
        '''
        Apply batch normalization over axis 1, then a ReLU activation.

        :param input: tensor to normalize (axis 1 is presumably the channel axis, since the convolutions in
                      this class use data_format='channels_first')
        :return: the normalized and activated tensor
        '''
        normalize = BatchNormalization(axis=1)
        activate = Activation('relu')
        return activate(normalize(input))

    def conv_bn_relu(self, num_filters, kernel_size, strides):
        '''
        Create a function that applies Conv2D -> BatchNormalization -> ReLU to a tensor.

        :param num_filters: number of filters of the convolution
        :param kernel_size: kernel size of the convolution
        :param strides: strides of the convolution
        :return: a one-argument function mapping an input tensor to the output tensor
        '''
        def apply_block(input):
            # The layer is created on every call, so each application gets its own weights
            conv = Conv2D(filters=num_filters,
                          kernel_size=kernel_size,
                          strides=strides,
                          padding='same',
                          data_format='channels_first',
                          kernel_regularizer=l2(self.config.regularizer))
            return self.bn_relu(conv(input))

        return apply_block

    def bn_conv_relu(self, num_filters, kernel_size, strides):
        '''
        Create a function that applies BatchNormalization -> ReLU -> Conv2D to a tensor.

        :param num_filters: number of filters of the convolution
        :param kernel_size: kernel size of the convolution
        :param strides: strides of the convolution
        :return: a one-argument function mapping an input tensor to the output tensor
        '''
        def f(input):
            out = self.bn_relu(input)
            return Conv2D(filters=num_filters,
                          kernel_size=kernel_size,
                          strides=strides,
                          padding='same',
                          data_format='channels_first',
                          kernel_regularizer=l2(self.config.regularizer))(out)
        # Return the closure; without this the method returns None and callers fail when applying it
        return f



    def short_cut(self, input, residual):
        '''
        Add a block's input to its residual branch, projecting the input first when the shapes differ.

        Both tensors are assumed to be 4D channels-first, i.e. K.int_shape gives (batch, channels, rows, cols);
        this matches the data_format used by the convolutions in this class.

        :param input: tensor that entered the residual block
        :param residual: tensor produced by the block's convolution branch
        :return: the element-wise sum of the (possibly projected) input and the residual
        '''
        input_shape = K.int_shape(input)
        residual_shape = K.int_shape(residual)

        if input_shape == residual_shape:
            shortcut = input
        else:
            # Ceiling division: a 'same'-padded conv with stride s maps n rows to ceil(n / s) rows, and a
            # 1x1 'valid' conv with stride ceil(n_in / n_out) reproduces exactly n_out rows.
            # The same stride is used for rows and columns.
            rate = -(-input_shape[2] // residual_shape[2])
            # 1x1 projection so that channels (axis 1) and spatial size match the residual
            shortcut = Conv2D(filters=residual_shape[1],
                              kernel_size=1,
                              strides=rate,
                              padding='valid',
                              data_format='channels_first',
                              kernel_regularizer=l2(self.config.regularizer))(input)
        # Add is a layer class: instantiate it, then call it on the list of tensors
        return Add()([shortcut, residual])



    def residual_block(self, num_filters, kernel_size, first_block=False, increase_dim=False):
        '''
        Create a function that applies a two-convolution residual block to a tensor.

        :param num_filters: number of filters of both convolutions
        :param kernel_size: kernel size of both convolutions
        :param first_block: if True the first convolution is a plain Conv2D with stride 1 (no preceding
                            BatchNormalization/ReLU) and increase_dim is ignored
        :param increase_dim: if True (and first_block is False) the first convolution uses stride 2,
                             otherwise stride 1
        :return: a one-argument function mapping an input tensor to the block output
        '''
        def f(input):
            if first_block:
                out = Conv2D(filters=num_filters,
                             kernel_size=kernel_size,
                             strides=1,
                             padding='same',
                             data_format='channels_first',
                             kernel_regularizer=l2(self.config.regularizer))(input)
            else:
                # Stride 1 normally, 2 when downsampling. The previous expression
                # 1 + int(1 + increase_dim) produced 2 and 3 instead.
                first_stride = 1 + int(increase_dim)
                out = self.bn_conv_relu(num_filters=num_filters,
                                        kernel_size=kernel_size,
                                        strides=first_stride)(input)

            out = self.bn_conv_relu(num_filters=num_filters, kernel_size=kernel_size, strides=1)(out)
            return self.short_cut(input=input, residual=out)
        return f

    def build_graph(self):
        '''
        Start assembling the residual network. The method is unfinished: it creates the input and the first
        convolution stage, the residual-block loop is still a placeholder, and no model is built or returned.

        Sets self.state_depth, self.board_x, self.board_y (from self.game.board.state.shape),
        self.put_action_size and self.capture_action_size.
        '''
        self.state_depth, self.board_x, self.board_y = self.game.board.state.shape
        self.put_action_size = self.game.get_placement_action_size()
        self.capture_action_size = self.game.get_capture_action_size()

        inputs = Input(shape=(self.state_depth, self.board_x, self.board_y), name="inputs")

        # conv_bn_relu returns a function, so it has to be applied to the input tensor; previously the
        # function itself was stored in hidden
        hidden = self.conv_bn_relu(num_filters=16, kernel_size=2, strides=1)(inputs)
        for _ in range(self.config.num_residual_blocks):
            # hidden = self.residual_block(num_filters=16, )
            pass