# tfworld-hackathon/scripts/GANModels.py

# Import modules
import tensorflow as tf
from tensorflow.keras.models import Model
from tensorflow.keras.layers import Lambda, Dense, LSTM, Activation, Input, Bidirectional, Dropout
from tensorflow.keras.layers import Reshape, Conv2DTranspose, TimeDistributed, Conv1D, LeakyReLU, Layer, ReLU
from tensorflow.keras.optimizers import Adam
import tensorflow.keras.backend as K

def Generator(d, num_samples, c=16):
    """Build the generator network.

    Maps a 100-dimensional latent vector to a single-channel signal of
    16384 samples whose values are squashed into (-1, 1) by a tanh.

    Args:
        d: Channel scale factor; every layer's width is a multiple of d.
        num_samples: Currently unused. The architecture below is fixed at
            five stride-4 upsampling layers starting from 16 time steps,
            i.e. 16 * 4**5 == 16384 output samples. The number of
            transposed convolutions would have to change to support
            other lengths.
        c: Initial channel multiplier. It is integer-halved before each of
            the first four upsampling layers, so it should be at least 16
            for the multiplier to stay positive.

    Returns:
        A Keras Model from the latent input to the tanh-activated output.
    """
    # Number of time steps produced by the dense projection. This is a
    # property of the architecture and is independent of the channel
    # multiplier c (the original reshaped to (c, c*d), which only matched
    # the Dense width when c happened to equal 16).
    initial_length = 16

    def upsample(tensor, filters):
        # 1-D transposed convolution emulated with Conv2DTranspose: add a
        # dummy height axis of size 1, upsample the width axis by 4, then
        # drop the dummy axis again.
        expanded = Lambda(lambda x: K.expand_dims(x, axis=1))(tensor)
        upsampled = Conv2DTranspose(
            filters, (1, 25), strides=(1, 4), padding='same')(expanded)
        return Lambda(lambda x: x[:, 0])(upsampled)

    input_layer = Input(shape=(100,))

    # output shape = (None, 16, c*d)  -> (None, 16, 16d) for the default c
    dense_layer0 = Dense(initial_length * c * d)(input_layer)
    reshape_layer0 = Reshape((initial_length, c * d))(dense_layer0)
    net = ReLU()(reshape_layer0)

    # Upsampling. With the default c the output shapes are, in order:
    # (None, 64, 8d), (None, 256, 4d), (None, 1024, 2d), (None, 4096, d)
    for _ in range(4):
        c //= 2
        net = upsample(net, c * d)
        net = ReLU()(net)

    # output shape = (None, 16384, 1)
    net = upsample(net, 1)

    #### The number of transposed convolution operations should be modified
    #### in accordance with num_samples. This current architecture expects
    #### num_samples == 16384

    # Squeeze values between (-1, 1)
    tanh_layer0 = Activation('tanh')(net)

    model = Model(inputs=input_layer, outputs=tanh_layer0)

    return model

# Phase shuffle keeps the critic from keying on the generator's upsampling
# artifacts, which would otherwise make generated audio trivially easy to
# identify.
def _apply_phaseshuffle(x, rad=2, pad_type='reflect'):
    """Shift a rank-3 tensor along axis 1 by a random number of steps.

    A single integer shift is drawn from [-rad, rad] and applied to the
    whole tensor. The vacated positions are filled by padding with
    `pad_type`, and the result is cropped back to the original length.

    Args:
        x: Tensor with three dimensions; axis 1 is the one being shifted.
        rad: Maximum absolute shift.
        pad_type: Padding mode handed to tf.pad.

    Returns:
        A tensor with the same static shape as `x`.
    """
    batch, length, channels = x.get_shape().as_list()

    # maxval is exclusive, hence rad + 1 to make +rad reachable.
    shift = tf.random.uniform([], minval=-rad, maxval=rad + 1, dtype=tf.int32)

    # Positive shift pads on the left, negative shift pads on the right.
    left_pad = tf.maximum(shift, 0)
    right_pad = tf.maximum(-shift, 0)
    padded = tf.pad(x, [[0, 0], [left_pad, right_pad], [0, 0]], mode=pad_type)

    # Crop a window of the original length, starting after any right padding.
    shuffled = padded[:, right_pad:right_pad + length]

    # Slicing with tensor bounds loses the static shape; restore it.
    shuffled.set_shape([batch, length, channels])

    return shuffled

def Critic(d, num_samples, c=1):
    """Build the critic network.

    Takes a signal of shape (num_samples, 1) and produces a single
    unbounded score from a final Dense(1) with no activation.

    Args:
        d: Channel scale factor; every layer's width is a multiple of d.
        num_samples: Length of the input signal. The final reshape assumes
            16 time steps remain after the five stride-4 convolutions,
            which is the case for num_samples == 16384.
        c: Initial channel multiplier; doubled before each convolution
            after the first.

    Returns:
        A Keras Model from the signal input to the critic score.
    """
    num_blocks = 5

    input_layer = Input(shape=(num_samples, 1))
    net = input_layer

    # Downsampling. With the default c the output shapes are, in order:
    # (None, 4096, d), (None, 1024, 2d), (None, 256, 4d), (None, 64, 8d),
    # (None, 16, 16d)
    for block_idx in range(num_blocks):
        if block_idx > 0:
            c *= 2
        net = Conv1D(c*d, 25, strides=4, padding='same')(net)
        net = LeakyReLU(alpha=0.2)(net)
        # Phase shuffle follows every block except the last one.
        if block_idx < num_blocks - 1:
            net = Lambda(lambda x: _apply_phaseshuffle(x))(net)

    #### The number of convolution operations should be modified
    #### in accordance with num_samples. This current architecture expects
    #### num_samples == 16384

    # output shape = (None, 256d)
    flattened = Reshape((16*c*d,))(net)

    # Output a critic score
    score = Dense(1)(flattened)

    return Model(inputs=input_layer, outputs=score)
new 2020-01-01 15:13:30 +11:00			`# Import modules`
			`import tensorflow as tf`
			`from tensorflow.keras.models import Model`
			`from tensorflow.keras.layers import Lambda, Dense, LSTM, Activation, Input, Bidirectional, Dropout`
			`from tensorflow.keras.layers import Reshape, Conv2DTranspose, TimeDistributed, Conv1D, LeakyReLU, Layer, ReLU`
			`from tensorflow.keras.optimizers import Adam`
			`import tensorflow.keras.backend as K`

			`def Generator(d, num_samples, c=16):`

			`input_layer = Input(shape=(100,))`

			`# output shape = (None, 16, 16d)`
			`dense_layer0 = Dense(16*c*d)(input_layer)`
			`reshape_layer0 = Reshape((c, c*d))(dense_layer0)`
			`relu_layer0 = ReLU()(reshape_layer0)`

			`# Upsampling`
			`# output shape = (None, 64, 8d)`
			`c //= 2`
			`expanded_layer0 = Lambda(lambda x: K.expand_dims(x, axis=1))(relu_layer0)`
			`conv1d_t_layer0 = Conv2DTranspose(c*d, (1, 25), strides=(1, 4), padding='same')(expanded_layer0)`
			`slice_layer0 = Lambda(lambda x: x[:, 0])(conv1d_t_layer0)`
			`relu_layer1 = ReLU()(slice_layer0)`

			`# output shape = (None, 256, 4d)`
			`c //= 2`
			`expanded_layer1 = Lambda(lambda x: K.expand_dims(x, axis=1))(relu_layer1)`
			`conv1d_t_layer1 = Conv2DTranspose(c*d, (1, 25), strides=(1, 4), padding='same')(expanded_layer1)`
			`slice_layer1 = Lambda(lambda x: x[:, 0])(conv1d_t_layer1)`
			`relu_layer2 = ReLU()(slice_layer1)`

			`# output shape = (None, 1024, 2d)`
			`c //= 2`
			`expanded_layer2 = Lambda(lambda x: K.expand_dims(x, axis=1))(relu_layer2)`
			`conv1d_t_layer2 = Conv2DTranspose(c*d, (1, 25), strides=(1, 4), padding='same')(expanded_layer2)`
			`slice_layer2 = Lambda(lambda x: x[:, 0])(conv1d_t_layer2)`
			`relu_layer3 = ReLU()(slice_layer2)`

			`# output shape = (None, 4096, d)`
			`c //= 2`
			`expanded_layer3 = Lambda(lambda x: K.expand_dims(x, axis=1))(relu_layer3)`
			`conv1d_t_layer3 = Conv2DTranspose(c*d, (1, 25), strides=(1, 4), padding='same')(expanded_layer3)`
			`slice_layer3 = Lambda(lambda x: x[:, 0])(conv1d_t_layer3)`
			`relu_layer4 = ReLU()(slice_layer3)`

			`# output shape = (None, 16384, 1)`
			`expanded_layer4 = Lambda(lambda x: K.expand_dims(x, axis=1))(relu_layer4)`
			`conv1d_t_layer4 = Conv2DTranspose(1, (1, 25), strides=(1, 4), padding='same')(expanded_layer4)`
			`slice_layer4 = Lambda(lambda x: x[:, 0])(conv1d_t_layer4)`

			`#### The number of transposed convolution operations should be modified`
			`#### in accordance with num_samples. This current architecture expects`
			`#### num_samples == 16384`

			`# Squeeze values between (-1, 1)`
			`tanh_layer0 = Activation('tanh')(slice_layer4)`

			`model = Model(inputs=input_layer, outputs=tanh_layer0)`

			`return model`

			`# Makes critic invariant to upsampling artifacts of generator to avoid the critic learning to`
			`# easily identify generated audio from said artifacts`
			`def _apply_phaseshuffle(x, rad=2, pad_type='reflect'):`
			`b, x_len, nch = x.get_shape().as_list()`

			`phase = tf.random.uniform([], minval=-rad, maxval=rad + 1, dtype=tf.int32)`
			`pad_l = tf.maximum(phase, 0)`
			`pad_r = tf.maximum(-phase, 0)`
			`phase_start = pad_r`
			`x = tf.pad(x, [[0, 0], [pad_l, pad_r], [0, 0]], mode=pad_type)`

			`x = x[:, phase_start:phase_start+x_len]`
			`x.set_shape([b, x_len, nch])`

			`return x`

			`def Critic(d, num_samples, c=1):`

			`input_layer = Input(shape=(num_samples, 1))`

			`# Downsampling`
			`# output shape = (None, 4096, d)`
			`conv1d_layer0 = Conv1D(c*d, 25, strides=4, padding='same')(input_layer)`
			`LReLU_layer0 = LeakyReLU(alpha=0.2)(conv1d_layer0)`
			`phaseshuffle_layer0 = Lambda(lambda x: _apply_phaseshuffle(x))(LReLU_layer0)`

			`# output shape = (None, 1024, 2d)`
			`c *= 2`
			`conv1d_layer1 = Conv1D(c*d, 25, strides=4, padding='same')(phaseshuffle_layer0)`
			`LReLU_layer1 = LeakyReLU(alpha=0.2)(conv1d_layer1)`
			`phaseshuffle_layer1 = Lambda(lambda x: _apply_phaseshuffle(x))(LReLU_layer1)`

			`# output shape = (None, 256, 4d)`
			`c *= 2`
			`conv1d_layer2 = Conv1D(c*d, 25, strides=4, padding='same')(phaseshuffle_layer1)`
			`LReLU_layer2 = LeakyReLU(alpha=0.2)(conv1d_layer2)`
			`phaseshuffle_layer2 = Lambda(lambda x: _apply_phaseshuffle(x))(LReLU_layer2)`

			`# output shape = (None, 64, 8d)`
			`c *= 2`
			`conv1d_layer3 = Conv1D(c*d, 25, strides=4, padding='same')(phaseshuffle_layer2)`
			`LReLU_layer3 = LeakyReLU(alpha=0.2)(conv1d_layer3)`
			`phaseshuffle_layer3 = Lambda(lambda x: _apply_phaseshuffle(x))(LReLU_layer3)`

			`# output shape = (None, 16, 16d)`
			`c *= 2`
			`conv1d_layer4 = Conv1D(c*d, 25, strides=4, padding='same')(phaseshuffle_layer3)`
			`LReLU_layer4 = LeakyReLU(alpha=0.2)(conv1d_layer4)`

			`#### The number of convolution operations should be modified`
			`#### in accordance with num_samples. This current architecture expects`
			`#### num_samples == 16384`

			`# output shape = (None, 256d)`
			`reshape_layer0 = Reshape((16*c*d,))(LReLU_layer4)#`

			`# Output a critic score`
			`dense_layer1 = Dense(1)(reshape_layer0)`

			`model = Model(inputs=input_layer, outputs=dense_layer1)`

			`return model`