-
Notifications
You must be signed in to change notification settings - Fork 2
/
rnn_v10.py
91 lines (81 loc) · 2.82 KB
/
rnn_v10.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
## Architecture of neural network currently in use for CLIPNET.
import tensorflow as tf
from tensorflow.keras import layers
import custom_loss
# model fitting hyperparameters
epochs = 200
patience = 10
batch_size = 256
# compile parameters
optimizer = tf.keras.optimizers.Adam
opt_hyperparameters = {
"learning_rate": 0.001,
"beta_1": 0.9,
"beta_2": 0.999,
"epsilon": 1e-7,
}
loss = {"shape": "CosineSimilarity", "sum": "msle"}
metrics = {"shape": custom_loss.corr}
# model architecture hyperparameters
c1 = {"filters": 64, "kernel_size": 8}
c2 = {"filters": 128, "kernel_size": 4}
dropout = 0.3
num_dilations = 9
num_filters = 64
dilation_kernel = 3
def dilated_conv(x, filters, kernel_size, dilation_rate):
"""
Constructs a residual block with a single dilated convolutional layer.
"""
# Dilated convolution
residual = layers.Conv1D(
filters=filters,
kernel_size=kernel_size,
padding="same",
dilation_rate=dilation_rate,
)(x)
residual = layers.BatchNormalization()(residual)
residual = layers.Activation("relu")(residual)
# Add skip connection
out = layers.Add()([x, residual])
out = layers.BatchNormalization()(out)
out = layers.Activation("relu")(out)
return out
def construct_nn(input_length, output_length, dilation_kernel=dilation_kernel):
"""
Returns a neural network with given input and output lengths.
"""
# input
X = layers.Input(shape=(input_length, 4))
y = layers.BatchNormalization()(X)
# 1st convolutional layer
y = layers.Conv1D(filters=c1["filters"], kernel_size=c1["kernel_size"])(y)
y = layers.BatchNormalization()(y)
y = layers.Activation("elu")(y)
y = layers.MaxPooling1D(pool_size=(2))(y)
# 2nd convolutional layer
y = layers.Conv1D(filters=c2["filters"], kernel_size=c2["kernel_size"])(y)
y = layers.BatchNormalization()(y)
y = layers.Activation("relu")(y)
y = layers.MaxPooling1D(pool_size=(2))(y)
# dilated convolutions
y = layers.Conv1D(kernel_size=1, filters=num_filters)(y)
for i in range(num_dilations):
y = dilated_conv(
y, filters=num_filters, kernel_size=dilation_kernel, dilation_rate=2**i
)
y = layers.MaxPooling1D(pool_size=(2))(y)
# shape / probability distribution head
p_head = layers.Flatten()(y)
p_head = layers.Dense(output_length)(p_head)
p_head = layers.BatchNormalization()(p_head)
p_head = layers.Activation("relu")(p_head)
p_head = layers.Dropout(dropout, name="shape")(p_head)
# sum head
s_head = layers.GlobalAvgPool1D()(y)
s_head = layers.Dense(1)(s_head)
s_head = layers.BatchNormalization()(s_head)
s_head = layers.Activation("relu")(s_head)
s_head = layers.Dropout(dropout, name="sum")(s_head)
# output model
return tf.keras.models.Model(X, [p_head, s_head])