-
Notifications
You must be signed in to change notification settings - Fork 3
/
Copy pathCNN.py
80 lines (71 loc) · 3.59 KB
/
CNN.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
import keras
import numpy as np
from keras.models import Model, load_model, Sequential
from keras.layers import Conv1D, Dense, Reshape, Dropout, LSTM, GlobalMaxPooling1D, MaxPooling1D, Flatten, Input, Concatenate
import tensorflow as tf
from keras import optimizers
#CNN code for motif convolutional layer
# taken from https://github.com/uci-cbcl/DanQ
class CNN():
def __init__(self,model_layers,seq_shape,out_shape=2,conv_filter_number=100,conv_filter_size=20):
model=Sequential()
for i, layer in enumerate(model_layers):
if layer == 'conv':
if i == 0:
HOMER_motifs = list(np.load('homer_matrix.npy'))
filter_len = max([HOMER_motifs[k].shape[0] for k in range(len(HOMER_motifs))])
conv_layer = Conv1D(input_shape=seq_shape,
filters=len(HOMER_motifs)*2,
kernel_size=35,
padding="valid",
activation="relu",
strides=1)
model.add(conv_layer)
conv_weights = conv_layer.get_weights()
reverse_motifs = [HOMER_motifs[j][::-1,::-1] for j in range(len(HOMER_motifs))]
HOMER_motifs = HOMER_motifs + reverse_motifs
for j in range(len(HOMER_motifs)):
m = HOMER_motifs[j][::-1,:]
w = m.shape[0]
conv_weights[0][:,:,j] = 0
start = np.random.randint(low=3, high=35-w-3+1)
conv_weights[0][start:(start+w),:,j] = m - 0.25
conv_weights[1][j] = np.random.uniform(low=-1.0,high=0.0)
conv_layer.set_weights(conv_weights)
conv_layer.trainable=False
else:
model.add(Conv1D(conv_filter_number,conv_filter_size,activation='relu',padding='same'))
if layer == 'globalpool':
model.add(GlobalMaxPooling1D())
if layer == 'maxpool':
model.add(MaxPooling1D(3,1))
if layer == 'LSTM':
model.add(LSTM(16,return_sequences=True))
if layer == 'dense':
model.add(Dropout(0.1))
model.add(Dense(128,activation='relu'))
if 'dense' not in model_layers and 'globalpool' not in model_layers:
model.add(Flatten())
model.add(Dropout(0.1))
model.add(Dense(out_shape,activation='sigmoid'))
adam = optimizers.Adam(lr=1e-4,clipnorm=0.5,decay=(1e-4/100.0))
model.compile(optimizer=adam,loss='binary_crossentropy',metrics=['accuracy'])
self.model = model
def train(self,X,y,sample_weights):
callbacks = [keras.callbacks.EarlyStopping(monitor='val_loss',
patience=3),
keras.callbacks.History()]
history = self.model.fit(x=X,
y=y,epochs=100,
shuffle=True,
validation_split=0.2,
batch_size=100,verbose=1,
callbacks=callbacks,
sample_weight = sample_weights)
return history
def save(self,h5file):
self.model.save(h5file)
def predict(self,X):
return self.model.predict(X)
def error(self,X,y):
return np.linalg.norm(y-self.model.predict(X))