-
Notifications
You must be signed in to change notification settings - Fork 4
/
Copy pathattention_soft.py
42 lines (35 loc) · 2.1 KB
/
attention_soft.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
#pylint: skip-file
import numpy as np
import theano
import theano.tensor as T
from utils_pg import *
class SoftAttentionLayer(object):
def __init__(self, layer_id, shape, sent_encs, cmt_encs, sent_decs, pz):
prefix = "AttentionLayer_"
layer_id = "_" + layer_id
self.num_summs, self.num_sents, self.num_cmts, self.out_size = shape
self.W_a1 = init_weights((self.out_size, self.out_size), prefix + "W_a1" + layer_id)
self.W_a2 = init_weights((self.out_size, self.out_size), prefix + "W_a2" + layer_id)
self.W_a3 = init_weights((1, self.out_size), prefix + "W_a3" + layer_id)
self.W_a4 = init_weights((self.out_size, self.out_size), prefix + "W_a4" + layer_id)
#self.W_a5 = init_weights((self.num_summs, 1), prefix + "W_a5" + layer_id)
#self.W_a6 = init_weights((self.num_summs, 1), prefix + "W_a6" + layer_id)
self.W_a5 = init_weights((self.out_size, self.out_size), prefix + "W_a5" + layer_id)
self.W_a6 = init_weights((self.out_size, self.out_size), prefix + "W_a6" + layer_id)
def attend(h, sent_encs, num_sents):
h = T.reshape(h, (1, self.out_size))
h_ = T.repeat(h, num_sents, axis=0)
M = T.tanh(T.dot(self.W_a1, sent_encs.T) + T.dot(self.W_a2, h_.T))
a = T.nnet.softmax(T.dot(self.W_a3, M))
return a
outputs, updates = theano.scan(attend, sequences = sent_decs, non_sequences = [sent_encs, self.num_sents])
A = T.reshape(outputs, (self.num_summs, self.num_sents))
c = T.dot(A, sent_encs)
outputs2, updates2 = theano.scan(attend, sequences = sent_decs, non_sequences = [cmt_encs, self.num_cmts])
A2 = T.reshape(outputs2, (self.num_summs, self.num_cmts))
pz = T.repeat(pz, self.num_summs, axis=0)
c2 = T.dot(A2 * pz, cmt_encs)
self.activation = T.tanh(T.dot(c, self.W_a4) + T.dot(c2, self.W_a6) + T.dot(sent_decs, self.W_a5))
self.A = A
self.params = [self.W_a1, self.W_a2, self.W_a3, self.W_a4, self.W_a5, self.W_a6]
#self.params = [self.W_a4, self.W_a5, self.W_a6]