RNN: GRU
PyTorch
blog
1. 计算模式
![gru](s3://crabby-images/46839/468393ce88e471f6bdb0fd4944a8556b6dfc08ce)
2. Python代码计算
def gru_test(inputs, dict_):
    """Compute the first GRU time step by hand from a layer's raw parameters.

    Reproduces, with NumPy matrix products, the update a single-layer GRU
    applies to the first input vector when the initial hidden state is all
    zeros:

        r  = sigmoid(W_ir x + b_ir + W_hr h + b_hr)
        z  = sigmoid(W_iz x + b_iz + W_hz h + b_hz)
        n  = tanh(W_in x + b_in + r * (W_hn h + b_hn))
        h' = (1 - z) * n + z * h

    Args:
        inputs: Object whose ``value`` attribute is indexed as
            ``value[0, 0, :]`` to obtain the input vector.
            NOTE(review): presumably laid out as (batch, seq, feature) --
            confirm against the caller.
        dict_: Mapping with a ``'_parameters'`` entry that holds the tensors
            ``weight_ih_l0``, ``weight_hh_l0``, ``bias_ih_l0`` and
            ``bias_hh_l0``. NOTE(review): presumably the ``__dict__`` of a
            GRU module -- verify against the caller.

    Returns:
        A 1-D ``torch.Tensor`` of length ``hidden_size``: the hidden state
        after the first step.
    """
    params = dict_['_parameters']
    weight_ih = params['weight_ih_l0'].detach().numpy()
    weight_hh = params['weight_hh_l0'].detach().numpy()
    bias_ih = params['bias_ih_l0'].detach().numpy()
    bias_hh = params['bias_hh_l0'].detach().numpy()

    # The stacked weight matrix holds the three gates (r, z, n) one after
    # another along axis 0, so each gate owns a third of the rows.
    stacked_rows, _ = weight_ih.shape
    hidden_size = stacked_rows // 3
    gate_r = slice(0, hidden_size)
    gate_z = slice(hidden_size, hidden_size * 2)
    gate_n = slice(hidden_size * 2, hidden_size * 3)

    w_ir, w_iz, w_in = weight_ih[gate_r, :], weight_ih[gate_z, :], weight_ih[gate_n, :]
    w_hr, w_hz, w_hn = weight_hh[gate_r, :], weight_hh[gate_z, :], weight_hh[gate_n, :]
    b_ir, b_iz, b_in = bias_ih[gate_r], bias_ih[gate_z], bias_ih[gate_n]
    b_hr, b_hz, b_hn = bias_hh[gate_r], bias_hh[gate_z], bias_hh[gate_n]

    # Initial hidden state is all zeros; only the first input vector is used.
    h0 = np.zeros(hidden_size, dtype=np.float32)
    x0 = inputs.value[0, 0, :]

    # Input-side and hidden-side affine terms for each gate.
    r_in = np.dot(w_ir, x0) + b_ir
    r_hid = np.dot(w_hr, h0) + b_hr
    z_in = np.dot(w_iz, x0) + b_iz
    z_hid = np.dot(w_hz, h0) + b_hz
    n_in = np.dot(w_in, x0) + b_in
    n_hid = np.dot(w_hn, h0) + b_hn

    # torch.sigmoid / torch.tanh replace the deprecated F.sigmoid / F.tanh.
    reset_gate = torch.sigmoid(torch.from_numpy(r_in + r_hid))
    update_gate = torch.sigmoid(torch.from_numpy(z_in + z_hid))
    # The reset gate scales the whole hidden-side term, bias included.
    candidate = torch.tanh(
        torch.from_numpy(n_in) + reset_gate * torch.from_numpy(n_hid)
    )

    ones = torch.ones(hidden_size)
    h1 = (ones - update_gate) * candidate + update_gate * torch.from_numpy(h0)
    return h1