Exemplo n.º 1
0
    def reset_parameters(self):
        """Re-initialize the per-head parameters of this layer.

        For every head index in ``range(self.attn_heads)`` the matching
        entries of ``self.kernels`` and ``self.att_kernels`` are passed to
        ``glorot_uniform``. When ``self.use_bias`` is truthy, the head's
        entry in ``self.biases`` is passed to ``zeros``.
        """
        for idx in range(self.attn_heads):
            # Feature kernel first, then attention kernel.
            for group in (self.kernels, self.att_kernels):
                glorot_uniform(group[idx])

            if not self.use_bias:
                continue
            zeros(self.biases[idx])
Exemplo n.º 2
0
    def _initialize(self):
        """Initialize the weights and their velocity buffers.

        First pass: each weight goes through ``glorot_uniform`` and its
        paired velocity through ``zeros``.

        Second pass: every entry of ``self.weights`` and
        ``self.w_velocities`` is replaced in place by its ``.detach()``
        result, and ``requires_grad`` is set to ``True`` on the stored
        weight only (velocities are left as returned by ``detach``).
        """
        for weight, velocity in zip(self.weights, self.w_velocities):
            glorot_uniform(weight)
            zeros(velocity)

        for ix, weight in enumerate(self.weights):
            self.weights[ix] = weight.detach()
            self.w_velocities[ix] = self.w_velocities[ix].detach()
            # Set the flag on the stored entry, after the write-back.
            self.weights[ix].requires_grad = True
Exemplo n.º 3
0
    def reset_parameters(self):
        """Re-initialize the per-head parameters of this layer.

        For each head index in ``range(self.attn_heads)``, the head's
        entries in ``self.kernels``, ``self.attn_kernel_self`` and
        ``self.attn_kernel_neighs`` are passed to ``glorot_uniform`` in
        that order. If ``self.use_bias`` is truthy, the head's entry in
        ``self.biases`` is passed to ``zeros``.
        """
        for idx in range(self.attn_heads):
            # Collect this head's three tensors before initializing any.
            head_params = (
                self.kernels[idx],
                self.attn_kernel_self[idx],
                self.attn_kernel_neighs[idx],
            )
            for param in head_params:
                glorot_uniform(param)

            if not self.use_bias:
                continue
            zeros(self.biases[idx])
Exemplo n.º 4
0
    def reset_parameters(self):
        """Re-initialize the sub-layers and this module's own parameters.

        Calls ``reset_parameters()`` on every element of ``self.layers``,
        then applies ``glorot_uniform`` to each element of ``self.scores``
        and ``self.D_k`` and ``zeros`` to each element of ``self.bias``
        and ``self.D_bias``.
        """
        for sublayer in self.layers:
            sublayer.reset_parameters()

        # NOTE(review): an earlier comment claimed the score bias is filled
        # with a positive value so the score starts close to 1, but the code
        # zero-fills it. Behavior is kept as-is here; confirm the intent.
        init_plan = (
            (self.scores, glorot_uniform),
            (self.bias, zeros),
            (self.D_k, glorot_uniform),
            (self.D_bias, zeros),
        )
        for params, initializer in init_plan:
            for param in params:
                initializer(param)
Exemplo n.º 5
0
 def reset_parameters(self):
     """Re-initialize this layer's kernel and bias.

     ``self.kernel`` is passed to ``uniform`` and ``self.bias`` to
     ``zeros``; both helpers are defined outside this method.
     """
     kernel, bias = self.kernel, self.bias
     uniform(kernel)
     zeros(bias)