def lcr_rot(input_fw, input_bw, sen_len_fw, sen_len_bw, target, sen_len_tr, keep_prob1, keep_prob2, l2, _id='all'):
    """LCR-Rot-inv: inverted left-center-right rotatory attention classifier.

    Encodes left context, right context and target phrase with separate
    BiLSTMs, runs target-to-context attention first ('tl'/'tr') and then
    context-to-target attention ('l'/'r'), and classifies the concatenated
    attended vectors with a softmax layer.

    Args:
        input_fw:   left-context word embeddings (dropout applied here).
        input_bw:   right-context word embeddings (dropout applied here).
        sen_len_fw: actual lengths of the left contexts.
        sen_len_bw: actual lengths of the right contexts.
        target:     target-phrase word embeddings (dropout applied here).
        sen_len_tr: actual lengths of the target phrases.
        keep_prob1: dropout keep probability for the embedding inputs.
        keep_prob2: dropout keep probability inside the softmax layer.
        l2:         L2 regularization coefficient.
        _id:        suffix used to make TF variable names unique.

    Returns:
        (prob, att_l, att_r, att_t_l, att_t_r): class probabilities plus the
        four attention-score tensors.
    """
    print('I am lcr_rot_inv.')
    cell = tf.contrib.rnn.LSTMCell
    # left context: dropout -> BiLSTM -> length-masked mean pool
    input_fw = tf.nn.dropout(input_fw, keep_prob=keep_prob1)
    hiddens_l = bi_dynamic_rnn(cell, input_fw, FLAGS.n_hidden, sen_len_fw, FLAGS.max_sentence_len, 'l' + _id, 'all')
    pool_l = reduce_mean_with_len(hiddens_l, sen_len_fw)
    # right context: dropout -> BiLSTM -> length-masked mean pool
    input_bw = tf.nn.dropout(input_bw, keep_prob=keep_prob1)
    hiddens_r = bi_dynamic_rnn(cell, input_bw, FLAGS.n_hidden, sen_len_bw, FLAGS.max_sentence_len, 'r' + _id, 'all')
    pool_r = reduce_mean_with_len(hiddens_r, sen_len_bw)
    # target phrase: dropout -> BiLSTM -> length-masked mean pool
    target = tf.nn.dropout(target, keep_prob=keep_prob1)
    hiddens_t = bi_dynamic_rnn(cell, target, FLAGS.n_hidden, sen_len_tr, FLAGS.max_sentence_len, 't' + _id, 'all')
    pool_t = reduce_mean_with_len(hiddens_t, sen_len_tr)  # unused in this (inv) variant; kept for parity with the other variants
    # target attended by the pooled left context
    att_t_l = bilinear_attention_layer(hiddens_t, pool_l, sen_len_tr, 2 * FLAGS.n_hidden, l2, FLAGS.random_base, 'tl')
    outputs_t_l = tf.squeeze(tf.matmul(att_t_l, hiddens_t))
    # target attended by the pooled right context
    att_t_r = bilinear_attention_layer(hiddens_t, pool_r, sen_len_tr, 2 * FLAGS.n_hidden, l2, FLAGS.random_base, 'tr')
    outputs_t_r = tf.squeeze(tf.matmul(att_t_r, hiddens_t))
    # left context attended by the target-aware left representation
    att_l = bilinear_attention_layer(hiddens_l, outputs_t_l, sen_len_fw, 2 * FLAGS.n_hidden, l2, FLAGS.random_base, 'l')
    # BUG FIX: outputs_l was never computed although it is consumed by the
    # tf.concat below, which raised a NameError at graph-construction time.
    outputs_l = tf.squeeze(tf.matmul(att_l, hiddens_l))
    # right context attended by the target-aware right representation
    att_r = bilinear_attention_layer(hiddens_r, outputs_t_r, sen_len_bw, 2 * FLAGS.n_hidden, l2, FLAGS.random_base, 'r')
    outputs_r = tf.squeeze(tf.matmul(att_r, hiddens_r))
    # final representation: [left; right; target-left; target-right]
    outputs = tf.concat([outputs_l, outputs_r, outputs_t_l, outputs_t_r], 1)
    prob = softmax_layer(outputs, 8 * FLAGS.n_hidden, FLAGS.random_base, keep_prob2, l2, FLAGS.n_class)
    return prob, att_l, att_r, att_t_l, att_t_r
def compute_head(hiddens, pool, length, n_hidden, max_len, dim_head, random_base, l2_reg, id):
    """Project hidden states and a pooled query into one attention head.

    Both the per-token hidden states and the pooled query vector are mapped
    into a `dim_head`-dimensional subspace with separate learned matrices,
    then bilinear attention is computed in that subspace.

    Args:
        hiddens:     per-token hidden states, flattened/reshaped internally.
        pool:        pooled query vector attended against the hidden states.
        length:      true sequence lengths used to mask the attention.
        n_hidden:    dimensionality of the incoming hidden states.
        max_len:     padded sequence length.
        dim_head:    dimensionality of the head subspace.
        random_base: half-width of the uniform weight initialization.
        l2_reg:      L2 regularization coefficient for the projection weights.
        id:          suffix making the TF variable names unique.

    Returns:
        (att_q, outputs_q, hiddens_q): attention scores, the attended
        (squeezed) context vector, and the projected hidden states.
    """
    uniform_init = tf.random_uniform_initializer(-random_base, random_base)
    weight_decay = tf.contrib.layers.l2_regularizer(l2_reg)
    # projection for the hidden states
    w1 = tf.get_variable(name='head_w_hiddens' + str(id),
                         shape=[n_hidden, dim_head],
                         initializer=uniform_init,
                         regularizer=weight_decay)
    # projection for the pooled query
    w2 = tf.get_variable(name='head_w_pool' + str(id),
                         shape=[n_hidden, dim_head],
                         initializer=uniform_init,
                         regularizer=weight_decay)
    # flatten to 2-D, project, and restore the (batch, max_len, dim_head) layout
    flat = tf.reshape(hiddens, [-1, n_hidden])
    hiddens_q = tf.reshape(tf.matmul(flat, w1), [-1, max_len, dim_head])
    # project the pooled query into the same subspace
    pool_q = tf.matmul(pool, w2)
    # bilinear attention in the head subspace, then the attended context vector
    att_q = bilinear_attention_layer(hiddens_q, pool_q, length, dim_head, l2_reg, random_base, id)
    outputs_q = tf.squeeze(tf.matmul(att_q, hiddens_q))
    return att_q, outputs_q, hiddens_q
def lcr_rot(
        input_fw,
        input_bw,
        sen_len_fw,
        sen_len_bw,
        target,
        sen_len_tr,
        keep_prob1,
        keep_prob2,
        l2,
        _id='all',
):
    """LCR-Rot-hop variant V4: rotatory attention with hierarchical reweighting.

    Runs one initial rotatory-attention pass, reweights the four attended
    vectors with dot-product attention over [left;right] context and target
    pairs, then repeats the whole pass twice more (hops), feeding the
    reweighted vectors back in as queries.

    Args:
        input_fw/input_bw/target: left-context, right-context and target
            embeddings (dropout with keep_prob1 applied here).
        sen_len_fw/sen_len_bw/sen_len_tr: true lengths for masking.
        keep_prob1: dropout keep prob on the embedding inputs.
        keep_prob2: dropout keep prob inside the softmax layer.
        l2: L2 regularization coefficient.
        _id: suffix for unique TF variable names.

    Returns:
        (prob, att_l, att_r, att_t_l, att_t_r) — probabilities and the
        attention tensors from the LAST hop of the loop.
    """
    print('I am lcr_rot_alt-V4.')
    cell = tf.contrib.rnn.LSTMCell
    # left context: dropout -> BiLSTM -> length-masked mean pool
    input_fw = tf.nn.dropout(input_fw, keep_prob=keep_prob1)
    hiddens_l = bi_dynamic_rnn(cell, input_fw, FLAGS.n_hidden, sen_len_fw, FLAGS.max_sentence_len, 'l' + _id, 'all')
    pool_l = reduce_mean_with_len(hiddens_l, sen_len_fw)
    # right context: dropout -> BiLSTM -> length-masked mean pool
    input_bw = tf.nn.dropout(input_bw, keep_prob=keep_prob1)
    hiddens_r = bi_dynamic_rnn(cell, input_bw, FLAGS.n_hidden, sen_len_bw, FLAGS.max_sentence_len, 'r' + _id, 'all')
    pool_r = reduce_mean_with_len(hiddens_r, sen_len_bw)
    # target phrase: dropout -> BiLSTM -> length-masked mean pool
    target = tf.nn.dropout(target, keep_prob=keep_prob1)
    hiddens_t = bi_dynamic_rnn(cell, target, FLAGS.n_hidden, sen_len_tr, FLAGS.max_sentence_len, 't' + _id, 'all')
    pool_t = reduce_mean_with_len(hiddens_t, sen_len_tr)
    # left context attended by the pooled target
    # (*_init keeps the un-squeezed matmul result for the later reweighting matmuls)
    att_l = bilinear_attention_layer(hiddens_l, pool_t, sen_len_fw, 2 * FLAGS.n_hidden, l2, FLAGS.random_base, 'tl')
    outputs_t_l_init = tf.matmul(att_l, hiddens_l)
    outputs_t_l = tf.squeeze(outputs_t_l_init)
    # right context attended by the pooled target
    att_r = bilinear_attention_layer(hiddens_r, pool_t, sen_len_bw, 2 * FLAGS.n_hidden, l2, FLAGS.random_base, 'tr')
    outputs_t_r_init = tf.matmul(att_r, hiddens_r)
    outputs_t_r = tf.squeeze(outputs_t_r_init)
    # target attended by the left-context representation
    att_t_l = bilinear_attention_layer(hiddens_t, outputs_t_l, sen_len_tr, 2 * FLAGS.n_hidden, l2, FLAGS.random_base, 'l')
    outputs_l_init = tf.matmul(att_t_l, hiddens_t)
    outputs_l = tf.squeeze(outputs_l_init)
    # target attended by the right-context representation
    att_t_r = bilinear_attention_layer(hiddens_t, outputs_t_r, sen_len_tr, 2 * FLAGS.n_hidden, l2, FLAGS.random_base, 'r')
    outputs_r_init = tf.matmul(att_t_r, hiddens_t)
    outputs_r = tf.squeeze(outputs_r_init)
    # hierarchical step: dot-product attention reweights the context pair and
    # the target pair separately, then rescales each attended vector
    outputs_init_context = tf.concat([outputs_t_l_init, outputs_t_r_init], 1)
    outputs_init_target = tf.concat([outputs_l_init, outputs_r_init], 1)
    att_outputs_context = dot_produce_attention_layer(outputs_init_context, None, 2 * FLAGS.n_hidden, l2, FLAGS.random_base, 'fin1')
    att_outputs_target = dot_produce_attention_layer(outputs_init_target, None, 2 * FLAGS.n_hidden, l2, FLAGS.random_base, 'fin2')
    # index 0/1 selects the weight for the left/right member of each pair
    outputs_l = tf.squeeze(
        tf.matmul(tf.expand_dims(att_outputs_target[:, :, 0], 2), outputs_l_init))
    outputs_r = tf.squeeze(
        tf.matmul(tf.expand_dims(att_outputs_target[:, :, 1], 2), outputs_r_init))
    outputs_t_l = tf.squeeze(
        tf.matmul(tf.expand_dims(att_outputs_context[:, :, 0], 2), outputs_t_l_init))
    outputs_t_r = tf.squeeze(
        tf.matmul(tf.expand_dims(att_outputs_context[:, :, 1], 2), outputs_t_r_init))
    # two additional hops: identical structure, but the queries are the
    # reweighted vectors from the previous hop; str(i) keeps variable names unique
    for i in range(2):
        # context attended by the previous hop's target representations
        att_l = bilinear_attention_layer(hiddens_l, outputs_l, sen_len_fw, 2 * FLAGS.n_hidden, l2, FLAGS.random_base, 'tl' + str(i))
        outputs_t_l_init = tf.matmul(att_l, hiddens_l)
        outputs_t_l = tf.squeeze(outputs_t_l_init)
        att_r = bilinear_attention_layer(hiddens_r, outputs_r, sen_len_bw, 2 * FLAGS.n_hidden, l2, FLAGS.random_base, 'tr' + str(i))
        outputs_t_r_init = tf.matmul(att_r, hiddens_r)
        outputs_t_r = tf.squeeze(outputs_t_r_init)
        # target attended by the fresh context representations
        att_t_l = bilinear_attention_layer(hiddens_t, outputs_t_l, sen_len_tr, 2 * FLAGS.n_hidden, l2, FLAGS.random_base, 'l' + str(i))
        outputs_l_init = tf.matmul(att_t_l, hiddens_t)
        outputs_l = tf.squeeze(outputs_l_init)
        att_t_r = bilinear_attention_layer(hiddens_t, outputs_t_r, sen_len_tr, 2 * FLAGS.n_hidden, l2, FLAGS.random_base, 'r' + str(i))
        outputs_r_init = tf.matmul(att_t_r, hiddens_t)
        outputs_r = tf.squeeze(outputs_r_init)
        # per-hop hierarchical reweighting, same scheme as before the loop
        outputs_init_context = tf.concat([outputs_t_l_init, outputs_t_r_init], 1)
        outputs_init_target = tf.concat([outputs_l_init, outputs_r_init], 1)
        att_outputs_context = dot_produce_attention_layer(
            outputs_init_context, None, 2 * FLAGS.n_hidden, l2, FLAGS.random_base, 'fin1' + str(i))
        att_outputs_target = dot_produce_attention_layer(
            outputs_init_target, None, 2 * FLAGS.n_hidden, l2, FLAGS.random_base, 'fin2' + str(i))
        outputs_l = tf.squeeze(
            tf.matmul(tf.expand_dims(att_outputs_target[:, :, 0], 2), outputs_l_init))
        outputs_r = tf.squeeze(
            tf.matmul(tf.expand_dims(att_outputs_target[:, :, 1], 2), outputs_r_init))
        outputs_t_l = tf.squeeze(
            tf.matmul(tf.expand_dims(att_outputs_context[:, :, 0], 2), outputs_t_l_init))
        outputs_t_r = tf.squeeze(
            tf.matmul(tf.expand_dims(att_outputs_context[:, :, 1], 2), outputs_t_r_init))
    # classify on the concatenation of all four attended vectors
    outputs_fin = tf.concat([outputs_l, outputs_r, outputs_t_l, outputs_t_r], 1)
    prob = softmax_layer(outputs_fin, 8 * FLAGS.n_hidden, FLAGS.random_base, keep_prob2, l2, FLAGS.n_class)
    return prob, att_l, att_r, att_t_l, att_t_r
def lcr_rot(n_asp, input_fw, input_bw, sen_len_fw, sen_len_bw, target, sen_len_tr, keep_prob1, keep_prob2, l2, _id='all'):
    """LCR-Rot-alt with sentence-level aggregation over aspects.

    Standard rotatory attention (target->context, then context->target) plus
    two extra hops, followed by aggregation of aspect-level probabilities
    into per-sentence probabilities using the aspect counts in `n_asp`.

    Args:
        n_asp: 1-D int tensor; number of aspects per sentence. The rows of
            the batch are assumed to be grouped by sentence in this order.
        input_fw/input_bw/target: left, right and target embeddings
            (dropout with keep_prob1 applied here).
        sen_len_fw/sen_len_bw/sen_len_tr: true lengths for masking.
        keep_prob1: dropout keep prob on embedding inputs.
        keep_prob2: dropout keep prob in the softmax layer.
        l2: L2 regularization coefficient.
        _id: suffix for unique TF variable names.

    Returns:
        (prob, prob_sen, outputs, att_l, att_r, att_t_l, att_t_r):
        aspect-level probabilities, sentence-level aggregated probabilities,
        the final feature vector, and the last hop's attention tensors.
    """
    print('I am lcr_rot_alt.')
    cell = tf.contrib.rnn.LSTMCell
    # left context: dropout -> BiLSTM -> length-masked mean pool
    input_fw = tf.nn.dropout(input_fw, keep_prob=keep_prob1)
    hiddens_l = bi_dynamic_rnn(cell, input_fw, FLAGS.n_hidden, sen_len_fw, FLAGS.max_sentence_len, 'l' + _id, 'all')
    pool_l = reduce_mean_with_len(hiddens_l, sen_len_fw)
    # right context: dropout -> BiLSTM -> length-masked mean pool
    input_bw = tf.nn.dropout(input_bw, keep_prob=keep_prob1)
    hiddens_r = bi_dynamic_rnn(cell, input_bw, FLAGS.n_hidden, sen_len_bw, FLAGS.max_sentence_len, 'r' + _id, 'all')
    pool_r = reduce_mean_with_len(hiddens_r, sen_len_bw)
    # target phrase: dropout -> BiLSTM -> length-masked mean pool
    target = tf.nn.dropout(target, keep_prob=keep_prob1)
    hiddens_t = bi_dynamic_rnn(cell, target, FLAGS.n_hidden, sen_len_tr, FLAGS.max_sentence_len, 't' + _id, 'all')
    pool_t = reduce_mean_with_len(hiddens_t, sen_len_tr)
    # left context attended by the pooled target
    att_l = bilinear_attention_layer(hiddens_l, pool_t, sen_len_fw, 2 * FLAGS.n_hidden, l2, FLAGS.random_base, 'tl')
    outputs_t_l = tf.squeeze(tf.matmul(att_l, hiddens_l))
    # right context attended by the pooled target
    att_r = bilinear_attention_layer(hiddens_r, pool_t, sen_len_bw, 2 * FLAGS.n_hidden, l2, FLAGS.random_base, 'tr')
    outputs_t_r = tf.squeeze(tf.matmul(att_r, hiddens_r))
    # target attended by the left-context representation
    att_t_l = bilinear_attention_layer(hiddens_t, outputs_t_l, sen_len_tr, 2 * FLAGS.n_hidden, l2, FLAGS.random_base, 'l')
    outputs_l = tf.squeeze(tf.matmul(att_t_l, hiddens_t))
    # target attended by the right-context representation
    att_t_r = bilinear_attention_layer(hiddens_t, outputs_t_r, sen_len_tr, 2 * FLAGS.n_hidden, l2, FLAGS.random_base, 'r')
    outputs_r = tf.squeeze(tf.matmul(att_t_r, hiddens_t))
    # two extra hops; NOTE(review): the context attention here re-uses pool_t
    # as the query each hop (unlike the V4 variant which feeds outputs back) —
    # presumably intentional for this variant, but worth confirming
    for i in range(2):
        att_l = bilinear_attention_layer(hiddens_l, pool_t, sen_len_fw, 2 * FLAGS.n_hidden, l2, FLAGS.random_base, 'tl' + str(i))
        outputs_t_l = tf.squeeze(tf.matmul(att_l, hiddens_l))
        att_r = bilinear_attention_layer(hiddens_r, pool_t, sen_len_bw, 2 * FLAGS.n_hidden, l2, FLAGS.random_base, 'tr' + str(i))
        outputs_t_r = tf.squeeze(tf.matmul(att_r, hiddens_r))
        # target attended by the refreshed context representations
        att_t_l = bilinear_attention_layer(hiddens_t, outputs_t_l, sen_len_tr, 2 * FLAGS.n_hidden, l2, FLAGS.random_base, 'l' + str(i))
        outputs_l = tf.squeeze(tf.matmul(att_t_l, hiddens_t))
        att_t_r = bilinear_attention_layer(hiddens_t, outputs_t_r, sen_len_tr, 2 * FLAGS.n_hidden, l2, FLAGS.random_base, 'r' + str(i))
        outputs_r = tf.squeeze(tf.matmul(att_t_r, hiddens_t))
    # aspect-level classification on the concatenated attended vectors
    outputs = tf.concat([outputs_l, outputs_r, outputs_t_l, outputs_t_r], 1)
    prob = softmax_layer(outputs, 8 * FLAGS.n_hidden, FLAGS.random_base, keep_prob2, l2, FLAGS.n_class)
    # sentence-level aggregation: `begin[i]` is the exclusive prefix sum of
    # n_asp, i.e. the row offset where sentence i's aspects start
    asp_size = tf.size(n_asp)
    begin = tf.map_fn(lambda x: tf.math.reduce_sum(n_asp[:x], 0), tf.range(asp_size), tf.int32)
    # sum each sentence's aspect probabilities and clip into [0, 1]
    prob_sen = tf.map_fn(
        lambda i: tf.clip_by_value(
            tf.reduce_sum(tf.slice(prob, [begin[i], 0], [n_asp[i], FLAGS.n_class]), axis=0),
            clip_value_min=0., clip_value_max=1.),
        tf.range(asp_size),
        dtype=tf.float32)
    return prob, prob_sen, outputs, att_l, att_r, att_t_l, att_t_r
def lcr_rot(input_fw, input_bw, sen_len_fw, sen_len_bw, target, sen_len_tr, keep_prob1, keep_prob2, l2, _id='all'):
    """LCR-Rot variant "Trival2021 model 1".

    First attends the target by the pooled contexts and the contexts by the
    pooled target, then runs a second pass ('l5'/'r5'/'tl5'/'tr5') using the
    first pass's outputs as queries, reweights left-side and right-side pairs
    with dot-product attention, and finishes with one extra hop.

    Args:
        input_fw/input_bw/target: left, right and target embeddings
            (dropout with keep_prob1 applied here).
        sen_len_fw/sen_len_bw/sen_len_tr: true lengths for masking.
        keep_prob1: dropout keep prob on embedding inputs.
        keep_prob2: dropout keep prob in the softmax layer.
        l2: L2 regularization coefficient.
        _id: suffix for unique TF variable names.

    Returns:
        (prob, att_l, att_r, att_t_l, att_t_r): class probabilities and the
        last hop's attention tensors.
    """
    print('I am a new lcr_rot_alt. Trival2021 model 1')
    cell = tf.contrib.rnn.LSTMCell
    # left hidden: dropout -> BiLSTM -> length-masked mean pool
    input_fw = tf.nn.dropout(input_fw, keep_prob=keep_prob1)
    hiddens_l = bi_dynamic_rnn(cell, input_fw, FLAGS.n_hidden, sen_len_fw, FLAGS.max_sentence_len, 'l' + _id, 'all')
    pool_l = reduce_mean_with_len(hiddens_l, sen_len_fw)
    # right hidden: dropout -> BiLSTM -> length-masked mean pool
    input_bw = tf.nn.dropout(input_bw, keep_prob=keep_prob1)
    hiddens_r = bi_dynamic_rnn(cell, input_bw, FLAGS.n_hidden, sen_len_bw, FLAGS.max_sentence_len, 'r' + _id, 'all')
    pool_r = reduce_mean_with_len(hiddens_r, sen_len_bw)
    # target hidden: dropout -> BiLSTM -> length-masked mean pool
    target = tf.nn.dropout(target, keep_prob=keep_prob1)
    hiddens_t = bi_dynamic_rnn(cell, target, FLAGS.n_hidden, sen_len_tr, FLAGS.max_sentence_len, 't' + _id, 'all')
    pool_t = reduce_mean_with_len(hiddens_t, sen_len_tr)
    # ---- first pass: pooled vectors as queries (the *_org results seed pass two) ----
    # target attended by the pooled left context
    att_t_l = bilinear_attention_layer(hiddens_t, pool_l, sen_len_tr, 2 * FLAGS.n_hidden, l2, FLAGS.random_base, 'l')
    outputs_l_init = tf.matmul(att_t_l, hiddens_t)
    outputs_l_org = tf.squeeze(outputs_l_init)
    # target attended by the pooled right context
    att_t_r = bilinear_attention_layer(hiddens_t, pool_r, sen_len_tr, 2 * FLAGS.n_hidden, l2, FLAGS.random_base, 'r')
    outputs_r_init = tf.matmul(att_t_r, hiddens_t)
    outputs_r_org = tf.squeeze(outputs_r_init)
    # left context attended by the pooled target
    att_l = bilinear_attention_layer(hiddens_l, pool_t, sen_len_fw, 2 * FLAGS.n_hidden, l2, FLAGS.random_base, 'tl')
    outputs_t_l_init = tf.matmul(att_l, hiddens_l)
    outputs_t_l_org = tf.squeeze(outputs_t_l_init)
    # right context attended by the pooled target
    att_r = bilinear_attention_layer(hiddens_r, pool_t, sen_len_bw, 2 * FLAGS.n_hidden, l2, FLAGS.random_base, 'tr')
    outputs_t_r_init = tf.matmul(att_r, hiddens_r)
    outputs_t_r_org = tf.squeeze(outputs_t_r_init)
    # ---- second pass: first-pass outputs as queries (variable suffix 5) ----
    # target attended by the left-context representation
    att_t_l = bilinear_attention_layer(hiddens_t, outputs_t_l_org, sen_len_tr, 2 * FLAGS.n_hidden, l2, FLAGS.random_base,
                                       'l5')
    outputs_l_init = tf.matmul(att_t_l, hiddens_t)
    outputs_l = tf.squeeze(outputs_l_init)
    # target attended by the right-context representation
    att_t_r = bilinear_attention_layer(hiddens_t, outputs_t_r_org, sen_len_tr, 2 * FLAGS.n_hidden, l2, FLAGS.random_base, 'r5')
    outputs_r_init = tf.matmul(att_t_r, hiddens_t)
    outputs_r = tf.squeeze(outputs_r_init)
    # left context attended by the target-left representation
    att_l = bilinear_attention_layer(hiddens_l, outputs_l_org, sen_len_fw, 2 * FLAGS.n_hidden, l2, FLAGS.random_base, 'tl5')
    outputs_t_l_init = tf.matmul(att_l, hiddens_l)
    outputs_t_l = tf.squeeze(outputs_t_l_init)
    # right context attended by the target-right representation
    att_r = bilinear_attention_layer(hiddens_r, outputs_r_org, sen_len_bw, 2 * FLAGS.n_hidden, l2, FLAGS.random_base, 'tr5')
    outputs_t_r_init = tf.matmul(att_r, hiddens_r)
    outputs_t_r = tf.squeeze(outputs_t_r_init)
    # ---- pairwise reweighting: left-side pair (target-left vs context-left) ----
    outputs_init_1 = tf.concat([outputs_l_init, outputs_t_l_init], 1)
    att_outputs_1 = dot_produce_attention_layer(outputs_init_1, None, 2 * FLAGS.n_hidden, l2, FLAGS.random_base, 'fin_aoa2')
    outputs_l = tf.squeeze(tf.matmul(tf.expand_dims(att_outputs_1[:,:,0], 2), outputs_l_init))
    #outputs_r = tf.squeeze(tf.matmul(tf.expand_dims(att_outputs[:,:,1], 2), outputs_r_init))
    outputs_t_l = tf.squeeze(tf.matmul(tf.expand_dims(att_outputs_1[:,:,1], 2), outputs_t_l_init))
    #outputs_t_r = tf.squeeze(tf.matmul(tf.expand_dims(att_outputs[:,:,3], 2), outputs_t_r_init))
    # ---- pairwise reweighting: right-side pair (target-right vs context-right) ----
    outputs_init_2 = tf.concat([outputs_r_init, outputs_t_r_init], 1)
    att_outputs_2 = dot_produce_attention_layer(outputs_init_2, None, 2 * FLAGS.n_hidden, l2, FLAGS.random_base, 'fin_aoar')
    outputs_r = tf.squeeze(tf.matmul(tf.expand_dims(att_outputs_2[:,:,0], 2), outputs_r_init))
    #outputs_r = tf.squeeze(tf.matmul(tf.expand_dims(att_outputs[:,:,1], 2), outputs_r_init))
    outputs_t_r = tf.squeeze(tf.matmul(tf.expand_dims(att_outputs_2[:,:,1], 2), outputs_t_r_init))
    #outputs_t_r = tf.squeeze(tf.matmul(tf.expand_dims(att_outputs[:,:,3], 2), outputs_t_r_init))
    # ---- one extra hop; the triple-quoted block below is disabled code kept by the authors ----
    for i in range(1):
        '''
        # attention left
        att_t_l = bilinear_attention_layer(hiddens_t, outputs_t_l,
                                           sen_len_tr, 2 * FLAGS.n_hidden, l2, FLAGS.random_base, 'l'+str(i))
        outputs_l_init = tf.matmul(att_t_l, hiddens_t)
        outputs_l = tf.squeeze(outputs_l_init)
        # attention right
        att_t_r = bilinear_attention_layer(hiddens_t, outputs_t_r,
                                           sen_len_tr, 2 * FLAGS.n_hidden, l2, FLAGS.random_base, 'r'+str(i))
        outputs_r_init = tf.matmul(att_t_r, hiddens_t)
        outputs_r = tf.squeeze(outputs_r_init)
        '''
        # context attended by the reweighted target representations
        att_l = bilinear_attention_layer(hiddens_l, outputs_l, sen_len_fw, 2 * FLAGS.n_hidden, l2, FLAGS.random_base, 'tl'+str(i))
        outputs_t_l_init = tf.matmul(att_l, hiddens_l)
        outputs_t_l = tf.squeeze(outputs_t_l_init)
        att_r = bilinear_attention_layer(hiddens_r, outputs_r, sen_len_bw, 2 * FLAGS.n_hidden, l2, FLAGS.random_base, 'tr'+str(i))
        outputs_t_r_init = tf.matmul(att_r, hiddens_r)
        outputs_t_r = tf.squeeze(outputs_t_r_init)
        #print(outputs_t_r.shape)
        # target attended by the refreshed context representations
        att_t_l = bilinear_attention_layer(hiddens_t, outputs_t_l, sen_len_tr, 2 * FLAGS.n_hidden, l2, FLAGS.random_base, 'l'+str(i))
        outputs_l_init = tf.matmul(att_t_l, hiddens_t)
        outputs_l = tf.squeeze(outputs_l_init)
        att_t_r = bilinear_attention_layer(hiddens_t, outputs_t_r, sen_len_tr, 2 * FLAGS.n_hidden, l2, FLAGS.random_base, 'r'+str(i))
        outputs_r_init = tf.matmul(att_t_r, hiddens_t)
        outputs_r = tf.squeeze(outputs_r_init)
    # classify on the concatenation of all four attended vectors
    outputs = tf.concat([outputs_l, outputs_r, outputs_t_l, outputs_t_r], 1)
    prob = softmax_layer(outputs, 8 * FLAGS.n_hidden, FLAGS.random_base, keep_prob2, l2, FLAGS.n_class)
    return prob, att_l, att_r, att_t_l, att_t_r