Example #1
    def __init__(self, num_classes: int, input_dim: int,
                 output_dim: int) -> None:
        super().__init__()
        self.embedder = Embedding(num_classes, input_dim)
        self.decoder_cell = GRUCell(input_dim, output_dim)
        self.output_projection_layer = Linear(output_dim, num_classes)
        self.recall = UnigramRecall()
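The snippet above only wires the modules together. For context, here is a minimal, illustrative sketch of one decoding step with those three modules; the concrete sizes (100 classes, 32/64 dims) and tensor names are assumptions, not from the source:

import torch
from torch.nn import Embedding, GRUCell, Linear

embedder = Embedding(100, 32)              # num_classes=100, input_dim=32 (assumed)
decoder_cell = GRUCell(32, 64)             # input_dim=32, output_dim=64 (assumed)
output_projection_layer = Linear(64, 100)

prev_tokens = torch.randint(0, 100, (8,))  # previous predictions for a batch of 8
hidden = torch.zeros(8, 64)                # decoder hidden state
embedded = embedder(prev_tokens)           # (8, 32)
hidden = decoder_cell(embedded, hidden)    # (8, 64)
logits = output_projection_layer(hidden)   # (8, 100) scores over the vocabulary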
Example #2
    def __init__(self,
                 input_dim,
                 latent_dim,
                 device,
                 concat_mask=False,
                 obsrv_std=0.1,
                 use_binary_classif=False,
                 linear_classifier=False,
                 classif_per_tp=False,
                 input_space_decay=False,
                 cell="gru",
                 n_units=100,
                 n_labels=1,
                 train_classif_w_reconstr=False):

        super(Classic_RNN,
              self).__init__(input_dim,
                             latent_dim,
                             device,
                             obsrv_std=obsrv_std,
                             use_binary_classif=use_binary_classif,
                             classif_per_tp=classif_per_tp,
                             linear_classifier=linear_classifier,
                             n_labels=n_labels,
                             train_classif_w_reconstr=train_classif_w_reconstr)

        self.concat_mask = concat_mask

        encoder_dim = int(input_dim)
        if concat_mask:
            encoder_dim = encoder_dim * 2

        self.decoder = nn.Sequential(
            nn.Linear(latent_dim, n_units),
            nn.Tanh(),
            nn.Linear(n_units, input_dim),
        )

        #utils.init_network_weights(self.encoder)
        utils.init_network_weights(self.decoder)

        if cell == "gru":
            self.rnn_cell = GRUCell(encoder_dim + 1,
                                    latent_dim)  # +1 for delta t
        elif cell == "expdecay":
            self.rnn_cell = GRUCellExpDecay(input_size=encoder_dim,
                                            input_size_for_decay=input_dim,
                                            hidden_size=latent_dim,
                                            device=device)
        else:
            raise Exception("Unknown RNN cell: {}".format(cell))

        if input_space_decay:
            # Parameter(...).to(device) returns a plain tensor that would not be
            # registered with the module, so create the parameters on the target
            # device directly (initialized to zeros here).
            self.w_input_decay = Parameter(
                torch.zeros(1, int(input_dim), device=device))
            self.b_input_decay = Parameter(
                torch.zeros(1, int(input_dim), device=device))
        self.input_space_decay = input_space_decay

        self.z0_net = lambda hidden_state: hidden_state
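The "+1 for delta t" comment means each GRU input is an observation with its time gap appended (and, when concat_mask is set, the observation mask as well, which is why encoder_dim doubles). A minimal sketch of that input assembly, with shapes assumed for illustration:

import torch

x = torch.randn(4, 10)                       # (batch, input_dim), assumed sizes
delta_t = torch.full((4, 1), 0.5)            # (batch, 1) time gap per example
rnn_input = torch.cat([x, delta_t], dim=-1)  # (batch, input_dim + 1) -> GRUCell(encoder_dim + 1, latent_dim)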
Example #3
    def __init__(self,
                 vocab: Vocabulary,
                 token_embedder: TextFieldEmbedder,
                 document_encoder: Seq2VecEncoder,
                 utterance_encoder: Seq2VecEncoder,
                 context_encoder: Seq2SeqEncoder,
                 beam_size: int = None,
                 max_decoding_steps: int = 50,
                 scheduled_sampling_ratio: float = 0.,
                 use_bleu: bool = True) -> None:
        super(MultiTurnHred, self).__init__(vocab)
        self._scheduled_sampling_ratio = scheduled_sampling_ratio

        # We need the start symbol to provide as the input at the first timestep of decoding, and
        # end symbol as a way to indicate the end of the decoded sequence.
        self._start_index = self.vocab.get_token_index(START_SYMBOL)
        self._end_index = self.vocab.get_token_index(END_SYMBOL)

        if use_bleu:
            pad_index = self.vocab.get_token_index(self.vocab._padding_token)  # pylint: disable=protected-access
            self._bleu = BLEU(exclude_indices={pad_index, self._end_index, self._start_index})
        else:
            self._bleu = None

        # At prediction time, we use a beam search to find the most likely sequence of target tokens.
        self._beam_size = beam_size or 1
        self._max_decoding_steps = max_decoding_steps
        self._beam_search = BeamSearch(self._end_index, max_steps=max_decoding_steps, beam_size=self._beam_size)

        # Dense embedding of word level tokens.
        self._token_embedder = token_embedder

        # Document word level encoder.
        self._document_encoder = document_encoder

        # Dialogue word level encoder.
        self._utterance_encoder = utterance_encoder

        # Sentence level encoder.
        self._context_encoder = context_encoder

        num_classes = self.vocab.get_vocab_size()

        document_output_dim = self._document_encoder.get_output_dim()
        utterance_output_dim = self._utterance_encoder.get_output_dim()
        context_output_dim = self._context_encoder.get_output_dim()
        decoder_output_dim = utterance_output_dim
        decoder_input_dim = token_embedder.get_output_dim() + document_output_dim + context_output_dim

        # We'll use a GRU cell as the recurrent cell that produces a hidden state
        # for the decoder at each time step.
        # TODO (pradeep): Do not hardcode decoder cell type.
        self._decoder_cell = GRUCell(decoder_input_dim, decoder_output_dim)

        # We project the hidden state from the decoder into the output vocabulary space
        # in order to get log probabilities of each target token, at each time step.
        self._output_projection_layer = Linear(decoder_output_dim, num_classes)
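The decoder input dimension above implies that, at each step, the previous token's embedding is concatenated with the document and context encodings before entering the GRU cell. A hedged sketch of that step (tensor names and sizes assumed, not from the source):

import torch

batch, embed_dim, doc_dim, ctx_dim = 4, 32, 64, 64   # assumed sizes
embedded_prev = torch.randn(batch, embed_dim)
document_encoding = torch.randn(batch, doc_dim)
context_encoding = torch.randn(batch, ctx_dim)
decoder_input = torch.cat(
    [embedded_prev, document_encoding, context_encoding], dim=-1)
# decoder_input.shape[-1] matches decoder_input_dim as computed above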
Example #4
    def __init__(self, input_size, hidden_size, num_layers=1, dropout=0.0):
        super(StackedGRU, self).__init__()
        self.dropout = nn.Dropout(dropout)
        self.num_layers = num_layers
        self.layers = nn.ModuleList()

        # After the first cell, each layer's input is the previous hidden state.
        for _ in range(num_layers):
            self.layers.append(GRUCell(input_size, hidden_size))
            input_size = hidden_size
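The constructor only builds the cell stack; the forward pass is not shown here. A minimal sketch of how such a stack is typically stepped for a single timestep, applying dropout between layers (an assumption based on the stored nn.Dropout; the function name is illustrative):

import torch
from torch.nn import GRUCell, Dropout, ModuleList

def step(layers: ModuleList, dropout: Dropout, x, hiddens):
    # x: (batch, input_size); hiddens: one (batch, hidden_size) tensor per layer.
    new_hiddens = []
    for i, cell in enumerate(layers):
        h = cell(x, hiddens[i])
        new_hiddens.append(h)
        x = dropout(h) if i + 1 < len(layers) else h  # no dropout after the top layer
    return x, new_hiddens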
Example #5
    def __init__(self, name: str, event2mind: Event2Mind, num_classes: int,
                 input_dim: int, output_dim: int) -> None:
        self.embedder = Embedding(num_classes, input_dim)
        event2mind.add_module(f"{name}_embedder", self.embedder)
        self.decoder_cell = GRUCell(input_dim, output_dim)
        event2mind.add_module(f"{name}_decoder_cell", self.decoder_cell)
        self.output_projection_layer = Linear(output_dim, num_classes)
        event2mind.add_module(f"{name}_output_project_layer",
                              self.output_projection_layer)
        self.recall = UnigramRecall()
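Unlike Example #1, this helper is not an nn.Module itself, so it calls add_module to register each piece on the parent model; that is what makes the parameters visible to the parent's optimizer. A tiny illustrative check (the module name here is made up):

import torch.nn as nn
from torch.nn import GRUCell

parent = nn.Module()                      # stands in for the Event2Mind model
cell = GRUCell(32, 64)
parent.add_module("demo_decoder_cell", cell)
assert len(list(parent.parameters())) == len(list(cell.parameters()))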
Example #6
    def __init__(self, opt):
        super(BootDecoder, self).__init__()
        self.opt = opt
        self.rnn_step = opt['rnn_step']
        self.dropout = opt['dropout']
        self.seed_count = opt['seed_count']
        self.ave_method = opt['ave_method']
        self.min_match = max(1, opt['min_match'])
        self.layers = nn.ModuleList()
        self.n_class, self.n_feature = opt['num_class'], opt['num_feature']
        self.rnn_cell = GRUCell(self.n_feature, self.n_feature)
        self.layer_norm = nn.LayerNorm(self.n_feature)
        self.dev = False
Example #7
File: model.py Project: dtak/mbrl-smdp-ode
    def __init__(self, input_dim, latent_dim, eps_decay, encoder_z0, decoder, timer, z0_prior, device):
        super(VAEGRU, self).__init__(input_dim, latent_dim, eps_decay, encoder_z0, decoder, timer, z0_prior, device)
        self.gru_cell = GRUCell(input_dim, latent_dim).to(device)
Example #8
File: model.py Project: dtak/mbrl-smdp-ode
    def __init__(self, input_dim, latent_dim, eps_decay, decoder, diffeq_solver, timer, device):
        super(ODEGRU, self).__init__(input_dim, latent_dim, eps_decay, decoder, timer, device)
        self.diffeq_solver = diffeq_solver
        self.gru_cell = GRUCell(input_dim, latent_dim).to(device)
Example #9
File: model.py Project: dtak/mbrl-smdp-ode
    def __init__(self, input_dim, latent_dim, eps_decay, decoder, timer, device):
        super(ExpDecayGRU, self).__init__(input_dim, latent_dim, eps_decay, decoder, timer, device)
        self.gru_cell = GRUCell(input_dim, latent_dim).to(device)
        self.decay_layer = nn.Linear(1, 1).to(device)
Example #10
File: model.py Project: dtak/mbrl-smdp-ode
    def __init__(self, input_dim, latent_dim, eps_decay, decoder, timer, device):
        super(DeltaTGRU, self).__init__(input_dim, latent_dim, eps_decay, decoder, timer, device)
        # +1 dim for time gaps
        self.input_dim = input_dim + 1
        self.gru_cell = GRUCell(input_dim + 1, latent_dim).to(device)
Example #11
File: model.py Project: dtak/mbrl-smdp-ode
    def __init__(self, input_dim, latent_dim, eps_decay, decoder, timer, device):
        super(VanillaGRU, self).__init__(input_dim, latent_dim, eps_decay, decoder, timer, device)
        self.gru_cell = GRUCell(input_dim, latent_dim)
Example #12
    def __init__(self,
                 vocab: Vocabulary,
                 source_embedder: TextFieldEmbedder,
                 target_namespace: str,
                 encoder: Seq2SeqEncoder,
                 decoder: Dict,
                 max_decoding_steps: int,
                 target_embedding_dim: int = None,
                 attention: Dict = None,
                 beam_size: int = None,
                 scheduled_sampling_ratio: float = 0.,
                 use_bleu: bool = True,
                 visualize_attention: bool = True) -> None:
        super(NmtSeq2Seq, self).__init__(vocab)

        self._scheduled_sampling_ratio = scheduled_sampling_ratio
        self._target_namespace = target_namespace
        # We need the start symbol to provide as the input at the first timestep of decoding, and
        # end symbol as a way to indicate the end of the decoded sequence.
        self._start_index = self.vocab.get_token_index(START_SYMBOL,
                                                       self._target_namespace)
        self._end_index = self.vocab.get_token_index(END_SYMBOL,
                                                     self._target_namespace)

        if use_bleu:
            pad_index = self.vocab.get_token_index(self.vocab._padding_token,
                                                   self._target_namespace)  # pylint: disable=protected-access
            self._bleu = BLEU(exclude_indices={
                pad_index, self._end_index, self._start_index
            })
        else:
            self._bleu = None

        # At prediction time, we use a beam search to find the most likely sequence of target tokens.
        beam_size = beam_size or 1
        self._max_decoding_steps = max_decoding_steps
        self._beam_search = BeamSearch(self._end_index,
                                       max_steps=max_decoding_steps,
                                       beam_size=beam_size)

        # Dense embedding of source vocab tokens.
        self._source_embedder = source_embedder

        # Encodes the sequence of source embeddings into a sequence of hidden states.
        self._encoder = encoder

        num_classes = self.vocab.get_vocab_size(self._target_namespace)

        # Attention mechanism params applied to the encoder output for each step.
        self._attention = attention

        self._visualize_attention = visualize_attention

        # Dense embedding of vocab words in the target space.
        target_embedding_dim = (target_embedding_dim
                                or source_embedder.get_output_dim())
        self._target_embedder = Embedding(num_classes, target_embedding_dim)

        # Decoder output dim needs to be the same as the encoder output dim since we initialize the
        # hidden state of the decoder with the final hidden state of the encoder.
        self._encoder_output_dim = self._encoder.get_output_dim()
        # self._decoder_output_dim = self._encoder_output_dim

        self._decoder_input_dim = decoder["input_size"]
        # If using attention make sure the .jsonnet params reflect this architecture:
        # input_to_decoder_rnn = [prev_word + attended_context_vector]
        self._decoder_output_dim = decoder['hidden_size']

        # We'll use an RNN cell as the recurrent cell that produces a hidden state
        # for the decoder at each time step.
        decoder_cell_type = decoder["type"]

        if decoder_cell_type == "gru":
            self._decoder_cell = GRUCell(self._decoder_input_dim,
                                         self._decoder_output_dim)
        elif decoder_cell_type == "lstm":
            self._decoder_cell = LSTMCell(self._decoder_input_dim,
                                          self._decoder_output_dim)
        else:
            raise ValueError(
                "Dialogue encoder of type {} not supported yet!".format(
                    decoder_cell_type))

        # We project the hidden state from the decoder into the output vocabulary space
        # in order to get log probabilities of each target token, at each time step.
        self._output_projection_layer = Linear(self._decoder_output_dim,
                                               num_classes)
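A practical detail behind the gru/lstm branch: torch.nn.GRUCell returns a single hidden tensor, while torch.nn.LSTMCell returns a (hidden, cell-state) tuple, so the decoding loop has to unpack them differently. A minimal sketch with assumed sizes:

import torch
from torch.nn import GRUCell, LSTMCell

x = torch.randn(2, 8)                        # (batch, decoder_input_dim), assumed
gru = GRUCell(8, 16)
h = gru(x, torch.zeros(2, 16))               # single hidden tensor

lstm = LSTMCell(8, 16)
h, c = lstm(x, (torch.zeros(2, 16), torch.zeros(2, 16)))  # tuple of hidden and cell state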
Example #13
    def __init__(self, input_embedding: InputEmbedding,
                 config: CopyNetConfig) -> None:
        super().__init__()

        self.data_len = config.data_len
        # Encoding modules.
        self._encoder = PytorchSeq2SeqWrapper(
            torch.nn.GRU(input_size=config.hidden,
                         hidden_size=config.encoder_GRU_hidden,
                         num_layers=config.encoder_layers,
                         bidirectional=True,
                         batch_first=True))
        # Embedding modules.
        self.input_embed = input_embedding
        # Decoder output dim needs to be the same as the encoder output dim since we initialize the
        # hidden state of the decoder with the final hidden state of the encoder.
        # We arbitrarily set the decoder's input dimension to be the same as the output dimension.
        self.encoder_output_dim = config.encoder_GRU_hidden * 2
        self.decoder_input_dim = config.decoder_hidden_size
        self.decoder_output_dim = config.decoder_GRU_hidden

        # Reduce dimensionality of encoder output to reduce the number of decoder parameters.
        self.encoder_output_projection = Linear(self.encoder_output_dim,
                                                self.decoder_output_dim)

        # The decoder input will be a function of the embedding of the previous predicted token,
        # an attended encoder hidden state called the "attentive read", and another
        # weighted sum of the encoder hidden state called the "selective read".
        # While the weights for the attentive read are calculated by an `Attention` module,
        # the weights for the selective read are simply the predicted probabilities
        # corresponding to each token in the source sentence that matches the target
        # token from the previous timestep.
        self._attention = LinearAttention(
            self.decoder_output_dim,
            self.decoder_output_dim,
            activation=Activation.by_name('tanh')())
        # decoder_output_dim * 2: the attentive read plus the selective read.
        self._input_projection_layer = Linear(
            config.feature_dim + self.decoder_output_dim * 2,
            self.decoder_input_dim)

        # We then run the projected decoder input through a GRU cell to produce
        # the next hidden state.
        self._decoder_cell = GRUCell(self.decoder_input_dim,
                                     self.decoder_output_dim)
        self._command_token_size = config.num_cmd_tokens

        # We create a "generation" score for each token in the target vocab
        # with a linear projection of the decoder hidden state.
        self._output_generation_layer_1 = Linear(self.decoder_output_dim,
                                                 self._command_token_size)
        self._output_generation_layer_2 = Linear(self.decoder_output_dim,
                                                 self._command_token_size)

        # We create a "copying" score for each source token by applying a non-linearity
        # (tanh) to a linear projection of the encoded hidden state for that token,
        # and then taking the dot product of the result with the decoder hidden state.
        self._output_copying_layer_1 = Linear(self.decoder_output_dim,
                                              self.decoder_output_dim)
        self._output_copying_layer_2 = Linear(self.decoder_output_dim,
                                              self.decoder_output_dim)

        self._softmax = nn.LogSoftmax(dim=-1)
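The copying-score comment above describes a concrete computation: project each encoded source token, apply tanh, then dot the result with the decoder hidden state. A hedged sketch of that score (shapes and names assumed for illustration):

import torch
from torch.nn import Linear

batch, src_len, dec_dim = 2, 7, 16                  # assumed sizes
encoder_out = torch.randn(batch, src_len, dec_dim)  # projected encoder states
decoder_h = torch.randn(batch, dec_dim)
copy_layer = Linear(dec_dim, dec_dim)               # stands in for _output_copying_layer_1

projected = torch.tanh(copy_layer(encoder_out))                          # (batch, src_len, dec_dim)
copy_scores = torch.bmm(projected, decoder_h.unsqueeze(-1)).squeeze(-1)  # (batch, src_len)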
Example #14
    def __init__(self, dim, attented=True, dropout=0.):
        super(MemoryLayer, self).__init__()
        self.combine_layer = CombineLayer(dim, dim // 2, dropout=dropout)
        self.memory_cell = GRUCell(dim, dim)
        self.attented = attented