Example #1
import numpy as np
import torch
import torch.nn as nn
from torchcrf import CRF
from transformers import BertModel


class opinionBERT(nn.Module):
    def __init__(self, bert_name: str, num_labels: int, num_layers: int,
                 hidden_size: int, dropout_prob: float, rnn_type: str,
                 bidirectional: bool, use_crf: bool, freeze_bert: bool):

        super().__init__()
        self.bert = BertModel.from_pretrained(bert_name)
        if freeze_bert:
            for param in self.bert.parameters():
                param.requires_grad = False
        if num_layers > 0:
            if rnn_type == "gru":
                self.rnn = nn.GRU(self.bert.config.hidden_size,
                                  hidden_size,
                                  num_layers=num_layers,
                                  bidirectional=bidirectional,
                                  batch_first=True)
            else:
                self.rnn = nn.LSTM(self.bert.config.hidden_size,
                                   hidden_size,
                                   num_layers=num_layers,
                                   bidirectional=bidirectional,
                                   batch_first=True)
        else:
            # no RNN: the classifier reads the BERT hidden states directly
            self.rnn = None
        rnn_out_dim = ((1 + bidirectional) * hidden_size if num_layers > 0
                       else self.bert.config.hidden_size)
        self.classifier = nn.Linear(rnn_out_dim, num_labels)
        self.dropout = nn.Dropout(dropout_prob)
        self.use_crf = use_crf
        if self.use_crf:
            self.crf = CRF(num_labels, batch_first=True)

    def forward(self,
                input_ids,
                attn_mask,
                crf_attn_mask,
                tags=None,
                class_weights=None):
        bert_output = self.bert(input_ids, attn_mask)
        bert_output = bert_output.last_hidden_state
        bert_output = self.dropout(bert_output)

        if self.rnn is not None:
            rnn_output, _ = self.rnn(bert_output)
        else:
            rnn_output = bert_output

        logits = self.classifier(rnn_output)

        if self.use_crf:
            pred = self.crf.decode(logits, crf_attn_mask)
        else:
            detached_logits = logits.detach().cpu().numpy()
            pred = [
                list(sentence_pred)
                for sentence_pred in np.argmax(detached_logits, axis=2)
            ]

        if tags is not None:
            if self.use_crf:
                loss = -self.crf(
                    logits, tags, mask=crf_attn_mask, reduction="mean")
            else:
                num_labels = logits.shape[-1]
                if class_weights is not None:
                    loss_fct = nn.CrossEntropyLoss(weight=class_weights)
                else:
                    loss_fct = nn.CrossEntropyLoss()
                active_loss = attn_mask.view(-1) == 1
                active_logits = logits.view(-1, num_labels)
                active_labels = torch.where(
                    active_loss, tags.view(-1),
                    torch.Tensor([loss_fct.ignore_index
                                  ]).type_as(tags)).long()
                loss = loss_fct(active_logits, active_labels)
            return loss, pred
        else:
            return pred
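A quick smoke test of the class above might look like the following; this is a minimal sketch that assumes torch, torchcrf and transformers are imported as above, and the checkpoint name, label count and tensor shapes are placeholders rather than part of the original code.

# Hypothetical smoke test: tiny batch, random ids, all-ones masks.
model = opinionBERT(bert_name="bert-base-uncased", num_labels=5, num_layers=1,
                    hidden_size=128, dropout_prob=0.1, rnn_type="lstm",
                    bidirectional=True, use_crf=True, freeze_bert=True)
input_ids = torch.randint(0, model.bert.config.vocab_size, (2, 16))
attn_mask = torch.ones(2, 16, dtype=torch.long)
crf_attn_mask = torch.ones(2, 16, dtype=torch.bool)  # torchcrf expects a bool/uint8 mask
tags = torch.randint(0, 5, (2, 16))
loss, pred = model(input_ids, attn_mask, crf_attn_mask, tags=tags)
loss.backward()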
Example #2
    def __init__(self, config):
        super().__init__()

        self.birnn = BiRNN(config)
        # self.transitions = nn.Parameter(torch.randn(config.num_classes, config.num_classes))  # transition matrix, randomly initialized
        self.crf = CRF(config.num_classes, batch_first=True)
Example #3
                     hidden_layers,
                     dropout,
                     output_layers,
                     lemma2synsets,
                     synset2id,
                     known_pos,
                     known_entity_tags,
                     use_flair=use_flair,
                     combine_WN_FN=combine_WN_FN)
    model.to(device)
    loss_func_embed = torch.nn.MSELoss()
    if crf_layer is True:
        if "classify_wsd" in output_layers:
            loss_func_classify = torch.nn.CrossEntropyLoss(ignore_index=-100)
        if "pos_tagger" in output_layers:
            loss_func_pos = CRF(len(known_pos), batch_first=True)
        if "ner" in output_layers:
            loss_func_ner = CRF(len(known_entity_tags), batch_first=True)
    else:
        loss_func_classify = torch.nn.CrossEntropyLoss(ignore_index=-100)
        loss_func_pos = torch.nn.CrossEntropyLoss()
        loss_func_ner = torch.nn.CrossEntropyLoss()
    # loss_func_classify = torch.nn.BCEWithLogitsLoss()
    optimizer = torch.optim.Adam(model.parameters())
    # optimizer = torch.optim.SGD(model.parameters(), lr=learning_rate)

    # Eval loop
    if args.mode == "evaluate":
        model.load_state_dict(torch.load(args.save_path))
        model.eval()
        test_accuracy_embed, test_accuracy_classify, log = eval_loop(
Example #4
class CRF_Model(nn.Module):
    def __init__(self, hparams):
        super(CRF_Model, self).__init__()
        self._device = 'cuda' if torch.cuda.is_available() else 'cpu'
        self.name = hparams.model_name
        self.word_embedding = nn.Embedding(
            hparams.vocab_size, hparams.embedding_dim)
        if hparams.embeddings is not None:
            print("initializing embeddings from pretrained")
            self.word_embedding.weight.data.copy_(hparams.embeddings)

        self.lstm = nn.LSTM(hparams.embedding_dim, hparams.hidden_dim,
                            bidirectional=hparams.bidirectional,
                            num_layers=hparams.num_layers,
                            dropout=hparams.dropout if hparams.num_layers > 1 else 0,
                            batch_first=True)

        lstm_output_dim = hparams.hidden_dim if hparams.bidirectional is False else hparams.hidden_dim * 2
        self.dropout = nn.Dropout(hparams.dropout)
        self.classifier = nn.Linear(lstm_output_dim, hparams.num_classes)
        self.crf = CRF(hparams.num_classes, batch_first=True)

    def forward(self, x):
        # x: [Samples_Num, Seq_Len]
        embeddings = self.word_embedding(x)
        embeddings = self.dropout(embeddings)
        # embeddings: [Samples_Num, Seq_Len, Embedding_Dim]
        o, _ = self.lstm(embeddings)
        # o: [Samples_Num, Seq_Len, Hidden_Dim * num_directions]
        o = self.dropout(o)
        logits = self.classifier(o)
        # logits: [Samples_Num, Seq_Len, Tags_Num]
        return logits

    def log_probs(self, x, tags, mask=None):
        emissions = self(x)
        return self.crf(emissions, tags, mask=mask)

    def predict(self, x):
        emissions = self(x)
        return self.crf.decode(emissions)

    def predict_new(self, x, mask=None):
        emissions = self(x)
        return self.crf.decode(emissions, mask=mask)

    def save_checkpoint(self, model_path):
        """
        Saves the model checkpoint
        Args:
            model_path:

        Returns:

        """
        torch.save(self, model_path)
        model_checkpoint = model_path.replace('.pt', '.pth')
        torch.save(self.state_dict(), model_checkpoint)

    def load_model(self, path):
        """
        Loads the model from a given path, loads it to the available device whether its CUDA or CPU
        Args:
            path:

        Returns:

        """
        state_dict = torch.load(path) if self._device == 'cuda' else torch.load(path,
                                                                                map_location=torch.device(self._device))
        self.load_state_dict(state_dict)

    def encode_tokens(self, tokens, word2idx):
        """
        Helper method during prediction
        Encodes the tokens passed during prediction time, fetches word idx from word2idx
        Args:
            tokens:
            word2idx:

        Returns:

        """
        data = []
        for sentence in tokens:
            paragraph = []
            for i in sentence:
                paragraph.append(word2idx.get(i, 1))
            paragraph = torch.LongTensor(paragraph).to(self._device)
            data.append(paragraph)
        return pad_sequence(data, batch_first=True, padding_value=0)
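A hypothetical training/prediction sketch for CRF_Model above; the hparams values and tensor sizes are invented for illustration, and the class plus its imports (torch, torch.nn, torchcrf's CRF, pad_sequence) are assumed to be in scope.

from types import SimpleNamespace

hparams = SimpleNamespace(model_name="toy-crf-tagger", vocab_size=100,
                          embedding_dim=16, embeddings=None, hidden_dim=32,
                          bidirectional=True, num_layers=1, dropout=0.1,
                          num_classes=5)
model = CRF_Model(hparams)
x = torch.randint(1, 100, (2, 7))    # [batch, seq_len]; 0 is reserved for padding
tags = torch.randint(0, 5, (2, 7))   # gold tag ids
loss = -model.log_probs(x, tags)     # the CRF returns a log-likelihood, so negate it for a loss
loss.backward()
predictions = model.predict(x)       # list of best tag sequences (Viterbi decoding)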
Example #5
def make_crf(num_tags=5):
    return CRF(num_tags)
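The factory above returns a CRF in torchcrf's default time-first layout. A minimal sketch of how such an instance is typically scored and decoded, assuming torchcrf's CRF is imported for the factory (the shapes are illustrative):

import torch

crf = make_crf(num_tags=5)                     # batch_first defaults to False
emissions = torch.randn(3, 2, 5)               # (seq_len, batch_size, num_tags)
tags = torch.randint(0, 5, (3, 2))             # (seq_len, batch_size)
mask = torch.ones(3, 2, dtype=torch.bool)      # all timesteps valid
nll = -crf(emissions, tags, mask=mask)         # negative log-likelihood of the tag sequences
best_paths = crf.decode(emissions, mask=mask)  # one best tag list per sequence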
Example #6
class RobertaLSTMCRF(RobertaForTokenClassification):
    def __init__(self, config, lstm_hidden_size, lstm_layers):
        super().__init__(config)
        self.lstm = torch.nn.LSTM(
            input_size=config.hidden_size,
            hidden_size=lstm_hidden_size,
            num_layers=lstm_layers,
            dropout=0.2,
            batch_first=True,
            bidirectional=True,
        )
        self.crf = CRF(config.num_labels, batch_first=True)

        del self.classifier
        self.classifier = torch.nn.Linear(2 * lstm_hidden_size,
                                          config.num_labels)

    def forward(
        self,
        input_ids,
        attention_mask=None,
        token_type_ids=None,
        labels=None,
        prediction_mask=None,
    ):

        outputs = self.roberta(
            input_ids,
            attention_mask,
            token_type_ids,
            output_hidden_states=True,
            return_dict=False,
        )
        # seq_output, all_hidden_states, all_self_attentions, all_cross_attentions

        sequence_output = outputs[
            0]  # outputs[1] is pooled output which is none.

        sequence_output = self.dropout(sequence_output)

        lstm_out, *_ = self.lstm(sequence_output)
        sequence_output = self.dropout(lstm_out)

        logits = self.classifier(sequence_output)

        ## CRF
        mask = prediction_mask
        mask = mask[:, :logits.size(1)].contiguous()

        # print(logits)

        if labels is not None:
            labels = labels[:, :logits.size(1)].contiguous()
            loss = -self.crf(
                logits, labels, mask=mask.bool(), reduction="token_mean")

        tags = self.crf.decode(logits, mask.bool())
        # print(tags)
        if labels is not None:
            return (loss, logits, tags)
        else:
            return (logits, tags)
Example #7
 def test_full(self):
     crf = CRF(10, batch_first=True)
     assert crf.batch_first
Example #8
class ElmoLSTMCRF(BaseModel):
    def __init__(self,
                 config,
                 elmo_model,
                 embedding_path,
                 label_path,
                 pos_path,
                 emb_non_trainable=True,
                 use_crf=False,
                 use_char_cnn=False):
        super().__init__(config=config)

        self.config = config
        self.device = config['opt'].device
        self.seq_size = config['n_ctx']
        pos_emb_dim = config['pos_emb_dim']
        elmo_emb_dim = config['elmo_emb_dim']
        lstm_hidden_dim = config['lstm_hidden_dim']
        lstm_num_layers = config['lstm_num_layers']
        lstm_dropout = config['lstm_dropout']
        self.use_crf = use_crf
        self.use_char_cnn = use_char_cnn

        # elmo embedding
        self.elmo_model = elmo_model

        # glove embedding layer
        weights_matrix = super().load_embedding(embedding_path)
        vocab_dim, token_emb_dim = weights_matrix.size()
        padding_idx = config['pad_token_id']
        self.embed_token = super().create_embedding_layer(
            vocab_dim,
            token_emb_dim,
            weights_matrix=weights_matrix,
            non_trainable=emb_non_trainable,
            padding_idx=padding_idx)

        # pos embedding layer
        self.poss = super().load_dict(pos_path)
        self.pos_vocab_size = len(self.poss)
        padding_idx = config['pad_pos_id']
        self.embed_pos = super().create_embedding_layer(
            self.pos_vocab_size,
            pos_emb_dim,
            weights_matrix=None,
            non_trainable=False,
            padding_idx=padding_idx)

        emb_dim = elmo_emb_dim + token_emb_dim + pos_emb_dim
        # char embedding layer
        if self.use_char_cnn:
            self.charcnn = CharCNN(config)
            emb_dim = elmo_emb_dim + token_emb_dim + pos_emb_dim + self.charcnn.last_dim

        # BiLSTM layer
        self.lstm = nn.LSTM(input_size=emb_dim,
                            hidden_size=lstm_hidden_dim,
                            num_layers=lstm_num_layers,
                            dropout=lstm_dropout,
                            bidirectional=True,
                            batch_first=True)

        self.dropout = nn.Dropout(config['dropout'])

        # projection layer
        self.labels = super().load_dict(label_path)
        self.label_size = len(self.labels)
        self.linear = nn.Linear(lstm_hidden_dim * 2, self.label_size)

        # CRF layer
        if self.use_crf:
            self.crf = CRF(num_tags=self.label_size, batch_first=True)

    def forward(self, x):
        # x[0,1] : [batch_size, seq_size]
        # x[2]   : [batch_size, seq_size, max_characters_per_token]
        token_ids = x[0]
        pos_ids = x[1]
        char_ids = x[2]

        mask = torch.sign(torch.abs(token_ids)).to(torch.uint8).to(self.device)
        # mask : [batch_size, seq_size]
        lengths = torch.sum(mask.to(torch.long), dim=1)
        # lengths : [batch_size]

        # 1. Embedding
        elmo_embed_out = self.elmo_model(char_ids)['elmo_representations'][0]
        # elmo_embed_out  : [batch_size, seq_size, elmo_emb_dim]
        '''
        masks = mask.unsqueeze(2).to(torch.float)
        # masks : [batch_size, seq_size, 1]
        elmo_embed_out *= masks  # auto-broadcasting
        '''
        token_embed_out = self.embed_token(token_ids)
        # token_embed_out : [batch_size, seq_size, token_emb_dim]
        pos_embed_out = self.embed_pos(pos_ids)
        # pos_embed_out   : [batch_size, seq_size, pos_emb_dim]
        if self.use_char_cnn:
            char_ids = x[2]
            # char_ids : [batch_size, seq_size, char_n_ctx]
            charcnn_out = self.charcnn(char_ids)
            # charcnn_out : [batch_size, seq_size, self.charcnn.last_dim]
            embed_out = torch.cat(
                [elmo_embed_out, token_embed_out, pos_embed_out, charcnn_out],
                dim=-1)
            # embed_out : [batch_size, seq_size, emb_dim]
        else:
            embed_out = torch.cat(
                [elmo_embed_out, token_embed_out, pos_embed_out], dim=-1)
            # embed_out : [batch_size, seq_size, emb_dim]
        embed_out = self.dropout(embed_out)

        # 2. LSTM
        packed_embed_out = torch.nn.utils.rnn.pack_padded_sequence(
            embed_out, lengths, batch_first=True, enforce_sorted=False)
        lstm_out, (h_n, c_n) = self.lstm(packed_embed_out)
        lstm_out, _ = torch.nn.utils.rnn.pad_packed_sequence(
            lstm_out, batch_first=True, total_length=self.seq_size)
        # lstm_out : [batch_size, seq_size, lstm_hidden_dim*2]
        lstm_out = self.dropout(lstm_out)

        # 3. Output
        logits = self.linear(lstm_out)
        # logits : [batch_size, seq_size, label_size]
        if not self.use_crf: return logits
        prediction = self.crf.decode(logits)
        prediction = torch.as_tensor(prediction, dtype=torch.long)
        # prediction : [batch_size, seq_size]
        return logits, prediction
Example #9
    def __init__(self,
                 config,
                 elmo_model,
                 embedding_path,
                 label_path,
                 pos_path,
                 emb_non_trainable=True,
                 use_crf=False,
                 use_char_cnn=False):
        super().__init__(config=config)

        self.config = config
        self.device = config['opt'].device
        self.seq_size = config['n_ctx']
        pos_emb_dim = config['pos_emb_dim']
        elmo_emb_dim = config['elmo_emb_dim']
        lstm_hidden_dim = config['lstm_hidden_dim']
        lstm_num_layers = config['lstm_num_layers']
        lstm_dropout = config['lstm_dropout']
        self.use_crf = use_crf
        self.use_char_cnn = use_char_cnn

        # elmo embedding
        self.elmo_model = elmo_model

        # glove embedding layer
        weights_matrix = super().load_embedding(embedding_path)
        vocab_dim, token_emb_dim = weights_matrix.size()
        padding_idx = config['pad_token_id']
        self.embed_token = super().create_embedding_layer(
            vocab_dim,
            token_emb_dim,
            weights_matrix=weights_matrix,
            non_trainable=emb_non_trainable,
            padding_idx=padding_idx)

        # pos embedding layer
        self.poss = super().load_dict(pos_path)
        self.pos_vocab_size = len(self.poss)
        padding_idx = config['pad_pos_id']
        self.embed_pos = super().create_embedding_layer(
            self.pos_vocab_size,
            pos_emb_dim,
            weights_matrix=None,
            non_trainable=False,
            padding_idx=padding_idx)

        emb_dim = elmo_emb_dim + token_emb_dim + pos_emb_dim
        # char embedding layer
        if self.use_char_cnn:
            self.charcnn = CharCNN(config)
            emb_dim = elmo_emb_dim + token_emb_dim + pos_emb_dim + self.charcnn.last_dim

        # BiLSTM layer
        self.lstm = nn.LSTM(input_size=emb_dim,
                            hidden_size=lstm_hidden_dim,
                            num_layers=lstm_num_layers,
                            dropout=lstm_dropout,
                            bidirectional=True,
                            batch_first=True)

        self.dropout = nn.Dropout(config['dropout'])

        # projection layer
        self.labels = super().load_dict(label_path)
        self.label_size = len(self.labels)
        self.linear = nn.Linear(lstm_hidden_dim * 2, self.label_size)

        # CRF layer
        if self.use_crf:
            self.crf = CRF(num_tags=self.label_size, batch_first=True)
Example #10
class BertLSTMCRF(BaseModel):
    def __init__(self,
                 config,
                 bert_config,
                 bert_model,
                 bert_tokenizer,
                 label_path,
                 pos_path,
                 use_crf=False,
                 use_pos=False,
                 disable_lstm=False,
                 feature_based=False):
        super().__init__(config=config)

        self.config = config
        self.device = config['opt'].device
        self.seq_size = config['n_ctx']
        pos_emb_dim = config['pos_emb_dim']
        lstm_hidden_dim = config['lstm_hidden_dim']
        lstm_num_layers = config['lstm_num_layers']
        lstm_dropout = config['lstm_dropout']
        self.use_crf = use_crf
        self.use_pos = use_pos
        self.disable_lstm = disable_lstm

        # bert embedding layer
        self.bert_config = bert_config
        self.bert_model = bert_model
        self.bert_tokenizer = bert_tokenizer
        self.bert_feature_based = feature_based
        self.bert_hidden_size = bert_config.hidden_size
        self.bert_num_layers = bert_config.num_hidden_layers

        # DSA layer for bert_feature_based
        dsa_num_attentions = config['dsa_num_attentions']
        dsa_input_dim = self.bert_hidden_size
        dsa_dim = config['dsa_dim']
        dsa_r = config['dsa_r']
        self.dsa = DSA(config,
                       dsa_num_attentions,
                       dsa_input_dim,
                       dsa_dim,
                       dsa_r=dsa_r)
        self.layernorm_dsa = nn.LayerNorm(self.dsa.last_dim)

        bert_emb_dim = self.bert_hidden_size
        if self.bert_feature_based:
            '''
            # 1) last layer, 2) mean pooling
            bert_emb_dim = self.bert_hidden_size
            '''
            # 3) DSA pooling
            bert_emb_dim = self.dsa.last_dim

        # pos embedding layer
        self.poss = super().load_dict(pos_path)
        self.pos_vocab_size = len(self.poss)
        padding_idx = config['pad_pos_id']
        self.embed_pos = super().create_embedding_layer(
            self.pos_vocab_size,
            pos_emb_dim,
            weights_matrix=None,
            non_trainable=False,
            padding_idx=padding_idx)

        # BiLSTM layer
        if self.use_pos:
            emb_dim = bert_emb_dim + pos_emb_dim
        else:
            emb_dim = bert_emb_dim
        if not self.disable_lstm:
            self.lstm = nn.LSTM(input_size=emb_dim,
                                hidden_size=lstm_hidden_dim,
                                num_layers=lstm_num_layers,
                                dropout=lstm_dropout,
                                bidirectional=True,
                                batch_first=True)

        self.dropout = nn.Dropout(config['dropout'])

        # projection layer
        self.labels = super().load_dict(label_path)
        self.label_size = len(self.labels)
        if not self.disable_lstm:
            self.linear = nn.Linear(lstm_hidden_dim * 2, self.label_size)
        else:
            self.linear = nn.Linear(emb_dim, self.label_size)

        # CRF layer
        if self.use_crf:
            self.crf = CRF(num_tags=self.label_size, batch_first=True)

    def _compute_bert_embedding(self, x):
        if self.bert_feature_based:
            # feature-based
            with torch.no_grad():
                if self.config['emb_class'] in ['bart', 'distilbert']:
                    bert_outputs = self.bert_model(input_ids=x[0],
                                                   attention_mask=x[1])
                    # BART model output (output_hidden_states == True)
                    # [0] last decoder layer output : [batch_size, seq_size, bert_hidden_size]
                    # [1] all decoder layer hidden states
                    # [2] last encoder layer output : [seq_size, batch_size, bert_hidden_size]
                    # [3] all encoder layer hidden states
                    all_hidden_states = bert_outputs[1][0:]
                elif 'electra' in self.config['emb_class']:
                    bert_outputs = self.bert_model(input_ids=x[0],
                                                   attention_mask=x[1],
                                                   token_type_ids=x[2])
                    # electra model's output
                    # list of each layer's hidden states
                    all_hidden_states = bert_outputs
                else:
                    bert_outputs = self.bert_model(
                        input_ids=x[0],
                        attention_mask=x[1],
                        token_type_ids=None if self.config['emb_class'] in [
                            'roberta'
                        ] else x[2])  # RoBERTa doesn't use segment_ids
                    all_hidden_states = bert_outputs[2][0:]
                    # last hidden states, pooled output,   initial embedding layer, 1 ~ last layer's hidden states
                    # bert_outputs[0],    bert_outputs[1], bert_outputs[2][0],      bert_outputs[2][1:]
                '''
                # 1) last layer
                embedded = bert_outputs[0]
                # embedded : [batch_size, seq_size, bert_hidden_size]
                '''
                '''
                # 2) mean pooling
                stack = torch.stack(all_hidden_states, dim=-1)
                embedded = torch.mean(stack, dim=-1)
                # ([batch_size, seq_size, bert_hidden_size], ..., [batch_size, seq_size, bert_hidden_size])
                # -> stack(-1) -> [batch_size, seq_size, bert_hidden_size, *], ex) * == 25 for bert large
                # -> max/mean(-1) ->  [batch_size, seq_size, bert_hidden_size]
                '''
                # 3) DSA pooling
                stack = torch.stack(all_hidden_states, dim=-2)
                # stack : [batch_size, seq_size, *, bert_hidden_size]
                stack = stack.view(-1, self.bert_num_layers + 1,
                                   self.bert_hidden_size)
                # stack : [*, bert_num_layers + 1, bert_hidden_size]
                dsa_mask = torch.ones(stack.shape[0],
                                      stack.shape[1]).to(self.device)
                # dsa_mask : [*, bert_num_layers + 1]
                dsa_out = self.dsa(stack, dsa_mask)
                # dsa_out : [*, self.dsa.last_dim]
                dsa_out = self.layernorm_dsa(dsa_out)
                embedded = dsa_out.view(-1, self.seq_size, self.dsa.last_dim)
                # embedded : [batch_size, seq_size, self.dsa.last_dim]
        else:
            # fine-tuning
            # x[0], x[1], x[2] : [batch_size, seq_size]
            if self.config['emb_class'] in ['bart', 'distilbert']:
                bert_outputs = self.bert_model(input_ids=x[0],
                                               attention_mask=x[1])
                embedded = bert_outputs[0]
            else:
                bert_outputs = self.bert_model(
                    input_ids=x[0],
                    attention_mask=x[1],
                    token_type_ids=None if self.config['emb_class']
                    in ['roberta'] else x[2])  # RoBERTa doesn't use segment_ids
                embedded = bert_outputs[0]
                # embedded : [batch_size, seq_size, bert_hidden_size]
        return embedded

    def forward(self, x):
        # x[0,1,2] : [batch_size, seq_size]

        mask = x[1].to(torch.uint8).to(self.device)
        # mask == attention_mask : [batch_size, seq_size]
        lengths = torch.sum(mask.to(torch.long), dim=1)
        # lengths : [batch_size]

        # 1. Embedding
        bert_embed_out = self._compute_bert_embedding(x)
        # bert_embed_out : [batch_size, seq_size, *]
        pos_ids = x[3]
        pos_embed_out = self.embed_pos(pos_ids)
        # pos_embed_out : [batch_size, seq_size, pos_emb_dim]
        if self.use_pos:
            embed_out = torch.cat([bert_embed_out, pos_embed_out], dim=-1)
        else:
            embed_out = bert_embed_out
        # embed_out : [batch_size, seq_size, emb_dim]
        embed_out = self.dropout(embed_out)

        # 2. LSTM
        if not self.disable_lstm:
            packed_embed_out = torch.nn.utils.rnn.pack_padded_sequence(
                embed_out, lengths, batch_first=True, enforce_sorted=False)
            lstm_out, (h_n, c_n) = self.lstm(packed_embed_out)
            lstm_out, _ = torch.nn.utils.rnn.pad_packed_sequence(
                lstm_out, batch_first=True, total_length=self.seq_size)
            # lstm_out : [batch_size, seq_size, lstm_hidden_dim*2]
            lstm_out = self.dropout(lstm_out)
        else:
            lstm_out = embed_out
            # lstm_out : [batch_size, seq_size, emb_dim]

        # 3. Output
        logits = self.linear(lstm_out)
        # logits : [batch_size, seq_size, label_size]
        if not self.use_crf: return logits
        prediction = self.crf.decode(logits)
        prediction = torch.as_tensor(prediction, dtype=torch.long)
        # prediction : [batch_size, seq_size]
        return logits, prediction
Example #11
    def __init__(self,
                 config,
                 bert_config,
                 bert_model,
                 bert_tokenizer,
                 label_path,
                 pos_path,
                 use_crf=False,
                 use_pos=False,
                 disable_lstm=False,
                 feature_based=False):
        super().__init__(config=config)

        self.config = config
        self.device = config['opt'].device
        self.seq_size = config['n_ctx']
        pos_emb_dim = config['pos_emb_dim']
        lstm_hidden_dim = config['lstm_hidden_dim']
        lstm_num_layers = config['lstm_num_layers']
        lstm_dropout = config['lstm_dropout']
        self.use_crf = use_crf
        self.use_pos = use_pos
        self.disable_lstm = disable_lstm

        # bert embedding layer
        self.bert_config = bert_config
        self.bert_model = bert_model
        self.bert_tokenizer = bert_tokenizer
        self.bert_feature_based = feature_based
        self.bert_hidden_size = bert_config.hidden_size
        self.bert_num_layers = bert_config.num_hidden_layers

        # DSA layer for bert_feature_based
        dsa_num_attentions = config['dsa_num_attentions']
        dsa_input_dim = self.bert_hidden_size
        dsa_dim = config['dsa_dim']
        dsa_r = config['dsa_r']
        self.dsa = DSA(config,
                       dsa_num_attentions,
                       dsa_input_dim,
                       dsa_dim,
                       dsa_r=dsa_r)
        self.layernorm_dsa = nn.LayerNorm(self.dsa.last_dim)

        bert_emb_dim = self.bert_hidden_size
        if self.bert_feature_based:
            '''
            # 1) last layer, 2) mean pooling
            bert_emb_dim = self.bert_hidden_size
            '''
            # 3) DSA pooling
            bert_emb_dim = self.dsa.last_dim

        # pos embedding layer
        self.poss = super().load_dict(pos_path)
        self.pos_vocab_size = len(self.poss)
        padding_idx = config['pad_pos_id']
        self.embed_pos = super().create_embedding_layer(
            self.pos_vocab_size,
            pos_emb_dim,
            weights_matrix=None,
            non_trainable=False,
            padding_idx=padding_idx)

        # BiLSTM layer
        if self.use_pos:
            emb_dim = bert_emb_dim + pos_emb_dim
        else:
            emb_dim = bert_emb_dim
        if not self.disable_lstm:
            self.lstm = nn.LSTM(input_size=emb_dim,
                                hidden_size=lstm_hidden_dim,
                                num_layers=lstm_num_layers,
                                dropout=lstm_dropout,
                                bidirectional=True,
                                batch_first=True)

        self.dropout = nn.Dropout(config['dropout'])

        # projection layer
        self.labels = super().load_dict(label_path)
        self.label_size = len(self.labels)
        if not self.disable_lstm:
            self.linear = nn.Linear(lstm_hidden_dim * 2, self.label_size)
        else:
            self.linear = nn.Linear(emb_dim, self.label_size)

        # CRF layer
        if self.use_crf:
            self.crf = CRF(num_tags=self.label_size, batch_first=True)
Example #12
    def __init__(self,
                 config,
                 embedding_path,
                 label_path,
                 pos_path,
                 emb_non_trainable=True,
                 use_crf=False,
                 use_char_cnn=False):
        super().__init__(config=config)

        self.config = config
        self.device = config['opt'].device
        self.seq_size = config['n_ctx']
        pos_emb_dim = config['pos_emb_dim']
        self.use_crf = use_crf
        self.use_char_cnn = use_char_cnn

        # glove embedding layer
        weights_matrix = super().load_embedding(embedding_path)
        vocab_dim, token_emb_dim = weights_matrix.size()
        padding_idx = config['pad_token_id']
        self.embed_token = super().create_embedding_layer(
            vocab_dim,
            token_emb_dim,
            weights_matrix=weights_matrix,
            non_trainable=emb_non_trainable,
            padding_idx=padding_idx)

        # pos embedding layer
        self.poss = super().load_dict(pos_path)
        self.pos_vocab_size = len(self.poss)
        padding_idx = config['pad_pos_id']
        self.embed_pos = super().create_embedding_layer(
            self.pos_vocab_size,
            pos_emb_dim,
            weights_matrix=None,
            non_trainable=False,
            padding_idx=padding_idx)

        emb_dim = token_emb_dim + pos_emb_dim
        # char embedding layer
        if self.use_char_cnn:
            self.charcnn = CharCNN(config)
            emb_dim = token_emb_dim + pos_emb_dim + self.charcnn.last_dim

        # Densenet layer
        densenet_kernels = config['densenet_kernels']
        first_num_filters = config['densenet_first_num_filters']
        num_filters = config['densenet_num_filters']
        last_num_filters = config['densenet_last_num_filters']
        self.densenet = DenseNet(densenet_kernels,
                                 emb_dim,
                                 first_num_filters,
                                 num_filters,
                                 last_num_filters,
                                 activation=F.relu)
        self.layernorm_densenet = nn.LayerNorm(self.densenet.last_dim)

        self.dropout = nn.Dropout(config['dropout'])

        # projection layer
        self.labels = super().load_dict(label_path)
        self.label_size = len(self.labels)
        self.linear = nn.Linear(last_num_filters, self.label_size)

        # CRF layer
        if self.use_crf:
            self.crf = CRF(num_tags=self.label_size, batch_first=True)
Example #13
class GloveDensenetCRF(BaseModel):
    def __init__(self,
                 config,
                 embedding_path,
                 label_path,
                 pos_path,
                 emb_non_trainable=True,
                 use_crf=False,
                 use_char_cnn=False):
        super().__init__(config=config)

        self.config = config
        self.device = config['opt'].device
        self.seq_size = config['n_ctx']
        pos_emb_dim = config['pos_emb_dim']
        self.use_crf = use_crf
        self.use_char_cnn = use_char_cnn

        # glove embedding layer
        weights_matrix = super().load_embedding(embedding_path)
        vocab_dim, token_emb_dim = weights_matrix.size()
        padding_idx = config['pad_token_id']
        self.embed_token = super().create_embedding_layer(
            vocab_dim,
            token_emb_dim,
            weights_matrix=weights_matrix,
            non_trainable=emb_non_trainable,
            padding_idx=padding_idx)

        # pos embedding layer
        self.poss = super().load_dict(pos_path)
        self.pos_vocab_size = len(self.poss)
        padding_idx = config['pad_pos_id']
        self.embed_pos = super().create_embedding_layer(
            self.pos_vocab_size,
            pos_emb_dim,
            weights_matrix=None,
            non_trainable=False,
            padding_idx=padding_idx)

        emb_dim = token_emb_dim + pos_emb_dim
        # char embedding layer
        if self.use_char_cnn:
            self.charcnn = CharCNN(config)
            emb_dim = token_emb_dim + pos_emb_dim + self.charcnn.last_dim

        # Densenet layer
        densenet_kernels = config['densenet_kernels']
        first_num_filters = config['densenet_first_num_filters']
        num_filters = config['densenet_num_filters']
        last_num_filters = config['densenet_last_num_filters']
        self.densenet = DenseNet(densenet_kernels,
                                 emb_dim,
                                 first_num_filters,
                                 num_filters,
                                 last_num_filters,
                                 activation=F.relu)
        self.layernorm_densenet = nn.LayerNorm(self.densenet.last_dim)

        self.dropout = nn.Dropout(config['dropout'])

        # projection layer
        self.labels = super().load_dict(label_path)
        self.label_size = len(self.labels)
        self.linear = nn.Linear(last_num_filters, self.label_size)

        # CRF layer
        if self.use_crf:
            self.crf = CRF(num_tags=self.label_size, batch_first=True)

    def forward(self, x):
        # x[0, 1] : [batch_size, seq_size]
        # x[2]    : [batch_size, seq_size, char_n_ctx]
        token_ids = x[0]
        pos_ids = x[1]

        mask = torch.sign(torch.abs(token_ids)).to(torch.uint8).to(self.device)
        # mask : [batch_size, seq_size]

        # 1. Embedding
        token_embed_out = self.embed_token(token_ids)
        # token_embed_out : [batch_size, seq_size, token_emb_dim]
        pos_embed_out = self.embed_pos(pos_ids)
        # pos_embed_out   : [batch_size, seq_size, pos_emb_dim]
        if self.use_char_cnn:
            char_ids = x[2]
            # char_ids : [batch_size, seq_size, char_n_ctx]
            charcnn_out = self.charcnn(char_ids)
            # charcnn_out : [batch_size, seq_size, self.charcnn.last_dim]
            embed_out = torch.cat(
                [token_embed_out, pos_embed_out, charcnn_out], dim=-1)
            # embed_out : [batch_size, seq_size, emb_dim]
        else:
            embed_out = torch.cat([token_embed_out, pos_embed_out], dim=-1)
            # embed_out : [batch_size, seq_size, emb_dim]
        embed_out = self.dropout(embed_out)

        # 2. DenseNet
        densenet_out = self.densenet(embed_out, mask)
        # densenet_out : [batch_size, seq_size, last_num_filters]
        densenet_out = self.layernorm_densenet(densenet_out)
        densenet_out = self.dropout(densenet_out)

        # 3. Output
        logits = self.linear(densenet_out)
        # logits : [batch_size, seq_size, label_size]
        if not self.use_crf: return logits
        prediction = self.crf.decode(logits)
        prediction = torch.as_tensor(prediction, dtype=torch.long)
        # prediction : [batch_size, seq_size]
        return logits, prediction
Example #14
 def __init__(self, scorer: EmissionScorer, padding_idx: int = 0) -> None:
     super(CRFTagger, self).__init__()
     self.scorer = scorer
     self.padding_idx = padding_idx
     self.crf = CRF(scorer.num_tags)
     self.reset_parameters()
Example #15
 ######## load the dev set ###########
 with open(dev_pkl, "rb") as f:
     dev_features, word_index, char_index = pkl.load(f)
 dev_sents = read_data(dev_path)
 print('finished loading the dev set')
 dev_count = len(dev_features)
 ######### load the initial word-embedding matrix ###############
 with open(word_pkl, 'rb') as f:
     word_matrix = pkl.load(f)
 print('finished initializing the word embeddings')
 ######### load the model ###############
 lstm = cnn_lstm_no_pad_model(word_matrix, word_dim, len(char_index),
                              char_dim, feature_maps, kernels, hidden_dim,
                              tagset_size)
 lstm.cuda(device=0)
 crf = CRF(tagset_size, batch_first=True)
 crf.cuda(device=0)
 parameters = []
 for param in lstm.parameters():
     parameters.append(param)
 for param in crf.parameters():
     parameters.append(param)
 optimizer = optim.RMSprop(parameters, lr=learn_rate)
 # optimizer=optim.Adam(parameters, lr=learn_rate)
 # optimizer=optim.Adagrad(parameters, lr=learn_rate)
 # optimizer=optim.SGD(parameters, lr=learn_rate)
 ######## training and testing ##############
 distant_index = list(range(distant_count))
 dev_index = list(range(dev_count))
 max_f_dev = 0.0
 for epoch in range(epoch_num):
Example #16
class BertLstmCrf(BertModel):
    """On the outputs of Bert there is a LSTM layer.
    On top of the LSTM there is a  CRF layer.
    """
    def __init__(self, config, pad_idx, sep_idx, lstm_hidden_dim,
                 num_lstm_layers, bidirectional, num_labels):
        super(BertLstmCrf, self).__init__(config)
        self.dropout_prob = config.hidden_dropout_prob
        self.pad_idx = pad_idx
        self.sep_idx = sep_idx  # used by create_mask_for_crf
        self.lstm_hidden_dim = lstm_hidden_dim
        self.num_lstm_layers = num_lstm_layers
        self.bidirectional = bidirectional
        self.num_labels = num_labels

        self.bert = BertModel(config)

        if self.num_lstm_layers > 1:
            self.lstm = nn.LSTM(input_size=config.hidden_size,
                                hidden_size=self.lstm_hidden_dim,
                                num_layers=self.num_lstm_layers,
                                bidirectional=self.bidirectional,
                                dropout=self.dropout_prob,
                                batch_first=True)
        else:
            self.lstm = nn.LSTM(input_size=config.hidden_size,
                                hidden_size=self.lstm_hidden_dim,
                                num_layers=self.num_lstm_layers,
                                bidirectional=self.bidirectional,
                                batch_first=True)
        if self.bidirectional is True:
            self.linear = nn.Linear(self.lstm_hidden_dim * 2, self.num_labels)
        else:
            self.linear = nn.Linear(self.lstm_hidden_dim, self.num_labels)

        self.crf_layer = CRF(self.num_labels, batch_first=True)
        self.dropout_layer = nn.Dropout(self.dropout_prob)

        self.init_weights()

    def create_mask_for_crf(self, inp):
        """Creates a mask for the feesing to crf layer.

        Args:
            inp (TYPE): input given to bert layer
        """
        mask = (inp != self.pad_idx) & (inp != self.sep_idx)
        # mask = [batch_size, seq_len]

        return mask

    def forward(self,
                input_ids,
                attention_mask=None,
                token_type_ids=None,
                position_ids=None,
                head_mask=None,
                labels=None):
        outputs = self.bert(input_ids=input_ids,
                            attention_mask=attention_mask,
                            token_type_ids=token_type_ids,
                            position_ids=position_ids,
                            head_mask=head_mask)
        sequence_output = outputs[0]

        lstm_out, (hidden, cell) = self.lstm(sequence_output)
        logits = self.linear(self.dropout_layer(lstm_out))

        # removing cls token
        logits = logits[:, 1:, :]
        if labels is not None:
            labels = labels[:, 1:]
        input_ids = input_ids[:, 1:]

        # creating mask for crf
        mask = self.create_mask_for_crf(input_ids)

        # crf part
        if labels is not None:
            loss = -self.crf_layer(logits, labels, mask=mask)
        else:
            loss = None

        out = self.crf_layer.decode(logits)
        out = torch.tensor(out, dtype=torch.long, device=self.device)
        # out = [batch_size, seq_len]
        return out, labels, loss
Example #17
                                      w_tag_pad=w_padding,
                                      t_tag_pad=len(id2label)),
                            model,
                            SimpleLossCompute(criterion, optimizer, scheduler),
                            train=False,
                            id2label=id2label)
        print('Loss:', loss)
        testResult.append(f)
    valBest = max(valResult)
    print('ValBest epoch:',
          [i for i, j in enumerate(valResult) if j == valBest])
    testBest = max(testResult)
    print('TestBest epoch:',
          [i for i, j in enumerate(testResult) if j == testBest])


trainSents = preProcess(readData('dps/swbd/train'))
valSents = preProcess(readData('dps/swbd/val'))
testSents = preProcess(readData('dps/swbd/test'))
label2id, id2label = build_vocab(trainSents)
print(id2label)
tokenizer = BertTokenizer.from_pretrained('bert-base-cased',
                                          do_lower_case=False)
trainData = idData(tokenizer, trainSents, label2id)
valData = idData(tokenizer, valSents, label2id)
testData = idData(tokenizer, testSents, label2id)
encoder = Encoder(len(id2label)).to(device)
criterion = CRF(len(id2label), batch_first=True).to(device)

run(EPOCH, encoder, BATCH_SIZE, trainData, valData, testData, id2label,
    tokenizer._convert_token_to_id('[PAD]'), criterion)
Example #18
class BertCrfForNER(BertModel):
    """
    This class inherits functionality from huggingface BertModel.
    It applies a crf layer on the Bert outputs.
    """
    def __init__(self, config, pad_idx, sep_idx, num_labels):
        """Initialization

        Args:
            config (TYPE): model config file (similar to bert_config.json)
            num_labels : total number of labels in the BIO format
            pad_idx (TYPE): pad token index of the tokenizer
            sep_idx (TYPE): sep token index of the tokenizer
        """
        super(BertCrfForNER, self).__init__(config)
        self.num_labels = num_labels
        self.pad_idx = pad_idx
        self.sep_idx = sep_idx

        self.bert = BertModel(config)
        self.dropout = nn.Dropout(config.hidden_dropout_prob)
        self.crf_layer = CRF(self.num_labels, batch_first=True)
        self.linear = nn.Linear(config.hidden_size, self.num_labels)
        self.init_weights()

    def create_mask_for_crf(self, inp):
        """Creates a mask for the feeding to crf layer.
           Mask <PAD> and <SEP> token positions
        Args:
            inp (TYPE): input given to bert layer
        """

        mask = (inp != self.pad_idx) & (inp != self.sep_idx)
        # mask = [batch_size, seq_len]

        return mask

    def forward(self,
                input_ids,
                attention_mask=None,
                token_type_ids=None,
                position_ids=None,
                head_mask=None,
                labels=None):
        """Forwar propagate.

        Args:
            input_ids (TYPE): bert input ids
            attention_mask (None, optional): attention mask for bert
            token_type_ids (None, optional): token type ids for bert
            position_ids (None, optional): position ids for bert
            head_mask (None, optional): head mask for bert
            labels (None, optional): labels required while training crf
        """
        # getting outputs from Bert
        outputs = self.bert(input_ids,
                            attention_mask=attention_mask,
                            token_type_ids=token_type_ids,
                            position_ids=position_ids,
                            head_mask=head_mask)
        # taking tokens embeddings from the output
        sequence_output = outputs[0]
        # sequence_output = [batch_size, seq_len, hidden_size]

        logits = self.linear(sequence_output)
        # logits = [batch_size, seq_len, num_labels]

        # removing cls token
        logits = logits[:, 1:, :]
        if labels is not None:
            labels = labels[:,
                            1:]  # check whether labels include the cls token too or not
        input_ids = input_ids[:, 1:]

        mask = self.create_mask_for_crf(input_ids)
        if labels is not None:
            loss = -self.crf_layer(logits, labels, mask=mask)
        else:
            loss = None
        # this is the crf loss

        out = self.crf_layer.decode(logits)
        out = torch.tensor(out, dtype=torch.long, device=self.device)

        # out = [batch_size, seq_length]
        return out, labels, loss
Example #19
def make_crf(num_tags=5, batch_first=False):
    return CRF(num_tags, batch_first=batch_first)
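With batch_first=True, the same calls take batch-major tensors; a small sketch with a padding mask, using made-up values and again assuming torchcrf's CRF is imported for the factory above:

import torch

crf = make_crf(num_tags=5, batch_first=True)
emissions = torch.randn(2, 4, 5)                       # (batch_size, seq_len, num_tags)
tags = torch.randint(0, 5, (2, 4))
mask = torch.tensor([[1, 1, 1, 1],
                     [1, 1, 1, 0]], dtype=torch.bool)  # second sequence has one padded step
loss = -crf(emissions, tags, mask=mask, reduction='mean')
paths = crf.decode(emissions, mask=mask)               # decoded lengths follow the mask: 4 and 3 tags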
Example #20
def transformation():  # Do an inference on a single batch of data
    data = None

    # 1) INPUT: convert Korean text input to NER code array
    if flask.request.content_type == 'text/plain':
        '''CHECK file locations'''
        model_config = Config(json_path="config.json")
        tok_path = "./tokenizer_78b3253a26.model"
        ptr_tokenizer = SentencepieceTokenizer(tok_path)

        with open("vocab.pkl", 'rb') as f:
            vocab = pickle.load(f)

        tokenizer = Tokenizer(vocab=vocab,
                              split_fn=ptr_tokenizer,
                              pad_fn=keras_pad_fn,
                              maxlen=model_config.maxlen)

        with open("ner_to_index.json", 'rb') as f:
            ner_to_index = json.load(f)
            index_to_ner = {v: k for k, v in ner_to_index.items()}

        decoder_from_res = DecoderFromNamedEntitySequence(
            tokenizer=tokenizer, index_to_ner=index_to_ner)
        '''
            Assuming request.data is a string: name of txt file
            > NER_OY_data.txt as an example
            > currently under /opt/program (product-tags)

            HERE:?
        '''
        f = flask.request.data.decode("utf-8")
        lines = f.splitlines(True)
        index = 0

        with open("NER_OY_result.txt", 'w', encoding='utf-8-sig') as w:
            for i in range(len(lines)):
                input_text = ''
                if i % 4 == 1:
                    input_text = lines[i][3:]
                    addInfo = lines[i + 1][3:]
                if input_text == '':
                    continue

                index += 1
                # print("\n## " + str(index) + "\n")

                list_of_input_ids = tokenizer.list_of_string_to_list_of_cls_sep_token_ids(
                    [input_text])
                x_input = torch.tensor(list_of_input_ids).long()
                # print(list_of_input_ids)
                # print(x_input)

                data = {"instances": list_of_input_ids}
                predictions = ScoringService.predict(data)

                # 2) OUTPUT: convert NER code to Korean text (FILE)
                emission = torch.tensor(predictions['predictions'])
                num_classes = len(ner_to_index)
                crf = CRF(num_tags=num_classes, batch_first=True)
                list_of_pred_ids = crf.decode(emission)

                input_token, list_of_ner_word, decoding_ner_sentence = decoder_from_res(
                    list_of_input_ids=list_of_input_ids,
                    list_of_pred_ids=list_of_pred_ids,
                    unkTokenList=False)
                unkTokenList = makeUNKTokenList(input_text, input_token)
                input_token, list_of_ner_word, decoding_ner_sentence = decoder_from_res(
                    list_of_input_ids=list_of_input_ids,
                    list_of_pred_ids=list_of_pred_ids,
                    unkTokenList=unkTokenList)

                w.write('## ' + str(index) + '\n')
                w.write(addInfo)
                w.write(str(list_of_ner_word) + '\n')
                w.write(str(decoding_ner_sentence[6:-5]) + '\n')
            '''RETURN a file: NER_OY_result.txt'''
        return flask.Response(response=open("NER_OY_result.txt", 'r'),
                              status=200,
                              mimetype='text/plain')
    else:
        return flask.Response(
            response='This predictor only supports TEXT data',
            status=415,
            mimetype='text/plain')
Example #21
    def __init__(self, args):
        super(Aspect_CS_GAT_BERT, self).__init__()
        self.args = args
        self.wembeddings = args.bert_model

        # POS-Tagging Embedding Layer
        self.pembeddings = EmbeddingLayer(embedding_size=(232, 232),
                                          dropout=args.posemb_dp,
                                          device=args.device)

        # Residual POS-Tagging Embedding
        self.res_posemb = EmbeddingLayer(
            embedding_size=(2 * args.lstm_hidden_size,
                            2 * args.lstm_hidden_size),
            dropout=None,
            device=args.device)

        # Bi-LSTM Encoder
        self.bilstm = DynamicLSTM(input_size=1000,
                                  hidden_size=args.lstm_hidden_size,
                                  num_layers=args.num_layers,
                                  dropout=args.bilstm_dp,
                                  bidirectional=True,
                                  device=args.device)

        # GCN
        self.gcns = nn.ModuleList()
        for i in range(args.gcn_num_layers):
            gcn = GraphConvolution(
                in_features=2 * args.lstm_hidden_size,
                out_features=2 * args.lstm_hidden_size,
                edge_types=args.edge_types_num,
                dropout=args.gcn_dp if i != args.gcn_num_layers - 1 else 0,
                use_bn=args.gcn_use_bn,
                device=args.device)
            self.gcns.append(gcn)

        # Highway
        if args.highway_use:
            self.hws = nn.ModuleList()
            for i in range(args.gcn_num_layers):
                hw = HighWay(size=2 * args.lstm_hidden_size,
                             dropout_ratio=args.gcn_dp)
                self.hws.append(hw)

        self.sa_output = BottledXavierLinear(
            in_features=4 * args.lstm_hidden_size,
            out_features=args.sa_classes).to(device=args.device)

        # CRF
        self.CRF_model = CRF(4, batch_first=True)

        if args.target_method == 'BIO':
            self.dt_output = nn.Linear(4 * args.lstm_hidden_size, 4)
        else:
            self.dt_output = nn.Linear(4 * args.lstm_hidden_size, 3)

        self.loss_func_sa = FocalLoss(alpha=0.5, num_classes=4)

        self.dropout_sa = nn.Dropout(0.5)  # 0.5
        self.dropout_dt = nn.Dropout(0.35)  # 0.2 0.35
Example #22
class BERT_LSTM_CRF2(MODEL_TEMP):
    def __init__(self, config={}, show_param=False):
        '''
        :param - dict
            *param['embedding_dim']
            *param['hidden_dim']
            param['n_ent_tags']
            param['n_rel_tags']
            param['n_rels']
            param['n_words']
            *param['start_ent_idx']  int, <start> tag index for entity tag seq
            *param['end_ent_idx']   int, <end> tag index for entity tag seq
            *param['start_rel_idx']  int, <start> tag index for relation tag seq
            *param['end_rel_idx']   int, <end> tag index for relation tag seq
            param['use_cuda']
            param['dropout_prob']
            param['lstm_layer_num']
        '''
        super(BERT_LSTM_CRF2, self).__init__()
        self.config = config
        self.embedding_dim = self.config.get('embedding_dim', 768)
        self.hidden_dim = self.config.get('hidden_dim', 64)  ##TODO: 128*2
        assert self.hidden_dim % 2 == 0, 'hidden_dim for BLSTM must be even'

        self.n_tags = self.config['n_rel_tags'] - 2
        # self.n_words = self.config.get('n_words', 10000)

        self.dropout_prob = self.config.get('dropout_prob', 0)
        self.lstm_layer_num = self.config.get('lstm_layer_num', 1)

        self.use_cuda = self.config.get('use_cuda', 0)
        self.model_type = 'BERT_LSTM_CRF2'

        self.build_model()
        self.reset_parameters()
        if show_param:
            self.show_model_param()

    def show_model_param(self):
        log('='*80, 0)
        log(f'model_type: {self.model_type}', 1)
        log(f'use_cuda: {self.use_cuda}', 1)
        log(f'embedding_dim: {self.embedding_dim}', 1)
        log(f'hidden_dim: {self.hidden_dim}', 1)
        log(f'n_rel_tags: {self.n_tags}', 1)
        # log(f"crf_start_idx: {self.config['start_ent_idx']}", 1)
        # log(f"crf_end_idx: {self.config['end_ent_idx']}", 1)
        log(f'lstm_layer_num: {self.lstm_layer_num}', 1)
        log(f'dropout_prob: {self.dropout_prob}', 1)  
        log('='*80, 0)      

    def build_model(self):
        '''
        build the bert layer, lstm layer and CRF layer
        '''
        # self.word_embeds = nn.Embedding(self.n_words, self.embedding_dim)
        self.lstm = nn.LSTM(self.embedding_dim, self.hidden_dim//2, batch_first=True, num_layers=self.lstm_layer_num, dropout=self.dropout_prob, bidirectional=True)
        self.hidden2tag = nn.Linear(self.hidden_dim, self.n_tags)

        self.crf = CRF(self.n_tags, batch_first=True)
        self.bert = transformers.BertModel.from_pretrained('bert-base-chinese')

    def reset_parameters(self):        
        # I.xavier_normal_(self.word_embeds.weight.data)
        self.lstm.reset_parameters()
        # stdv = 1.0 / math.sqrt(self.hidden_dim)
        # for weight in self.lstm.parameters():
        #     I.uniform_(weight, -stdv, stdv)
        I.xavier_normal_(self.hidden2tag.weight.data)
        self.crf.reset_parameters()
        
    def _get_lstm_features(self, x, lens, use_cuda=None):
        '''
        TODO: add handling of the actual sentence lengths
        :param
            @x: indexed words, each character mapped to its vocabulary index, (batch_size, T), np.array
            @lens: the actual length of each sentence
        :return
            @lstm_feature: (batch_size, T, n_tags) -- similar to emission scores, torch.tensor
        '''
        use_cuda = self.use_cuda if use_cuda is None else use_cuda
        batch_size, T = x.shape

        words_tensor = self._to_tensor(x, use_cuda)  #(batch_size, T)
        lens = self._to_tensor(lens, use_cuda)
        att_mask = self._generate_mask(lens, max_len=T)
        embeds = self.bert(words_tensor, attention_mask=att_mask)[0]  #(batch_size, T, n_embed)
        
        ##LSTM layer
        if use_cuda:
            h_0 = torch.randn(2*self.lstm_layer_num, batch_size, self.hidden_dim//2).cuda()  #(n_layer*n_dir, N, n_hid)
            c_0 = torch.randn(2*self.lstm_layer_num, batch_size, self.hidden_dim//2).cuda()
        else:
            h_0 = torch.randn(2*self.lstm_layer_num, batch_size, self.hidden_dim//2)
            c_0 = torch.randn(2*self.lstm_layer_num, batch_size, self.hidden_dim//2)
        # c_0 = h_0.clone()
        hidden = (h_0, c_0)
        lstm_out, _hidden = self.lstm(embeds, hidden)   #(batch_size, T, n_dir*n_hid), (h, c)

        ##FC layer
        lstm_feature = self.hidden2tag(lstm_out) #(batch_size, T, n_tags)
        lstm_feature = torch.tanh(lstm_feature)
        return lstm_feature

    def _loss(self, x, y_rel, lens, use_cuda=None):
        '''
        loss function: neg_log_likelihood
        :param
            @x: indexed words, each character mapped to its vocabulary index, (batch_size, T), np.array
            @y_rel: (batch_size, T), np.array, indexed rel_with_ent sequence at the character level
            @lens: (batch_size), list, the actual length of each sentence
        :return 
            @loss: (batch_size), torch.tensor
        '''
        use_cuda = self.use_cuda if use_cuda is None else use_cuda
        T = x.shape[1]

        logits = self._get_lstm_features(x, lens)   ##(batch_size, T, n_tags)
        tensor_y_rel = self._to_tensor(y_rel, use_cuda)

        lens = self._to_tensor(lens, use_cuda)
        len_mask = self._generate_mask(lens, max_len=T)  ##(batch_size, T)

        log_likelihood_ent = self.crf(emissions=logits, tags=tensor_y_rel, mask=len_mask, reduction='mean')
        return - log_likelihood_ent

    def _output(self, x, lens, use_cuda=None):
        '''
        return the CRF decode paths
        :param
            @x: indexed words, each character mapped to an id via the vocabulary, (batch_size, T), np.array
            @lens: (batch_size), list, actual length of each sentence
        :return
            @paths: (batch_size, T), torch.tensor, best tag path for each sentence
        '''
        use_cuda = self.use_cuda if use_cuda is None else use_cuda
        T = x.shape[1]
        logits = self._get_lstm_features(x, lens, use_cuda)

        lens = self._to_tensor(lens, use_cuda)
        len_mask = self._generate_mask(lens, max_len=T)  ##(batch_size, T)
    
        # paths = self.crf.decode(logits, len_mask)
        paths = self.crf.decode(logits)
        paths = self._to_tensor(paths, use_cuda)
        return paths
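A minimal, self-contained sketch of the emission-then-CRF pattern that _loss() and _output() above reduce to: project encoder outputs to per-tag emission scores, take the negative log-likelihood for training, and Viterbi-decode for prediction. Shapes, lengths and the tag count are illustrative, not the model's real configuration.

import torch
from torchcrf import CRF

batch_size, T, n_tags = 2, 6, 5
emissions = torch.randn(batch_size, T, n_tags)            # stands in for tanh(hidden2tag(lstm_out))
tags = torch.randint(0, n_tags, (batch_size, T))          # gold tag ids
lens = torch.tensor([6, 4])                               # real sentence lengths
mask = (torch.arange(T).unsqueeze(0) < lens.unsqueeze(1)).byte()  # (batch_size, T)

crf = CRF(n_tags, batch_first=True)
loss = -crf(emissions, tags, mask=mask, reduction='mean')  # training objective, as in _loss()
paths = crf.decode(emissions, mask=mask)                   # best tag paths, as in _output()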
Beispiel #23
0
class GPT2LSTMLogRegCRF(nn.Module):
    def __init__(self, freeze_bert, tokenizer, device, bidirectional,
                 class_weights):
        super(GPT2LSTMLogRegCRF, self).__init__()
        # Instantiating the GPT-2 model object
        self.gpt2_layer = GPT2Model.from_pretrained('gpt2',
                                                    output_hidden_states=True,
                                                    output_attentions=False)

        # Freeze GPT-2 layers: if True, the GPT-2 weights are not updated
        if freeze_bert:
            for p in self.gpt2_layer.parameters():
                p.requires_grad = False

        self.tokenizer = tokenizer
        self.device = device
        self.bidirectional = bidirectional

        self.dropout = nn.Dropout(0.5)

        # lstm layer
        self.lstm_layer = nn.LSTM(input_size=768,
                                  hidden_size=512,
                                  num_layers=1,
                                  bidirectional=bidirectional,
                                  batch_first=True)

        # log reg
        if bidirectional:
            self.hidden2tag = nn.Linear(1024, clf_P_fine_num_labels)
        else:
            self.hidden2tag = nn.Linear(512, clf_P_fine_num_labels)

        # crf
        self.crf_layer = CRF(clf_P_fine_num_labels, batch_first=True)

    def forward(self, input_ids=None, attention_mask=None, labels=None):

        # GPT-2
        outputs = self.gpt2_layer(input_ids, attention_mask=attention_mask)

        # outputs[0] = last hidden state, (batch 6, tokens 512, dim 768)
        # outputs[2] = hidden states of all 13 layers, each (batch 6, tokens 512, dim 768)
        sequence_output = outputs[2]  # tuple of per-layer hidden states

        num_layer_sum = 4
        summed_last_4_layers = torch.stack(
            sequence_output[-num_layer_sum:]).mean(0)  # mean over the last 4 hidden layers

        summed_last_4_layers = self.dropout(
            summed_last_4_layers)  # newly added dropout

        # lstm with masks (same as attention masks)
        packed_input, perm_idx, seq_lengths = get_packed_padded_output(
            summed_last_4_layers, input_ids, attention_mask, self.tokenizer)
        packed_output, (ht, ct) = self.lstm_layer(packed_input)

        # Unpack and reorder the output
        output, input_sizes = pad_packed_sequence(packed_output,
                                                  batch_first=True)
        _, unperm_idx = perm_idx.sort(0)
        lstm_output = output[
            unperm_idx]  # lstm_output.shape = shorter than the padded torch.Size([6, 388, 512])
        seq_lengths_ordered = seq_lengths[unperm_idx]

        # shorten the labels as per the batchsize
        labels = labels[:, :lstm_output.shape[1]]

        # mask the unimportant tokens before log_reg
        mask = ((input_ids[:, :lstm_output.shape[1]] != 50256)
                & (labels != 100))

        # on the first time steps
        for eachIndex in range(mask.shape[0]):
            mask[eachIndex, 0] = True

        mask_expanded = mask.unsqueeze(-1).expand(lstm_output.size())
        lstm_output *= mask_expanded.float()
        labels *= mask.long()

        # log reg
        probabilities = self.hidden2tag(lstm_output)

        # CRF loss (negative log-likelihood of the gold tag sequence)
        loss = -self.crf_layer(probabilities, labels, reduction='token_mean')

        emissions_ = self.crf_layer.decode(probabilities)
        emissions = [item for sublist in emissions_
                     for item in sublist]  # flatten the nested list of decoded tags

        return loss, torch.Tensor(emissions_), labels, mask
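The masking above zeroes out GPT-2 padding (id 50256) and ignored labels (100) before the CRF call. A hedged alternative sketch that instead hands the mask to torchcrf directly; torchcrf requires the first timestep of the mask to be on, which is what the loop over mask[:, 0] above enforces. The tag count and tensor contents are illustrative.

import torch
from torchcrf import CRF

num_labels, pad_id, ignore_idx = 4, 50256, 100
input_ids = torch.tensor([[11, 22, 33, pad_id], [44, 55, pad_id, pad_id]])
labels = torch.tensor([[1, 2, 0, ignore_idx], [3, 0, ignore_idx, ignore_idx]])

mask = (input_ids != pad_id) & (labels != ignore_idx)
mask[:, 0] = True                      # torchcrf expects the first timestep to be unmasked
labels = labels * mask.long()          # masked positions must still hold valid tag ids

emissions = torch.randn(2, 4, num_labels)
crf = CRF(num_labels, batch_first=True)
loss = -crf(emissions, labels, mask=mask.byte(), reduction='token_mean')
decoded = crf.decode(emissions, mask=mask.byte())   # per-sentence paths, padding dropped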
Beispiel #24
0
    def __init__(self, config: RobertaConfig, args: Any,
                 intent_label_dict: Dict[str, List[str]],
                 slot_label_dict: Dict[str, List[str]],
                 pos_label_lst: List[str], tasks: List[str]) -> None:
        super(JointRoberta, self).__init__(config)
        self.args = args

        self.tasks = tasks
        self.intent_label_dict = intent_label_dict
        self.slot_label_dict = slot_label_dict
        self.pos_label_lst = pos_label_lst

        self.num_intent_labels_dict = {
            k: len(v)
            for (k, v) in intent_label_dict.items()
        }
        self.num_slot_labels_dict = {
            k: len(v)
            for (k, v) in slot_label_dict.items()
        }

        self.intent_classifiers = {}
        self.slot_classifiers = {}
        self.crfs = {}

        self.num_pos_labels = len(pos_label_lst)
        self.num_np_labels = 1  # len(np_label_lst)
        self.num_vp_labels = 1  # len(vp_label_lst)
        self.num_entity_labels = 1  # len(entity_label_lst)
        self.num_acronym_labels = 1  # len(acronym_label_lst)

        self.roberta = RobertaModel(config=config)  # Load pretrained bert

        hidden_size = config.hidden_size

        # TODO pos_emb = 50 should be an input variable
        if args.use_pos:
            pos_dim = 50
            hidden_size += pos_dim
            self.pos_emb = (nn.Embedding(self.num_pos_labels, pos_dim)
                            if pos_dim > 0 else None)
        if args.use_np:
            hidden_size += self.num_np_labels
        if args.use_vp:
            hidden_size += self.num_vp_labels
        if args.use_entity:
            hidden_size += self.num_entity_labels
        if args.use_acronym:
            hidden_size += self.num_acronym_labels

        self.custom_pooler = Pooler(hidden_size=hidden_size)
        for pred_type in self.tasks:
            self.intent_classifiers[pred_type] = IntentClassifier(
                hidden_size, self.num_intent_labels_dict[pred_type],
                args.dropout_rate)

        for pred_type in self.tasks:
            self.slot_classifiers[pred_type] = SlotClassifier(
                hidden_size, self.num_slot_labels_dict[pred_type],
                args.dropout_rate)

            if args.use_crf:
                self.crfs[pred_type] = CRF(
                    num_tags=self.num_slot_labels_dict[pred_type],
                    batch_first=True)

        self.intent_classifiers = nn.ModuleDict(self.intent_classifiers)
        self.slot_classifiers = nn.ModuleDict(self.slot_classifiers)
        self.crfs = nn.ModuleDict(self.crfs)
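The final nn.ModuleDict wrapping above is what makes the per-task classifiers and CRFs real submodules: modules kept in a plain Python dict are not registered, so their parameters would be missing from .parameters(), from the optimizer and from .to(device). A tiny sketch with made-up task names:

import torch.nn as nn
from torchcrf import CRF

class TinyMultiTask(nn.Module):
    def __init__(self, tasks, num_tags):
        super().__init__()
        crfs = {task: CRF(num_tags, batch_first=True) for task in tasks}
        self.crfs = nn.ModuleDict(crfs)   # registers every per-task CRF as a submodule

model = TinyMultiTask(['taskA', 'taskB'], num_tags=3)
print(sum(p.numel() for p in model.parameters()))   # non-zero: the CRF parameters are tracked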
Beispiel #25
0
    def test_nonpositive_num_tags(self):
        with pytest.raises(ValueError) as excinfo:
            CRF(0)
        assert 'invalid number of tags: 0' in str(excinfo.value)
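The same constructor-time check can be reproduced without pytest: torchcrf rejects a non-positive tag count when the CRF is built.

from torchcrf import CRF

try:
    CRF(0)
except ValueError as err:
    print(err)   # invalid number of tags: 0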
Beispiel #26
0
class CRFEvaluateWorkflow(object):
    def __init__(self):
        self.__MODE = "CRF_EVALUATE"
        self.__METRIC = "loss_avg"

        # Validation parameters
        self.batch_size = None
        self.num_workers = None
        self.seed = None
        self.model_config = None
        self.ckpt_dir = None

        # Data
        self.dataset = None
        self.prediction_dir = None
        self.dtype = None
        self.class_weight = None

        # Save
        self.output_dir = None
        self.experiment_name = None
        self.result_dir = None
        self.tmp_dir = None

        ######## Configs ########
        self.args = None

    def run(self):
        # Set up logger and print out configurations
        self.model_dir = init_model_dir(self.output_dir, self.experiment_name)
        self.logger = set_logger(
            self.model_dir, self.experiment_name, self.__MODE, self.dtype
        )
        display_args(self.args, self.logger)

        # Set up GPUs
        if not torch.cuda.is_available():
            raise Exception("No GPU found.")
        torch.manual_seed(self.seed)
        torch.cuda.manual_seed_all(self.seed)
        self.device = torch.device("cuda")
        self.logger.info(
            "Use {} GPU(s) for training".format(torch.cuda.device_count())
        )

        # Initialize model.
        self.load_model()
        self.logger.info("MODEL ARCHITECTURE:\n{}".format(self.model))

        # Create evaluation result folders.
        self.initialize_result_directories()

        # Start evaluation.
        self.logger.info("Start evaluating CRF classifier.")
        try:
            self.crf_evaluate()
            self.logger.info("CRF classifier evaluation finished.")
        except KeyboardInterrupt:
            self.logger.warning("Evaluation interrupted. Program exit.")

    ########################
    # Multiprocessing : main thread
    ########################
    def crf_evaluate(self):
        """Evaluate all checkpoints for a trained CRF classifier."""
        ckpt_tracker = CheckpointTracker(os.path.join(self.ckpt_path, "*.ckpt"))
        self.time_tracker = TimeTracker()

        # Initialize validation dataset
        params = {
            "batch_size": self.batch_size,
            "shuffle": False,
            "num_workers": self.num_workers,
            "collate_fn": CRF_collate_samples,
        }
        file_path, _ = merge_predictions(
            self.prediction_dir,
            self.logger,
            self.tmp_dir,
            target_path=self.dataset,
        )
        evaluate_dset = CRFDataset(file_path, self.class_weight)
        evaluate_iter = DataLoader(evaluate_dset, **params)
        num_batches = len(evaluate_iter)
        self.logger.info(
            "{:,} samples used for evaluation.".format(evaluate_dset.__len__())
        )

        # data preprocess worker
        preprocess_queue = mp.JoinableQueue(maxsize=128)
        preprocess_worker = mp.Process(
            name="preprocess",
            target=self.preprocess,
            args=(preprocess_queue, evaluate_iter),
        )
        preprocess_worker.start()
        self.logger.info("CRF evaluation data workder started")

        # Evaluate all checkpoints.
        while len(ckpt_tracker.remaining) > 0:
            for ckpt in ckpt_tracker.remaining:
                self.evaluate_checkpoint(ckpt, preprocess_queue, num_batches)
                ckpt_tracker.add_evaluated(ckpt)
            ckpt_tracker.reset_params()

        # Terminate data worker.
        preprocess_worker.terminate()

    def evaluate_checkpoint(self, checkpoint, preprocess_queue, num_batches):
        """Evaluate one checkpoint of a trained CRF classifier."""
        # Load checkpoint
        step = self.load_checkpoint(checkpoint)
        self.logger.info("Evaluating CRF step {}".format(step))

        # Return if the checkpoint is already evaluated.
        eval_path = os.path.join(
            self.eval_path, "{}_{}.json".format(self.experiment_name, step)
        )
        if os.path.exists(eval_path):
            self.logger.info("Step {} already evaluated".format(step))
            return

        # Initialize evaluation worker.
        evaluate_queue = mp.JoinableQueue(maxsize=64)
        evaluate_worker = mp.Process(
            name="evaluate_{}".format(step),
            target=self.evaluate,
            args=(checkpoint, evaluate_queue, eval_path, step, num_batches),
        )
        evaluate_worker.start()

        # Evaluate checkpoint.
        self.model.eval()
        with torch.no_grad():
            for b in tqdm(range(num_batches)):
                dset = preprocess_queue.get()
                feature, target = CRF_push_to_device(dset, self.device)
                loss = -self.model(feature, target, reduction="mean")
                evaluate_queue.put(loss.item())
        evaluate_queue.join()

    ########################
    # Multiprocessing : workers
    ########################
    # Preprocess worker
    def preprocess(self, queue, dataloader):
        """Set up multiprocessing data queue"""
        while True:
            for dset in dataloader:
                queue.put(dset)

    # Evaluate worker
    def evaluate(self, ckpt, queue, eval_path, step, num_batches):
        """Evaluate checkpoint and save evaluation to disk."""
        self.loss_avg = AverageMeter()
        for batch in range(num_batches):
            loss = queue.get()
            queue.task_done()
            self.loss_avg.update(loss)
        self.display_result(step)

        # Save evaluation
        result = {
            "step": step,
            "loss_avg": self.loss_avg.avg,
        }
        with open(eval_path, "w") as outfile:
            json.dump(result, outfile, indent=4)

        # Update best checkpoint
        self.update_best_ckpt(result, ckpt)

    ############################
    # Display and save evaluations
    ############################
    def display_result(self, step):
        """Display average evaluation loss."""
        self.logger.info(
            "EVALUATE CRF | step {:8d} | avg loss {:8.4f} "
            "| time elapse: {:>12} |".format(
                step, self.loss_avg.avg, self.time_tracker.elapse()
            )
        )

    def update_best_ckpt(self, result, checkpoint):
        """Update best checkpoint metrics."""
        result["ckpt_path"] = checkpoint
        result["metric"] = self.__METRIC
        path = os.path.join(
            self.best_ckpt_path, "best_{}.json".format(self.__METRIC)
        )

        if os.path.exists(path):
            with open(path, "r") as infile:
                metrics = json.load(infile)
            if metrics[self.__METRIC] <= result[self.__METRIC]:
                return
        with open(path, "w") as outfile:
            json.dump(result, outfile, indent=4)

    def initialize_result_directories(self):
        """Initialize output evaluation and checkpoint directories."""
        if self.result_dir is not None:
            self.eval_path = self.result_dir
        else:
            self.eval_path = os.path.join(
                self.model_dir,
                "{}_{}".format(self.dtype.lower(), self.__MODE.lower()),
            )
        create_dirs(self.eval_path, logger=self.logger)
        self.best_ckpt_path = os.path.join(self.eval_path, "best_checkpoint")
        create_dirs(self.best_ckpt_path, logger=self.logger)

        if self.ckpt_dir is not None:
            self.ckpt_path = self.ckpt_dir
        else:
            self.ckpt_path = os.path.join(self.model_dir, "crf_checkpoints")

    ############################
    # Loading model and checkpoint
    ############################
    def load_model(self):
        """Load args from .config file and initialize CRF classifier."""
        # Load model params
        if self.model_config is not None:
            path = self.model_config
        else:
            path = os.path.join(
                self.model_dir, "{}_crf.config".format(self.experiment_name)
            )
        params = torch.load(path, map_location="cpu")

        # Initialize classifier
        self.model = CRF(params["output_size"], batch_first=True)
        self.model.to(self.device)

    def load_checkpoint(self, ckpt_path):
        """Load CRF checkpoint state_dict."""
        ckpt_params = torch.load(ckpt_path, map_location=self.device)
        self.model.load_state_dict(ckpt_params["state_dict"])
        return ckpt_params["step"]
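The workflow above is a producer/consumer layout: a preprocess process keeps filling a JoinableQueue with batches while the main loop consumes a known number of them per checkpoint. A stripped-down sketch of that pattern using only the standard library; the names and payloads are illustrative.

import multiprocessing as mp

def producer(queue, num_items):
    # keeps feeding work items, mirroring the preprocess() worker above
    for item in range(num_items):
        queue.put(item)

if __name__ == '__main__':
    queue = mp.JoinableQueue(maxsize=8)
    worker = mp.Process(name='preprocess', target=producer, args=(queue, 5))
    worker.start()

    for _ in range(5):            # consume a fixed number of batches
        batch = queue.get()
        queue.task_done()
    queue.join()                  # returns once every item has been marked done
    worker.join()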
Beispiel #27
0
        train_list.append(train)

    test = copy.copy(whole_corpus).set_filter(test_ids)
    test_list.append(test)

if args.mode != 'eval':
    training_data = ConcatDataset(train_list)

testing_data = ConcatDataset(test_list)

print('----------------------------------')
end_loading = time.time()
print("Loading done:", end_loading - start_loading)
time_record['Load'] = end_loading - start_loading

model = CRF(len(valid_types), batch_first=True).to(device)

####################
# Training
####################
if args.mode == 'train':

    classifier.load_state_dict(
        torch.load(join(pre_trained_sherlock_loc, pre_trained_sherlock_path),
                   map_location=device))

    # Set initial transition parameters
    if init_transition is not None:
        model.transitions = torch.nn.Parameter(
            torch.tensor(init_transition).float().to(device))
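Assigning to model.transitions works because torchcrf's CRF stores its transition scores as nn.Parameter tensors (transitions, start_transitions, end_transitions), so a precomputed matrix can be loaded before training. A small sketch with an illustrative tag count and initial values:

import torch
import torch.nn as nn
from torchcrf import CRF

num_types = 4
init_transition = torch.full((num_types, num_types), -1.0)
init_transition.fill_diagonal_(0.0)      # e.g. mildly discourage label changes

model = CRF(num_types, batch_first=True)
model.transitions = nn.Parameter(init_transition.float())
print(model.transitions.shape)           # torch.Size([4, 4])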
Beispiel #28
0
class BERT_CRF(nn.Module):
    """
    Based on the official template <https://pytorch.org/tutorials/beginner/nlp/advanced_tutorial.html>.
    The official version targets CPU; to run on GPU, every separately created tensor must be moved with .to(device).
    """

    def __init__(self, tag_to_ix, mask=False):
        super(BERT_CRF, self).__init__()
        self.hidden_dim = 768  # dimensionality of BERT's final layer = 768
        self.mask = mask
        self.tag_to_ix = tag_to_ix
        self.tagset_size = len(tag_to_ix)

        self.hidden2tag = nn.Linear(self.hidden_dim, self.tagset_size)
        self.crf = CRF(self.tagset_size, batch_first=True)

    def _get_sentence_features(self, sentences):
        """
        Features already extracted with BERT are passed through unchanged to keep the interface uniform, [time_step, 768]
        :param sentences:
        :return:
        """
        if self.mask:
            mask_idx = ~torch.eq(sentences, 0)  # invert with ~ (the `1 -` idiom breaks on bool tensors)
            mask_idx = (mask_idx.sum(dim=2) > 0)
            self.mask_idx = mask_idx

        return sentences

    def _get_sentence_feats(self, features):
        feats = self.hidden2tag(features)

        return feats

    def neg_log_likelihood(self, sentences, tags):
        """
        Loss = (score over all sequences) - (score of the gold sequence), i.e. the negative log-likelihood
        :param sentences:
        :param tags:
        :return:
        """
        features = self._get_sentence_features(sentences)
        feats = self._get_sentence_feats(features)
        if self.mask:
            loss = -self.crf(feats, tags, self.mask_idx, reduction='mean')
        else:
            loss = -self.crf(feats, tags, reduction='mean')

        return loss

    def _viterbi_decode(self, batch_feats):
        """
        Viterbi decoding to find the highest-scoring tag sequence, used for inference
        :param batch_feats:
        :return:
        """
        best_path = self.crf.decode(batch_feats)
        return best_path

    def forward(self, sentences):
        """
        Forward pass
        :param sentences:
        :return:
        """
        features = self._get_sentence_features(sentences)
        feats = self._get_sentence_feats(features)
        tags = self._viterbi_decode(feats)
        return tags
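A minimal usage sketch for the BERT_CRF class above. Since the class passes the input straight through, a random (batch, time_step, 768) tensor stands in for pre-extracted BERT features, and the tag set is illustrative.

import torch

tag_to_ix = {'O': 0, 'B': 1, 'I': 2}
model = BERT_CRF(tag_to_ix)

features = torch.randn(2, 7, 768)                  # placeholder for BERT output
tags = torch.randint(0, len(tag_to_ix), (2, 7))

loss = model.neg_log_likelihood(features, tags)    # training loss
best_paths = model(features)                       # decoded tag sequences (list of lists)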
Beispiel #29
0
class EnsembleCRFModel:
    def __init__(self,
                 model_path_list,
                 bert_dir_list,
                 num_tags,
                 device,
                 lamb=1 / 3):

        self.models = []
        self.crf_module = CRF(num_tags=num_tags, batch_first=True)
        self.lamb = lamb

        for idx, _path in enumerate(model_path_list):
            print(f'Load model from {_path}')

            print(f'Load model type: {bert_dir_list[0]}')
            model = CRFModel(bert_dir=bert_dir_list[0], num_tags=num_tags)

            model.load_state_dict(
                torch.load(_path, map_location=torch.device('cpu')))

            model.eval()
            model.to(device)

            self.models.append(model)
            if idx == 0:
                print(f'Load CRF weight from {_path}')
                self.crf_module.load_state_dict(model.crf_module.state_dict())
                self.crf_module.to(device)

    def weight(self, t):
        """
        Weighted fusion based on Newton's law of cooling: weight = exp(-lamb * t)
        """
        return math.exp(-self.lamb * t)

    def predict(self, model_inputs):
        weight_sum = 0.
        logits = None
        attention_masks = model_inputs['attention_masks']

        for idx, model in enumerate(self.models):
            # fuse logits with Newton's-cooling weights
            weight = self.weight(idx)

            # alternative: simple average fusion with equal weights
            # weight = 1 / len(self.models)

            tmp_logits = model(**model_inputs)[1] * weight
            weight_sum += weight

            if logits is None:
                logits = tmp_logits
            else:
                logits += tmp_logits

        logits = logits / weight_sum

        tokens_out = self.crf_module.decode(emissions=logits,
                                            mask=attention_masks.byte())

        return tokens_out

    def vote_entities(self, model_inputs, sent, id2ent, threshold):
        entities_ls = []
        for idx, model in enumerate(self.models):
            tmp_tokens = model(**model_inputs)[0][0]
            tmp_entities = crf_decode(tmp_tokens, sent, id2ent)
            entities_ls.append(tmp_entities)

        return vote(entities_ls, threshold)
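A tiny worked example of the Newton's-cooling weighting implemented by weight() above: with the default lamb = 1/3, the idx-th model receives weight exp(-lamb * idx), so earlier checkpoints dominate and the accumulated logits are divided by the weight sum.

import math

lamb = 1 / 3
weights = [math.exp(-lamb * idx) for idx in range(3)]   # about [1.000, 0.717, 0.513]
normalized = [w / sum(weights) for w in weights]
print([round(w, 3) for w in normalized])                # about [0.448, 0.321, 0.23]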
Beispiel #30
0
class BertTagger_with_LSTMCRF(nn.Module):
    def __init__(self, args, model):  # a pre-built model is passed in
        super(BertTagger_with_LSTMCRF, self).__init__()
        self.embedding = model.embedding
        self.encoder = model.encoder
        self.target = model.target
        self.args = args
        self.need_birnn = args.need_birnn
        self.labels_num = args.labels_num
        out_dim = args.hidden_size

        # if need_birnn is False, skip the BiLSTM layer
        if self.need_birnn:
            self.birnn = nn.LSTM(args.hidden_size, args.rnn_dim, num_layers=1, bidirectional=True, batch_first=True)
            out_dim = args.rnn_dim * 2

        self.output_layer = nn.Linear(out_dim, self.labels_num)
        self.dropout = nn.Dropout(args.dropout)

        self.crf = CRF(args.labels_num, batch_first=True)



    def forward(self, src, label, mask, pos=None, vm=None):
        """
        Args:
            src: [batch_size x seq_length]
            label: [batch_size x seq_length]
            mask: [batch_size x seq_length]
        Returns:
            loss: Sequence labeling loss.
            correct: Number of labels that are predicted correctly.
            predict: Predicted label.
            label: Gold label.
        example:
            src size: torch.Size([8, 128])
            output size: torch.Size([8, 128, 768])
            output size: torch.Size([8, 128, 256])
            output size: torch.Size([8, 128, 256])
            output size: torch.Size([8, 128, 15])
            output size: torch.Size([8, 128])
            output size: torch.Size([1024, 1])
            label size: torch.Size([1024, 1])
            label size: torch.Size([1024])

        """
        # Embedding.
        emb = self.embedding(src, mask, pos)
        # Encoder.
        output = self.encoder(emb, mask, vm)
        if self.need_birnn:
            output, _ = self.birnn(output)

        # Target.
        output = self.dropout(output)

        output = self.output_layer(output)

        loss = -1 * self.crf(output, label, mask=mask.byte())
        output = torch.LongTensor(np.array(self.crf.decode(output))).to(self.args.device)

        output = output.contiguous().view(-1, 1)

        label = label.contiguous().view(-1, 1)

        label_mask = (label > 0).float().to(torch.device(label.device))



        label_mask = label_mask.contiguous().view(-1)
        label = label.contiguous().view(-1)
        predict = output.contiguous().view(-1)
        correct = torch.sum(
            label_mask * (predict.eq(label)).float()
        )  # number of correctly predicted labels on non-padding positions

        return loss, correct, predict, label
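The tail of forward() above computes a masked numerator for token accuracy: positions whose gold label is 0 (padding) are excluded through label_mask. A self-contained sketch of that computation with made-up predictions:

import torch

label = torch.tensor([2, 3, 0, 0, 1])         # 0 marks padding
predict = torch.tensor([2, 1, 0, 0, 1])

label_mask = (label > 0).float()
correct = torch.sum(label_mask * predict.eq(label).float())
accuracy = correct.item() / label_mask.sum().item()
print(correct.item(), round(accuracy, 3))     # 2.0 0.667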