def test_sequence_classification_encode_no_text_passed():
    """Check ``encode()`` when it is called without a text argument.

    The explainer is built with the sample sentence and ``encode()`` is then
    invoked with no parameters (presumably it falls back to the text given at
    construction time -- confirm against the explainer implementation).
    """
    # NOTE(review): the text is passed as the first constructor argument here,
    # whereas test_sequence_classification_encode builds the explainer from
    # only a model and a tokenizer -- confirm which signature is current.
    sample_text = "I love you, I hate you"
    explainer = SequenceClassificationExplainer(sample_text, MODEL, TOKENIZER)
    minimum_length = len(sample_text.split(" "))

    encoded = explainer.encode()

    assert isinstance(encoded, list)
    # The ids must not begin with the CLS id nor end with the SEP id.
    assert encoded[0] != explainer.cls_token_id
    assert encoded[-1] != explainer.sep_token_id
    # Expect at least one id per space-separated word of the input.
    assert len(encoded) >= minimum_length
def test_sequence_classification_encode():
    """Check ``encode(text)`` on an explainer built from a model and tokenizer.

    Asserts that the result is a list, that its first and last elements differ
    from the explainer's ``cls_token_id`` and ``sep_token_id`` respectively,
    and that it holds at least as many entries as the input has
    space-separated words.
    """
    explainer = SequenceClassificationExplainer(
        DISTILBERT_MODEL,
        DISTILBERT_TOKENIZER,
    )
    sample_text = "this is a sample of text to be encoded"
    minimum_length = len(sample_text.split(" "))

    encoded = explainer.encode(sample_text)

    assert isinstance(encoded, list)
    # The ids must not begin with the CLS id nor end with the SEP id.
    assert encoded[0] != explainer.cls_token_id
    assert encoded[-1] != explainer.sep_token_id
    # Expect at least one id per space-separated word of the input.
    assert len(encoded) >= minimum_length