Пример #1
0
    def test_transformation(self):
        """Check ``Punctuation.transform`` on a plain sentence and edge cases.

        Three things are verified:

        * every generated sample keeps the alphabetic characters of the
          source text unchanged while the full text differs from the source;
        * with ``random.seed(100)`` a single transformation yields one exact
          expected string;
        * an empty text and a symbol-only text each yield exactly one sample.
        """
        # Imported locally so the method does not depend on a module-level
        # import that is not visible from here.
        import random

        sent1 = "The quick brown fox jumps over the lazy dog."
        data_sample = SASample({'x': sent1, 'y': "negative"})
        swap_ins = Punctuation()
        x = swap_ins.transform(data_sample, n=10)

        # test the form
        original_text = data_sample.get_text('x')
        original_letters = ''.join(filter(str.isalpha, original_text))
        for _sample in x:
            new_text = _sample.get_text('x')
            # Letters must survive untouched ...
            self.assertEqual(
                ''.join(filter(str.isalpha, new_text)), original_letters)
            # ... but the text as a whole has to change.
            self.assertNotEqual(new_text, original_text)

        # At most the requested number of samples may be returned.
        self.assertLessEqual(len(x), 10)

        # Seed right before the call so the expected string is reproducible.
        random.seed(100)
        x = swap_ins.transform(data_sample, n=1)
        x = x[0]
        # test the data
        self.assertEqual('{ The quick brown fox jumps over the lazy dog; }',
                         x.get_text('x'))

        special_sample = SASample({'x': '', 'y': "negative"})
        self.assertEqual(1, len(swap_ins.transform(special_sample)))
        special_sample = SASample({'x': '~!@#$%^7890"\'', 'y': "negative"})
        self.assertEqual(1, len(swap_ins.transform(special_sample)))
Пример #2
0
    def test_transformation(self):
        """Check ``MLM.transform`` on a plain sentence and edge cases.

        For five generated samples the words at indices 0-1, index 3 and the
        last five words must equal those of the source sample, and the
        concatenation of the words at indices 2 and 4 must be distinct for
        every sample. An empty text must give an empty result list, and a
        symbol-only text must give one exact expected string.
        """
        # Imported locally so the method does not depend on a module-level
        # import that is not visible from here.
        import random

        sent2 = 'The quick brown fox jumps over the lazy dog. '
        data_sample = SASample({'x': sent2, 'y': "negative"})
        # Seed before the transformer is built, as in the original order.
        random.seed(100)
        swap_ins = MLM(device='cpu')

        x = swap_ins.transform(data_sample, n=5)
        self.assertEqual(5, len(x))

        original_words = data_sample.get_words('x')
        tokens = []
        for _sample in x:
            words = _sample.get_words('x')
            self.assertEqual(original_words[:2], words[:2])
            self.assertEqual(original_words[3], words[3])
            self.assertEqual(original_words[-5:], words[-5:])
            # Collect the words at the two positions not pinned above.
            tokens.append(words[2] + words[4])

        # Every sample must differ from the others at those positions.
        self.assertEqual(5, len(set(tokens)))

        special_sample = SASample({'x': '', 'y': "negative"})
        self.assertEqual([], swap_ins.transform(special_sample))
        special_sample = SASample({'x': '~!@#$%^7890"\'', 'y': "negative"})
        special_sample = swap_ins.transform(special_sample)[0]
        self.assertEqual('epilogue "\'', special_sample.get_text('x'))
Пример #3
0
    def test_transformation(self):
        """Check that the transformation wraps the source sentence in new text.

        Five samples are requested; each must still contain ``sent1``, and
        both the text before it and the text after it must be different in
        every sample. With ``random.seed(100)`` a symbol-only input must
        produce one exact expected string.

        NOTE(review): ``swap_ins``, ``data_sample``, ``sent1`` and ``random``
        are not defined in this method; they are expected to exist in an
        enclosing scope that is not visible here.
        """
        # test the change num
        change_sample = swap_ins.transform(data_sample, n=5)
        self.assertEqual(5, len(change_sample))

        # test if the item change
        begin = []
        end = []
        for sample in change_sample:
            text = sample.get_text('x')
            self.assertIn(sent1, text)
            # Split around the first occurrence of the source sentence.
            prefix, _, suffix = text.partition(sent1)
            begin.append(prefix)
            end.append(suffix)

        # test if the n change samples not equal
        self.assertEqual(len(set(begin)), 5)
        self.assertEqual(len(set(end)), 5)

        # Seed right before the call so the expected string is reproducible.
        random.seed(100)
        special_sample = SASample({'x': '~!@#$%^7890"\'', 'y': "negative"})
        special_sample = swap_ins.transform(special_sample)[0]
        self.assertEqual('I actually wanted to talk to you, ~!@#$%^7890 "\'',
                         special_sample.get_text('x'))