コード例 #1
0
class RemoveCapsTest(unittest.TestCase):
    """Exercise the capital-removal operations on a raw, non-tokenized string.

    Each test passes the same input text to ``op.run`` and compares the
    returned string with the expected lowercased text.
    """

    # Shared input for both tests; "Bill Clinton" is the proper noun whose
    # casing distinguishes the two operations.
    INPUT_TEXT = (
        "Removes all non-proper-noun capitals from a given text. "
        "Removes capital letters from text, even for Bill Clinton. "
        "Accepts as input a non-tokenized string."
    )

    def setUp(self):
        """Create the default (greedy) operation before every test."""
        self.op = RemoveCapsGreedy()

    def test_run_greedy(self):
        """The greedy operation lowercases every capital, proper nouns too."""
        # Uses the instance built in setUp; no need to construct it again.
        expected = (
            "removes all non-proper-noun capitals from a given text. "
            "removes capital letters from text, even for bill clinton. "
            "accepts as input a non-tokenized string."
        )
        self.assertEqual(self.op.run(self.INPUT_TEXT), expected)

    def test_run_preserve_nnp(self):
        """The NNP-preserving operation keeps "Bill Clinton" capitalized."""
        # Replace the default operation from setUp with the variant under test.
        self.op = RemoveCapsPreserveNNP()
        expected = (
            "removes all non-proper-noun capitals from a given text. "
            "removes capital letters from text, even for Bill Clinton. "
            "accepts as input a non-tokenized string."
        )
        self.assertEqual(self.op.run(self.INPUT_TEXT), expected)
コード例 #2
0
class RemoveCapsTest(unittest.TestCase):
    """Exercise the capital-removal operations on a list of ``Corpus`` objects.

    Each test runs the operation on a single corpus with id ``"0"`` and checks
    the ``contents`` of every returned corpus against the expected text.
    """

    # Shared input for both tests; "Bill Clinton" is the proper noun whose
    # casing distinguishes the two operations.
    INPUT_TEXT = (
        "Removes all non-proper-noun capitals from a given text. "
        "Removes capital letters from text, even for Bill Clinton. "
        "Accepts as input a non-tokenized string."
    )

    def setUp(self):
        """Create the default (greedy) operation before every test."""
        self.op = RemoveCapsGreedy()

    def _assert_run_yields(self, desired_results):
        """Run ``self.op`` on the shared corpus and compare id -> contents.

        Args:
            desired_results: mapping of corpus id to the expected contents.
        """
        # NOTE(review): the second Corpus argument is passed as an empty
        # string exactly as before; its meaning is not visible from here.
        test_data = [Corpus("0", "", self.INPUT_TEXT)]
        results = self.op.run(test_data)
        self.assertIsNotNone(results)
        # Compare whole mappings rather than looping over the results: an
        # empty result, a missing corpus, or an unexpected id now fails the
        # assertion instead of passing silently or raising KeyError.
        actual_results = {corpus.id: corpus.contents for corpus in results}
        self.assertEqual(actual_results, desired_results)

    def test_run_greedy(self):
        """The greedy operation lowercases every capital, proper nouns too."""
        # Uses the instance built in setUp; no need to construct it again.
        self._assert_run_yields({
            "0": (
                "removes all non-proper-noun capitals from a given text. "
                "removes capital letters from text, even for bill clinton. "
                "accepts as input a non-tokenized string."
            ),
        })

    def test_run_preserve_nnp(self):
        """The NNP-preserving operation keeps "Bill Clinton" capitalized."""
        # Replace the default operation from setUp with the variant under test.
        self.op = RemoveCapsPreserveNNP()
        self._assert_run_yields({
            "0": (
                "removes all non-proper-noun capitals from a given text. "
                "removes capital letters from text, even for Bill Clinton. "
                "accepts as input a non-tokenized string."
            ),
        })