Ejemplo n.º 1
0
    def test_parse_tokens(self):
        """Exercise parse_tokens() with STRIP only, then with RWALL | CAPS.

        Each check compares element [0] of the parse_tokens() result with
        an expected token list via self.cmp_lists().
        """
        plain_expected = ('###LEFT-WALL###', 'eagle', 'has', 'wing', '.')

        # Phase 1 -- STRIP only (no RIGHT-WALL, no CAPS).
        # NOTE(review): a matching check against self.tokens_all_walls was
        # disabled in this test; confirm whether it should be restored.
        options = BIT_STRIP

        # Fixture without walls.
        parsed = parse_tokens(self.tokens_no_walls, options)
        tokens = parsed[0]
        matches = self.cmp_lists(tokens, list(plain_expected))
        self.assertTrue(matches)

        # Phase 2 -- RIGHT-WALL and CAPS, with STRIP cleared again.
        options = (options | BIT_RWALL | BIT_CAPS) & ~BIT_STRIP

        walled_expected = [
            '###LEFT-WALL###', 'Dad[!]', 'was.v-d', 'not.e', 'a',
            'parent.n', 'before', '.', '###RIGHT-WALL###',
        ]
        parsed = parse_tokens(self.tokens_all_walls, options)
        tokens = parsed[0]
        matches = self.cmp_lists(tokens, walled_expected)
        self.assertTrue(matches)

        # Fixture without walls: the expected list is the same as in phase 1.
        parsed = parse_tokens(self.tokens_no_walls, options)
        tokens = parsed[0]
        matches = self.cmp_lists(tokens, list(plain_expected))
        self.assertTrue(matches)
Ejemplo n.º 2
0
    def test_parse_no_period_if_no_period(self):
        """Parse the period-less fixture with STRIP | NO_PERIOD | RWALL.

        Element [0] of the parse_tokens() result must match the expected
        list, which ends at 'wing' (no period and no right-wall entry).
        """
        options = BIT_STRIP | BIT_NO_PERIOD | BIT_RWALL
        expected = ['###LEFT-WALL###', 'eagle', 'has', 'wing']

        parsed = parse_tokens(self.tokens_no_walls_no_period, options)
        tokens = parsed[0]

        matches = self.cmp_lists(tokens, expected)
        self.assertTrue(matches)
Ejemplo n.º 3
0
    def test_parse_tokens_no_walls_no_period(self):
        """Parse the all-walls fixture with STRIP | NO_PERIOD | NO_LWALL.

        Element [0] of the parse_tokens() result must match a list holding
        only the six words, with no wall markers and no trailing period.
        """
        options = BIT_STRIP | BIT_NO_PERIOD | BIT_NO_LWALL
        expected = ['dad', 'was', 'not', 'a', 'parent', 'before']

        parsed = parse_tokens(self.tokens_all_walls, options)
        tokens = parsed[0]

        matches = self.cmp_lists(tokens, expected)
        self.assertTrue(matches)
Ejemplo n.º 4
0
    def test_parse_tokens_no_left_wall(self):
        """Parse the all-walls fixture with CAPS | NO_LWALL (no STRIP).

        Element [0] of the parse_tokens() result must match the expected
        list, which keeps the token suffixes and the final period but has
        no wall markers.
        """
        # NO_LWALL and CAPS, no STRIP
        options = BIT_CAPS | BIT_NO_LWALL
        expected = [
            'Dad[!]', 'was.v-d', 'not.e', 'a', 'parent.n', 'before', '.',
        ]

        parsed = parse_tokens(self.tokens_all_walls, options)
        tokens = parsed[0]

        matches = self.cmp_lists(tokens, expected)
        self.assertTrue(matches)
Ejemplo n.º 5
0
    def test_parse_gutenchildren_bug_002(self):
        """Regression check on the gutenberg_children_bug_002t fixture.

        Parses it with NO_LWALL | NO_PERIOD | STRIP and requires element [0]
        of the result to equal gutenberg_children_bug_002tr.
        """
        flags = BIT_NO_LWALL | BIT_NO_PERIOD | BIT_STRIP
        parsed = parse_tokens(gutenberg_children_bug_002t, flags)
        self.assertEqual(parsed[0], gutenberg_children_bug_002tr)