Python parse_tokens 예제들

프로그래밍 언어: Python

네임스페이스/패키지 이름: src.grammar_tester.psparse

메소드/함수: parse_tokens

hotexamples.com에 등록된 예제 수: 8

Python parse_tokens - 8개의 예제가 발견되었습니다. 다음은 오픈소스 프로젝트에서 추출한, Python src.grammar_tester.psparse.parse_tokens의 평점이 가장 높은 실제 사용 예제들입니다. 예제를 평가해 주시면 예제 품질을 높이는 데 도움이 됩니다.

예제 #1

파일 보기

파일: test_psparse.py 프로젝트: alexcasar/snet

    def test_parse_tokens(self):
        """Exercise parse_tokens with a STRIP-only mask, then with RWALL and CAPS set and STRIP cleared."""
        # Kept as a tuple; every comparison receives its own fresh list.
        no_walls_expected = ('###LEFT-WALL###', 'eagle', 'has', 'wing', '.')

        # Pass 1: STRIP only (no RIGHT-WALL, no CAPS).
        flags = BIT_STRIP
        # The matching check on self.tokens_all_walls is currently disabled; it expected
        # ['###LEFT-WALL###', 'dad', 'was', 'not', 'a', 'parent', 'before', '.'].

        # Input without walls.
        stripped = parse_tokens(self.tokens_no_walls, flags)[0]
        self.assertTrue(self.cmp_lists(stripped, list(no_walls_expected)))

        # Pass 2: add RIGHT-WALL and CAPS, then clear STRIP.
        flags = (flags | (BIT_RWALL | BIT_CAPS)) & ~BIT_STRIP
        annotated = parse_tokens(self.tokens_all_walls, flags)[0]
        walls_expected = [
            '###LEFT-WALL###', 'Dad[!]', 'was.v-d', 'not.e', 'a',
            'parent.n', 'before', '.', '###RIGHT-WALL###',
        ]
        self.assertTrue(self.cmp_lists(annotated, walls_expected))

        # Input without walls again, now under the second mask.
        plain = parse_tokens(self.tokens_no_walls, flags)[0]
        self.assertTrue(self.cmp_lists(plain, list(no_walls_expected)))

예제 #2

파일 보기

파일: test_psparse.py 프로젝트: alexcasar/snet

    def test_parse_gutenchildren_bug_002(self):
        """Regression check on the token list for a sentence from the Gutenberg Children corpus."""
        flags = BIT_NO_LWALL | BIT_NO_PERIOD | BIT_STRIP
        parsed = parse_tokens(gutenberg_children_bug_002t, flags)

        # Only the first element of the returned value is compared against the reference.
        self.assertEqual(parsed[0], gutenberg_children_bug_002tr)

예제 #3

파일 보기

    def test_parse_no_period_if_no_period(self):
        """Parse self.tokens_no_walls_no_period with STRIP, NO_PERIOD and RWALL set."""
        flags = BIT_STRIP | BIT_NO_PERIOD | BIT_RWALL
        parsed = parse_tokens(self.tokens_no_walls_no_period, flags)[0]

        expected = ['###LEFT-WALL###', 'eagle', 'has', 'wing']
        self.assertTrue(self.cmp_lists(parsed, expected))

예제 #4

파일 보기

    def test_parse_tokens_no_period(self):
        """Parse self.tokens_no_walls with STRIP, NO_PERIOD and RWALL set.

        The expected token list holds the left wall followed by the three words,
        with no trailing period and no right wall.
        """
        options = BIT_STRIP | BIT_NO_PERIOD | BIT_RWALL
        tokens = parse_tokens(self.tokens_no_walls, options)[0]

        # Report the actual tokens only on failure instead of printing them on every run.
        self.assertTrue(
            self.cmp_lists(tokens, ['###LEFT-WALL###', 'eagle', 'has', 'wing']),
            msg="unexpected tokens: {!r}".format(tokens))

예제 #5

파일 보기

    def test_parse_tokens_no_walls_no_period(self):
        """Parse self.tokens_all_walls with STRIP, NO_PERIOD and NO_LWALL set; expect bare words only."""
        flags = BIT_STRIP | BIT_NO_PERIOD | BIT_NO_LWALL
        parsed = parse_tokens(self.tokens_all_walls, flags)[0]

        expected = ['dad', 'was', 'not', 'a', 'parent', 'before']
        self.assertTrue(self.cmp_lists(parsed, expected))

예제 #6

파일 보기

    def test_parse_tokens_no_left_wall(self):
        """Parse self.tokens_all_walls with CAPS and NO_LWALL set (STRIP and RWALL not set)."""
        flags = BIT_CAPS | BIT_NO_LWALL
        parsed = parse_tokens(self.tokens_all_walls, flags)[0]

        # Expected list starts at the first word and keeps the token annotations and the period.
        expected = [
            'Dad[!]', 'was.v-d', 'not.e', 'a',
            'parent.n', 'before', '.',
        ]
        self.assertTrue(self.cmp_lists(parsed, expected))

예제 #7

파일 보기

    def test_parse_tokens_alice_004(self):
        """Square-bracket handling case taken from the Alice in Wonderland corpus."""
        flags = BIT_STRIP | BIT_NO_LWALL | BIT_NO_PERIOD

        # Parser output line: one parenthesised group per token.
        postscript = (
            "(LEFT-WALL)(posting.g)(date.n)(:.j)(@date@[?].a)([)(ebook[?].a)([#])(@number@[?].n)(])(release.n)"
            "(date.n)(:.j)([@date@])(last.ord)(updated.v-d)(:.v)(@date@[?].n)"
        )

        expected = [
            "###LEFT-WALL###", "posting", "date", ":", "@date@", "[", "ebook", "[#]", "@number@", "]", "release",
            "date", ":", "[@date@]", "last", "updated", ":", "@date@",
        ]

        parsed = parse_tokens(postscript, flags)[0]
        self.assertEqual(expected, parsed)

예제 #8

파일 보기

파일: test_psparse.py 프로젝트: alexcasar/snet

    def test_parse_tokens_alice_003(self):
        """Handling of the '[(]' token, a case taken from the Alice in Wonderland corpus."""
        flags = BIT_STRIP | BIT_NO_LWALL | BIT_NO_PERIOD

        # Source sentence:
        # "(alice had no idea what latitude was, or longitude either, but thought they were nice grand words to say.)"
        postscript = (
            "(LEFT-WALL)([(])(alice[?].n)(had.v-d)(no.misc-d)(idea.n)(what)(latitude.n-u)(was.v-d)(,)(or.ij)"
            "(longitude.n-u)(either.r)(,)([but])(thought.q-d)(they)(were.v-d)(nice.a)(grand.a)(words.n)(to.r)(say.v)"
            "(.)([)])"
        )
        expected = [
            "###LEFT-WALL###", "[(]", "alice", "had", "no", "idea", "what", "latitude", "was", ",", "or", "longitude",
            "either", ",", "[but]", "thought", "they", "were", "nice", "grand", "words", "to", "say", ".", "[)]",
        ]

        parsed = parse_tokens(postscript, flags)[0]
        self.assertEqual(expected, parsed)